Repository: browserbase/stagehand
Branch: main
Commit: 2e99c9d9814e
Files: 799
Total size: 4.9 MB

Directory structure:
gitextract_8uatdfoc/

├── .changeset/
│   ├── config.json
│   └── crazy-nights-prove.md
├── .cursorrules
├── .github/
│   ├── ISSUE_TEMPLATE/
│   │   ├── bug_report.md
│   │   └── feature_request.md
│   ├── actions/
│   │   ├── select-browserbase-region/
│   │   │   └── action.yml
│   │   ├── setup-node-pnpm-turbo/
│   │   │   └── action.yml
│   │   ├── upload-ctrf-report/
│   │   │   └── action.yml
│   │   ├── upload-v8-coverage/
│   │   │   └── action.yml
│   │   └── verify-chromium-launch/
│   │       └── action.yml
│   ├── pull_request_template
│   └── workflows/
│       ├── ci.yml
│       ├── claude.yml
│       ├── external-contributor-pr-approval-handoff.yml
│       ├── external-contributor-pr.yml
│       ├── feature-parity.yml
│       ├── release.yml
│       ├── stagehand-server-v3-release.yml
│       ├── stagehand-server-v3-sea-build.yml
│       ├── stagehand-server-v4-release.yml
│       ├── stagehand-server-v4-sea-build.yml
│       └── stainless.yml
├── .gitignore
├── .prettierignore
├── .prettierrc
├── .vscode/
│   └── settings.json
├── CHANGELOG.md
├── LICENSE
├── README.md
├── claude.md
├── eslint.config.mjs
├── package.json
├── packages/
│   ├── README.md
│   ├── cli/
│   │   ├── CHANGELOG.md
│   │   ├── README.md
│   │   ├── package.json
│   │   ├── src/
│   │   │   └── index.ts
│   │   ├── tests/
│   │   │   ├── cli.test.ts
│   │   │   └── mode.test.ts
│   │   ├── tsconfig.json
│   │   ├── tsup.config.ts
│   │   └── vitest.config.ts
│   ├── core/
│   │   ├── CHANGELOG.md
│   │   ├── README.md
│   │   ├── examples/
│   │   │   ├── 2048.ts
│   │   │   ├── CHANGELOG.md
│   │   │   ├── actionable_observe_example.ts
│   │   │   ├── agent-custom-tools.ts
│   │   │   ├── agent_stream_example.ts
│   │   │   ├── cua-example.ts
│   │   │   ├── custom_client_aisdk.ts
│   │   │   ├── custom_client_langchain.ts
│   │   │   ├── custom_client_openai.ts
│   │   │   ├── example.ts
│   │   │   ├── external_clients/
│   │   │   │   ├── aisdk.ts
│   │   │   │   ├── customOpenAI.ts
│   │   │   │   └── langchain.ts
│   │   │   ├── form_filling_sensible.ts
│   │   │   ├── google_enter.ts
│   │   │   ├── instructions.ts
│   │   │   ├── integrations/
│   │   │   │   ├── exa.ts
│   │   │   │   └── supabase.ts
│   │   │   ├── mcp.ts
│   │   │   ├── operator-example.ts
│   │   │   ├── oss-cua-example.ts
│   │   │   ├── parameterizeApiKey.ts
│   │   │   ├── persist_logs_example.ts
│   │   │   ├── tsconfig.json
│   │   │   ├── v3/
│   │   │   │   ├── cuaReplay.ts
│   │   │   │   ├── deepLocator.ts
│   │   │   │   ├── dropdown.ts
│   │   │   │   ├── highlight.ts
│   │   │   │   ├── patchright.ts
│   │   │   │   ├── playwright.ts
│   │   │   │   ├── puppeteer.ts
│   │   │   │   ├── recordVideo.ts
│   │   │   │   ├── returnXpath.ts
│   │   │   │   ├── shadowRoot.ts
│   │   │   │   ├── targetedExtract.ts
│   │   │   │   └── v3_agent.ts
│   │   │   ├── v3_example.ts
│   │   │   └── wordle.ts
│   │   ├── lib/
│   │   │   ├── CHANGELOG.md
│   │   │   ├── inference.ts
│   │   │   ├── inferenceLogUtils.ts
│   │   │   ├── logger.ts
│   │   │   ├── modelUtils.ts
│   │   │   ├── prompt.ts
│   │   │   ├── utils.ts
│   │   │   ├── v3/
│   │   │   │   ├── agent/
│   │   │   │   │   ├── AgentClient.ts
│   │   │   │   │   ├── AgentProvider.ts
│   │   │   │   │   ├── AnthropicCUAClient.ts
│   │   │   │   │   ├── GoogleCUAClient.ts
│   │   │   │   │   ├── MicrosoftCUAClient.ts
│   │   │   │   │   ├── OpenAICUAClient.ts
│   │   │   │   │   ├── prompts/
│   │   │   │   │   │   └── agentSystemPrompt.ts
│   │   │   │   │   ├── tools/
│   │   │   │   │   │   ├── README.md
│   │   │   │   │   │   ├── act.ts
│   │   │   │   │   │   ├── ariaTree.ts
│   │   │   │   │   │   ├── braveSearch.ts
│   │   │   │   │   │   ├── browserbaseSearch.ts
│   │   │   │   │   │   ├── click.ts
│   │   │   │   │   │   ├── clickAndHold.ts
│   │   │   │   │   │   ├── dragAndDrop.ts
│   │   │   │   │   │   ├── extract.ts
│   │   │   │   │   │   ├── fillFormVision.ts
│   │   │   │   │   │   ├── fillform.ts
│   │   │   │   │   │   ├── goto.ts
│   │   │   │   │   │   ├── index.ts
│   │   │   │   │   │   ├── keys.ts
│   │   │   │   │   │   ├── navback.ts
│   │   │   │   │   │   ├── screenshot.ts
│   │   │   │   │   │   ├── scroll.ts
│   │   │   │   │   │   ├── think.ts
│   │   │   │   │   │   ├── type.ts
│   │   │   │   │   │   └── wait.ts
│   │   │   │   │   └── utils/
│   │   │   │   │       ├── actionMapping.ts
│   │   │   │   │       ├── captchaSolver.ts
│   │   │   │   │       ├── coordinateNormalization.ts
│   │   │   │   │       ├── cuaKeyMapping.ts
│   │   │   │   │       ├── googleCustomToolHandler.ts
│   │   │   │   │       ├── handleDoneToolCall.ts
│   │   │   │   │       ├── imageCompression.ts
│   │   │   │   │       ├── messageProcessing.ts
│   │   │   │   │       ├── screenshotHandler.ts
│   │   │   │   │       ├── validateExperimentalFeatures.ts
│   │   │   │   │       ├── variables.ts
│   │   │   │   │       └── xpath.ts
│   │   │   │   ├── api.ts
│   │   │   │   ├── cache/
│   │   │   │   │   ├── ActCache.ts
│   │   │   │   │   ├── AgentCache.ts
│   │   │   │   │   ├── CacheStorage.ts
│   │   │   │   │   ├── serverAgentCache.ts
│   │   │   │   │   └── utils.ts
│   │   │   │   ├── cli.js
│   │   │   │   ├── dom/
│   │   │   │   │   ├── a11yScripts/
│   │   │   │   │   │   └── index.ts
│   │   │   │   │   ├── genA11yScripts.ts
│   │   │   │   │   ├── genDomScripts.ts
│   │   │   │   │   ├── genLocatorScripts.ts
│   │   │   │   │   ├── genScreenshotScripts.ts
│   │   │   │   │   ├── global.d.ts
│   │   │   │   │   ├── index.ts
│   │   │   │   │   ├── locatorScripts/
│   │   │   │   │   │   ├── counts.ts
│   │   │   │   │   │   ├── index.ts
│   │   │   │   │   │   ├── scripts.ts
│   │   │   │   │   │   ├── selectors.ts
│   │   │   │   │   │   ├── waitForSelector.ts
│   │   │   │   │   │   ├── xpathParser.ts
│   │   │   │   │   │   └── xpathResolver.ts
│   │   │   │   │   ├── piercer.entry.ts
│   │   │   │   │   ├── piercer.runtime.ts
│   │   │   │   │   ├── rerenderMissingShadows.entry.ts
│   │   │   │   │   ├── rerenderMissingShadows.runtime.ts
│   │   │   │   │   └── screenshotScripts/
│   │   │   │   │       ├── index.ts
│   │   │   │   │       └── resolveMaskRect.ts
│   │   │   │   ├── external_clients/
│   │   │   │   │   ├── aisdk.ts
│   │   │   │   │   └── customOpenAI.ts
│   │   │   │   ├── flowlogger/
│   │   │   │   │   ├── EventEmitter.ts
│   │   │   │   │   ├── EventSink.ts
│   │   │   │   │   ├── EventStore.ts
│   │   │   │   │   ├── FlowLogger.ts
│   │   │   │   │   └── prettify.ts
│   │   │   │   ├── handlers/
│   │   │   │   │   ├── actHandler.ts
│   │   │   │   │   ├── extractHandler.ts
│   │   │   │   │   ├── handlerUtils/
│   │   │   │   │   │   ├── actHandlerUtils.ts
│   │   │   │   │   │   └── timeoutGuard.ts
│   │   │   │   │   ├── observeHandler.ts
│   │   │   │   │   ├── v3AgentHandler.ts
│   │   │   │   │   └── v3CuaAgentHandler.ts
│   │   │   │   ├── index.ts
│   │   │   │   ├── launch/
│   │   │   │   │   ├── browserbase.ts
│   │   │   │   │   └── local.ts
│   │   │   │   ├── llm/
│   │   │   │   │   ├── AnthropicClient.ts
│   │   │   │   │   ├── CerebrasClient.ts
│   │   │   │   │   ├── GoogleClient.ts
│   │   │   │   │   ├── GroqClient.ts
│   │   │   │   │   ├── LLMClient.ts
│   │   │   │   │   ├── LLMProvider.ts
│   │   │   │   │   ├── OpenAIClient.ts
│   │   │   │   │   └── aisdk.ts
│   │   │   │   ├── logger.ts
│   │   │   │   ├── mcp/
│   │   │   │   │   ├── connection.ts
│   │   │   │   │   └── utils.ts
│   │   │   │   ├── runtimePaths.ts
│   │   │   │   ├── shutdown/
│   │   │   │   │   ├── cleanupLocal.ts
│   │   │   │   │   ├── supervisor.ts
│   │   │   │   │   └── supervisorClient.ts
│   │   │   │   ├── timeoutConfig.ts
│   │   │   │   ├── types/
│   │   │   │   │   ├── private/
│   │   │   │   │   │   ├── agent.ts
│   │   │   │   │   │   ├── api.ts
│   │   │   │   │   │   ├── cache.ts
│   │   │   │   │   │   ├── evaluator.ts
│   │   │   │   │   │   ├── handlers.ts
│   │   │   │   │   │   ├── index.ts
│   │   │   │   │   │   ├── internal.ts
│   │   │   │   │   │   ├── locator.ts
│   │   │   │   │   │   ├── network.ts
│   │   │   │   │   │   ├── shutdown.ts
│   │   │   │   │   │   ├── shutdownErrors.ts
│   │   │   │   │   │   └── snapshot.ts
│   │   │   │   │   └── public/
│   │   │   │   │       ├── agent.ts
│   │   │   │   │       ├── api.ts
│   │   │   │   │       ├── apiErrors.ts
│   │   │   │   │       ├── context.ts
│   │   │   │   │       ├── index.ts
│   │   │   │   │       ├── locator.ts
│   │   │   │   │       ├── logs.ts
│   │   │   │   │       ├── methods.ts
│   │   │   │   │       ├── metrics.ts
│   │   │   │   │       ├── model.ts
│   │   │   │   │       ├── options.ts
│   │   │   │   │       ├── page.ts
│   │   │   │   │       ├── screenshotTypes.ts
│   │   │   │   │       └── sdkErrors.ts
│   │   │   │   ├── understudy/
│   │   │   │   │   ├── a11y/
│   │   │   │   │   │   └── snapshot/
│   │   │   │   │   │       ├── a11yTree.ts
│   │   │   │   │   │       ├── activeElement.ts
│   │   │   │   │   │       ├── capture.ts
│   │   │   │   │   │       ├── coordinateResolver.ts
│   │   │   │   │   │       ├── domTree.ts
│   │   │   │   │   │       ├── focusSelectors.ts
│   │   │   │   │   │       ├── index.ts
│   │   │   │   │   │       ├── sessions.ts
│   │   │   │   │   │       ├── treeFormatUtils.ts
│   │   │   │   │   │       └── xpathUtils.ts
│   │   │   │   │   ├── a11yInvocation.ts
│   │   │   │   │   ├── cdp.ts
│   │   │   │   │   ├── consoleMessage.ts
│   │   │   │   │   ├── context.ts
│   │   │   │   │   ├── cookies.ts
│   │   │   │   │   ├── deepLocator.ts
│   │   │   │   │   ├── executionContextRegistry.ts
│   │   │   │   │   ├── fileUploadUtils.ts
│   │   │   │   │   ├── frame.ts
│   │   │   │   │   ├── frameLocator.ts
│   │   │   │   │   ├── frameRegistry.ts
│   │   │   │   │   ├── initScripts.ts
│   │   │   │   │   ├── lifecycleWatcher.ts
│   │   │   │   │   ├── locator.ts
│   │   │   │   │   ├── locatorInvocation.ts
│   │   │   │   │   ├── navigationResponseTracker.ts
│   │   │   │   │   ├── networkManager.ts
│   │   │   │   │   ├── page.ts
│   │   │   │   │   ├── piercer.ts
│   │   │   │   │   ├── response.ts
│   │   │   │   │   ├── screenshotUtils.ts
│   │   │   │   │   └── selectorResolver.ts
│   │   │   │   ├── v3.ts
│   │   │   │   └── zodCompat.ts
│   │   │   └── v3Evaluator.ts
│   │   ├── package.json
│   │   ├── scripts/
│   │   │   ├── build-cjs.ts
│   │   │   ├── build-esm.ts
│   │   │   ├── coverage.ts
│   │   │   ├── gen-version.ts
│   │   │   ├── normalize-v8-coverage.ts
│   │   │   ├── prepare.js
│   │   │   ├── test-core.ts
│   │   │   ├── test-e2e.ts
│   │   │   └── test-utils.ts
│   │   ├── tests/
│   │   │   ├── cache-variables.test.ts
│   │   │   ├── integration/
│   │   │   │   ├── agent-abort-signal.spec.ts
│   │   │   │   ├── agent-cache-self-heal.spec.ts
│   │   │   │   ├── agent-callbacks.spec.ts
│   │   │   │   ├── agent-captcha-autosolve.spec.ts
│   │   │   │   ├── agent-experimental-validation.spec.ts
│   │   │   │   ├── agent-hybrid-mode.spec.ts
│   │   │   │   ├── agent-message-continuation.spec.ts
│   │   │   │   ├── agent-streaming.spec.ts
│   │   │   │   ├── cdp-close-api-region.spec.ts
│   │   │   │   ├── cdp-connection-close.spec.ts
│   │   │   │   ├── cdp-session-detached.spec.ts
│   │   │   │   ├── click-count.spec.ts
│   │   │   │   ├── connect-to-existing-browser.spec.ts
│   │   │   │   ├── context-addInitScript.spec.ts
│   │   │   │   ├── context-extra-http-headers.spec.ts
│   │   │   │   ├── cookies.spec.ts
│   │   │   │   ├── default-page-tracking.spec.ts
│   │   │   │   ├── downloads.spec.ts
│   │   │   │   ├── flowLogger.spec.ts
│   │   │   │   ├── frame-get-location-and-click.spec.ts
│   │   │   │   ├── iframe-ctx-addInitScript-race.spec.ts
│   │   │   │   ├── iframe-ctx-addInitScript.spec.ts
│   │   │   │   ├── keep-alive.child.ts
│   │   │   │   ├── keep-alive.spec.ts
│   │   │   │   ├── keyboard.spec.ts
│   │   │   │   ├── locator-backend-node-id.spec.ts
│   │   │   │   ├── locator-content-methods.spec.ts
│   │   │   │   ├── locator-count-iframe.spec.ts
│   │   │   │   ├── locator-count.spec.ts
│   │   │   │   ├── locator-fill.spec.ts
│   │   │   │   ├── locator-input-methods.spec.ts
│   │   │   │   ├── locator-nth.spec.ts
│   │   │   │   ├── locator-select-option.spec.ts
│   │   │   │   ├── logger-initialization.spec.ts
│   │   │   │   ├── multi-instance-logger.spec.ts
│   │   │   │   ├── nested-div.spec.ts
│   │   │   │   ├── page-addInitScript.spec.ts
│   │   │   │   ├── page-console.spec.ts
│   │   │   │   ├── page-drag-and-drop.spec.ts
│   │   │   │   ├── page-extra-http-headers.spec.ts
│   │   │   │   ├── page-goto-response.spec.ts
│   │   │   │   ├── page-hover.spec.ts
│   │   │   │   ├── page-screenshot.spec.ts
│   │   │   │   ├── page-scroll.spec.ts
│   │   │   │   ├── page-send-cdp.spec.ts
│   │   │   │   ├── perform-understudy-method.spec.ts
│   │   │   │   ├── setinputfiles.spec.ts
│   │   │   │   ├── shadow-iframe-oopif.spec.ts
│   │   │   │   ├── shadow-iframe-spif.spec.ts
│   │   │   │   ├── testUtils.ts
│   │   │   │   ├── text-selector-innermost.spec.ts
│   │   │   │   ├── timeouts.spec.ts
│   │   │   │   ├── user-data-dir.spec.ts
│   │   │   │   ├── v3.config.ts
│   │   │   │   ├── v3.dynamic.config.ts
│   │   │   │   ├── v3.playwright.config.ts
│   │   │   │   ├── wait-for-selector.spec.ts
│   │   │   │   ├── wait-for-timeout.spec.ts
│   │   │   │   └── xpath-for-location-deep.spec.ts
│   │   │   └── unit/
│   │   │       ├── agent-captcha-hooks.test.ts
│   │   │       ├── agent-execution-model.test.ts
│   │   │       ├── api-multiregion.test.ts
│   │   │       ├── browserbase-session-accessors.test.ts
│   │   │       ├── cache-llm-resolution.test.ts
│   │   │       ├── captcha-solver.test.ts
│   │   │       ├── cdp-connection-close.test.ts
│   │   │       ├── context-extra-http-headers.test.ts
│   │   │       ├── cookies.test.ts
│   │   │       ├── flowlogger-capturing-cdp.test.ts
│   │   │       ├── flowlogger-capturing-llm.test.ts
│   │   │       ├── flowlogger-eventstore.test.ts
│   │   │       ├── helpers/
│   │   │       │   └── mockCDPSession.ts
│   │   │       ├── llm-provider.test.ts
│   │   │       ├── model-deprecation.test.ts
│   │   │       ├── model-utils.test.ts
│   │   │       ├── openai-cua-client.test.ts
│   │   │       ├── page-extra-http-headers.test.ts
│   │   │       ├── page-snapshot.test.ts
│   │   │       ├── public-api/
│   │   │       │   ├── export-surface.test.ts
│   │   │       │   ├── llm-and-agents.test.ts
│   │   │       │   ├── public-error-types.test.ts
│   │   │       │   ├── public-types.test.ts
│   │   │       │   ├── runtime-utils.test.ts
│   │   │       │   ├── schema-utils.test.ts
│   │   │       │   ├── timeout-error-types.test.ts
│   │   │       │   ├── tool-type-export.test.ts
│   │   │       │   └── v3-core.test.ts
│   │   │       ├── safety-confirmation.test.ts
│   │   │       ├── snapshot-a11y-resolvers.test.ts
│   │   │       ├── snapshot-a11y-tree-utils.test.ts
│   │   │       ├── snapshot-capture-orchestration.test.ts
│   │   │       ├── snapshot-cbor.test.ts
│   │   │       ├── snapshot-dom-session-builders.test.ts
│   │   │       ├── snapshot-dom-tree-utils.test.ts
│   │   │       ├── snapshot-focus-selectors-utils.test.ts
│   │   │       ├── snapshot-frame-merge.test.ts
│   │   │       ├── snapshot-tree-format-utils.test.ts
│   │   │       ├── snapshot-xpath-utils.test.ts
│   │   │       ├── timeout-handlers.test.ts
│   │   │       ├── understudy-command-exception.test.ts
│   │   │       ├── xpath-parser.test.ts
│   │   │       ├── xpath-resolver.test.ts
│   │   │       └── zod-enum-compatibility.test.ts
│   │   ├── tsconfig.json
│   │   ├── vitest.cjs.config.mjs
│   │   ├── vitest.config.ts
│   │   └── vitest.esm.config.mjs
│   ├── docs/
│   │   ├── .gitignore
│   │   ├── README.md
│   │   ├── docs.json
│   │   ├── language-selector.js
│   │   ├── package.json
│   │   ├── scripts/
│   │   │   ├── runtimePaths.js
│   │   │   └── sync-sdk-docs.js
│   │   ├── snippets/
│   │   │   ├── excalidraw.mdx
│   │   │   └── v3-banner.mdx
│   │   ├── v2/
│   │   │   ├── basics/
│   │   │   │   ├── act.mdx
│   │   │   │   ├── agent.mdx
│   │   │   │   ├── extract.mdx
│   │   │   │   └── observe.mdx
│   │   │   ├── best-practices/
│   │   │   │   ├── agent-fallbacks.mdx
│   │   │   │   ├── build-agent.mdx
│   │   │   │   ├── caching.mdx
│   │   │   │   ├── computer-use.mdx
│   │   │   │   ├── contributing.mdx
│   │   │   │   ├── cost-optimization.mdx
│   │   │   │   ├── deployments.mdx
│   │   │   │   ├── mcp-integrations.mdx
│   │   │   │   ├── playwright-interop.mdx
│   │   │   │   ├── prompting-best-practices.mdx
│   │   │   │   ├── speed-optimization.mdx
│   │   │   │   ├── usecase-observe.mdx
│   │   │   │   ├── user-data.mdx
│   │   │   │   ├── using-multiple-tabs.mdx
│   │   │   │   └── working-with-iframes.mdx
│   │   │   ├── configuration/
│   │   │   │   ├── browser.mdx
│   │   │   │   ├── evals.mdx
│   │   │   │   ├── logging.mdx
│   │   │   │   ├── models.mdx
│   │   │   │   └── observability.mdx
│   │   │   ├── first-steps/
│   │   │   │   ├── ai-rules.mdx
│   │   │   │   ├── installation.mdx
│   │   │   │   ├── introduction.mdx
│   │   │   │   └── quickstart.mdx
│   │   │   ├── integrations/
│   │   │   │   ├── crew-ai/
│   │   │   │   │   ├── configuration.mdx
│   │   │   │   │   └── introduction.mdx
│   │   │   │   ├── langchain/
│   │   │   │   │   ├── configuration.mdx
│   │   │   │   │   └── introduction.mdx
│   │   │   │   ├── mcp/
│   │   │   │   │   ├── configuration.mdx
│   │   │   │   │   ├── introduction.mdx
│   │   │   │   │   ├── setup.mdx
│   │   │   │   │   └── tools.mdx
│   │   │   │   └── vercel/
│   │   │   │       ├── configuration.mdx
│   │   │   │       └── introduction.mdx
│   │   │   └── references/
│   │   │       ├── act.mdx
│   │   │       ├── agent.mdx
│   │   │       ├── extract.mdx
│   │   │       ├── observe.mdx
│   │   │       └── stagehand.mdx
│   │   └── v3/
│   │       ├── basics/
│   │       │   ├── act.mdx
│   │       │   ├── agent.mdx
│   │       │   ├── evals.mdx
│   │       │   ├── extract.mdx
│   │       │   └── observe.mdx
│   │       ├── best-practices/
│   │       │   ├── agent-fallbacks.mdx
│   │       │   ├── caching.mdx
│   │       │   ├── computer-use.mdx
│   │       │   ├── cost-optimization.mdx
│   │       │   ├── deployments.mdx
│   │       │   ├── deterministic-agent.mdx
│   │       │   ├── history.mdx
│   │       │   ├── mcp-integrations.mdx
│   │       │   ├── prompting-best-practices.mdx
│   │       │   ├── speed-optimization.mdx
│   │       │   ├── usecase-observe.mdx
│   │       │   ├── user-data.mdx
│   │       │   └── using-multiple-tabs.mdx
│   │       ├── configuration/
│   │       │   ├── browser.mdx
│   │       │   ├── logging.mdx
│   │       │   ├── models.mdx
│   │       │   └── observability.mdx
│   │       ├── first-steps/
│   │       │   ├── ai-rules.mdx
│   │       │   ├── installation.mdx
│   │       │   ├── introduction.mdx
│   │       │   └── quickstart.mdx
│   │       ├── integrations/
│   │       │   ├── convex/
│   │       │   │   ├── configuration.mdx
│   │       │   │   └── introduction.mdx
│   │       │   ├── crew-ai/
│   │       │   │   ├── configuration.mdx
│   │       │   │   └── introduction.mdx
│   │       │   ├── langchain/
│   │       │   │   ├── configuration.mdx
│   │       │   │   └── introduction.mdx
│   │       │   ├── mcp/
│   │       │   │   ├── configuration.mdx
│   │       │   │   ├── introduction.mdx
│   │       │   │   ├── setup.mdx
│   │       │   │   └── tools.mdx
│   │       │   ├── playwright.mdx
│   │       │   ├── puppeteer.mdx
│   │       │   ├── selenium.mdx
│   │       │   └── vercel/
│   │       │       ├── configuration.mdx
│   │       │       └── introduction.mdx
│   │       ├── migrations/
│   │       │   ├── python.mdx
│   │       │   └── v2.mdx
│   │       ├── references/
│   │       │   ├── act.mdx
│   │       │   ├── agent.mdx
│   │       │   ├── context.mdx
│   │       │   ├── deeplocator.mdx
│   │       │   ├── extract.mdx
│   │       │   ├── locator.mdx
│   │       │   ├── observe.mdx
│   │       │   ├── page.mdx
│   │       │   ├── response.mdx
│   │       │   └── stagehand.mdx
│   │       └── sdk/
│   │           ├── go.mdx
│   │           ├── java.mdx
│   │           ├── python.mdx
│   │           └── ruby.mdx
│   ├── evals/
│   │   ├── CHANGELOG.md
│   │   ├── README.md
│   │   ├── args.ts
│   │   ├── assets/
│   │   │   ├── cart.html
│   │   │   └── peeler.html
│   │   ├── browserbaseCleanup.ts
│   │   ├── cli.ts
│   │   ├── datasets/
│   │   │   ├── gaia/
│   │   │   │   └── GAIA_web.jsonl
│   │   │   ├── onlineMind2Web/
│   │   │   │   └── onlineMind2Web.jsonl
│   │   │   ├── webtailbench/
│   │   │   │   └── WebTailBench_data.jsonl
│   │   │   └── webvoyager/
│   │   │       └── WebVoyager_data.jsonl
│   │   ├── env.ts
│   │   ├── evals.config.json
│   │   ├── index.eval.ts
│   │   ├── initV3.ts
│   │   ├── lib/
│   │   │   └── AISdkClientWrapped.ts
│   │   ├── llm_clients/
│   │   │   ├── hn_aisdk.ts
│   │   │   ├── hn_customOpenAI.ts
│   │   │   └── hn_langchain.ts
│   │   ├── logger.ts
│   │   ├── package.json
│   │   ├── run.ts
│   │   ├── runtimePaths.ts
│   │   ├── scoring.ts
│   │   ├── scripts/
│   │   │   ├── build-cli.ts
│   │   │   ├── build-esm.ts
│   │   │   └── test-evals.ts
│   │   ├── suites/
│   │   │   ├── gaia.ts
│   │   │   ├── onlineMind2Web.ts
│   │   │   ├── webtailbench.ts
│   │   │   └── webvoyager.ts
│   │   ├── summary.ts
│   │   ├── taskConfig.ts
│   │   ├── tasks/
│   │   │   ├── agent/
│   │   │   │   ├── alibaba_supplier_search.ts
│   │   │   │   ├── all_recipes.ts
│   │   │   │   ├── amazon_shoes_cart.ts
│   │   │   │   ├── apple_trade_in.ts
│   │   │   │   ├── apple_tv.ts
│   │   │   │   ├── arxiv_gpt_report.ts
│   │   │   │   ├── columbia_tuition.ts
│   │   │   │   ├── flipkart_laptops.ts
│   │   │   │   ├── gaia.ts
│   │   │   │   ├── github.ts
│   │   │   │   ├── github_react_version.ts
│   │   │   │   ├── google_flights.ts
│   │   │   │   ├── google_maps.ts
│   │   │   │   ├── google_maps_2.ts
│   │   │   │   ├── google_maps_3.ts
│   │   │   │   ├── google_shopping.ts
│   │   │   │   ├── hotel_booking.ts
│   │   │   │   ├── hotels_paris_amenities.ts
│   │   │   │   ├── hugging_face.ts
│   │   │   │   ├── iframe_form.ts
│   │   │   │   ├── iframe_form_multiple.ts
│   │   │   │   ├── instacart_organic_bananas.ts
│   │   │   │   ├── kayak.ts
│   │   │   │   ├── kfc_tenders_combo.ts
│   │   │   │   ├── kith.ts
│   │   │   │   ├── made_in_china_supplier.ts
│   │   │   │   ├── nba_trades.ts
│   │   │   │   ├── nvidia_hgx_driver.ts
│   │   │   │   ├── oed_word_search.ts
│   │   │   │   ├── onlineMind2Web.ts
│   │   │   │   ├── radiotimes_tv_schedule.ts
│   │   │   │   ├── redfin_apartment_rental.ts
│   │   │   │   ├── sf_library_card.ts
│   │   │   │   ├── sf_library_card_multiple.ts
│   │   │   │   ├── sign_in.ts
│   │   │   │   ├── steam_games.ts
│   │   │   │   ├── thegamer_opinion_article.ts
│   │   │   │   ├── trailhead_superbadge.ts
│   │   │   │   ├── trivago.ts
│   │   │   │   ├── trustpilot_hr_companies.ts
│   │   │   │   ├── ubereats.ts
│   │   │   │   ├── uniqlo_mens_blazers.ts
│   │   │   │   ├── webmd_audiologist_search.ts
│   │   │   │   ├── webmd_ovulation_calculator.ts
│   │   │   │   ├── webtailbench.ts
│   │   │   │   └── webvoyager.ts
│   │   │   ├── allrecipes.ts
│   │   │   ├── amazon_add_to_cart.ts
│   │   │   ├── apple.ts
│   │   │   ├── arxiv.ts
│   │   │   ├── bidnet.ts
│   │   │   ├── checkboxes.ts
│   │   │   ├── combination_sauce.ts
│   │   │   ├── costar.ts
│   │   │   ├── csr_in_oopif.ts
│   │   │   ├── csr_in_spif.ts
│   │   │   ├── custom_dropdown.ts
│   │   │   ├── dropdown.ts
│   │   │   ├── extract_aigrant_companies.ts
│   │   │   ├── extract_aigrant_targeted.ts
│   │   │   ├── extract_aigrant_targeted_2.ts
│   │   │   ├── extract_apartments.ts
│   │   │   ├── extract_area_codes.ts
│   │   │   ├── extract_baptist_health.ts
│   │   │   ├── extract_capacitor_info.ts
│   │   │   ├── extract_collaborators.ts
│   │   │   ├── extract_csa.ts
│   │   │   ├── extract_geniusee.ts
│   │   │   ├── extract_geniusee_2.ts
│   │   │   ├── extract_github_commits.ts
│   │   │   ├── extract_github_stars.ts
│   │   │   ├── extract_hamilton_weather.ts
│   │   │   ├── extract_jfk_links.ts
│   │   │   ├── extract_jstor_news.ts
│   │   │   ├── extract_memorial_healthcare.ts
│   │   │   ├── extract_nhl_stats.ts
│   │   │   ├── extract_partners.ts
│   │   │   ├── extract_press_releases.ts
│   │   │   ├── extract_professional_info.ts
│   │   │   ├── extract_public_notices.ts
│   │   │   ├── extract_recipe.ts
│   │   │   ├── extract_regulations_table.ts
│   │   │   ├── extract_repo_name.ts
│   │   │   ├── extract_resistor_info.ts
│   │   │   ├── extract_rockauto.ts
│   │   │   ├── extract_single_link.ts
│   │   │   ├── extract_snowshoeing_destinations.ts
│   │   │   ├── extract_staff_members.ts
│   │   │   ├── extract_zillow.ts
│   │   │   ├── google_flights.ts
│   │   │   ├── heal_custom_dropdown.ts
│   │   │   ├── heal_scroll_50.ts
│   │   │   ├── heal_simple_google_search.ts
│   │   │   ├── hidden_input_dropdown.ts
│   │   │   ├── history.ts
│   │   │   ├── homedepot.ts
│   │   │   ├── iframe_form_filling.ts
│   │   │   ├── iframe_hn.ts
│   │   │   ├── iframe_same_proc.ts
│   │   │   ├── iframe_scroll.ts
│   │   │   ├── iframes_nested.ts
│   │   │   ├── imdb_movie_details.ts
│   │   │   ├── instructions.ts
│   │   │   ├── ionwave.ts
│   │   │   ├── ionwave_observe.ts
│   │   │   ├── login.ts
│   │   │   ├── multi_tab.ts
│   │   │   ├── namespace_xpath.ts
│   │   │   ├── nested_iframes_2.ts
│   │   │   ├── next_chunk.ts
│   │   │   ├── no_js_click.ts
│   │   │   ├── nonsense_action.ts
│   │   │   ├── observe_amazon_add_to_cart.ts
│   │   │   ├── observe_github.ts
│   │   │   ├── observe_iframes1.ts
│   │   │   ├── observe_iframes2.ts
│   │   │   ├── observe_simple_google_search.ts
│   │   │   ├── observe_taxes.ts
│   │   │   ├── observe_vantechjournal.ts
│   │   │   ├── observe_yc_startup.ts
│   │   │   ├── oopif_in_csr.ts
│   │   │   ├── oopif_in_osr.ts
│   │   │   ├── os_dropdown.ts
│   │   │   ├── osr_in_oopif.ts
│   │   │   ├── osr_in_spif.ts
│   │   │   ├── panamcs.ts
│   │   │   ├── peeler_complex.ts
│   │   │   ├── prev_chunk.ts
│   │   │   ├── radio_btn.ts
│   │   │   ├── rakuten_jp.ts
│   │   │   ├── sciquest.ts
│   │   │   ├── scroll_50.ts
│   │   │   ├── scroll_75.ts
│   │   │   ├── shadow_dom.ts
│   │   │   ├── simple_google_search.ts
│   │   │   ├── spif_in_csr.ts
│   │   │   ├── spif_in_osr.ts
│   │   │   ├── stock_x.ts
│   │   │   ├── tab_handling.ts
│   │   │   ├── ted_talk.ts
│   │   │   ├── vanta_h.ts
│   │   │   ├── vantechjournal.ts
│   │   │   ├── wichita.ts
│   │   │   └── wikipedia.ts
│   │   ├── tsconfig.json
│   │   ├── types/
│   │   │   ├── evals.ts
│   │   │   └── screenshotCollector.ts
│   │   ├── utils/
│   │   │   ├── ScreenshotCollector.ts
│   │   │   └── imageResize.ts
│   │   └── utils.ts
│   ├── server-v3/
│   │   ├── CHANGELOG.md
│   │   ├── README.md
│   │   ├── SDK_RELEASE_WORKFLOW.md
│   │   ├── openapi.v3.yaml
│   │   ├── package.json
│   │   ├── scripts/
│   │   │   ├── build-sea.ts
│   │   │   ├── gen-openapi.ts
│   │   │   ├── runtimePaths.ts
│   │   │   └── test-server.ts
│   │   ├── src/
│   │   │   ├── lib/
│   │   │   │   ├── InMemorySessionStore.ts
│   │   │   │   ├── SessionStore.ts
│   │   │   │   ├── auth.ts
│   │   │   │   ├── env.ts
│   │   │   │   ├── errorHandler.ts
│   │   │   │   ├── header.ts
│   │   │   │   ├── logging/
│   │   │   │   │   └── index.ts
│   │   │   │   ├── response.ts
│   │   │   │   ├── sessionStoreManager.ts
│   │   │   │   ├── stream.ts
│   │   │   │   └── utils.ts
│   │   │   ├── routes/
│   │   │   │   ├── healthcheck.ts
│   │   │   │   ├── readiness.ts
│   │   │   │   └── v1/
│   │   │   │       └── sessions/
│   │   │   │           ├── _id/
│   │   │   │           │   ├── act.ts
│   │   │   │           │   ├── agentExecute.ts
│   │   │   │           │   ├── end.ts
│   │   │   │           │   ├── extract.ts
│   │   │   │           │   ├── navigate.ts
│   │   │   │           │   ├── observe.ts
│   │   │   │           │   └── replay.ts
│   │   │   │           └── start.ts
│   │   │   ├── sea-entry.ts
│   │   │   ├── server.ts
│   │   │   └── types/
│   │   │       ├── error.ts
│   │   │       ├── fastify.d.ts
│   │   │       ├── model.ts
│   │   │       └── rrweb.ts
│   │   ├── test/
│   │   │   └── integration/
│   │   │       ├── api-server-cache.test.ts
│   │   │       ├── utils.ts
│   │   │       └── v3/
│   │   │           ├── act.test.ts
│   │   │           ├── agentExecute.test.ts
│   │   │           ├── end.test.ts
│   │   │           ├── extract.test.ts
│   │   │           ├── multiRegion.test.ts
│   │   │           ├── navigate.test.ts
│   │   │           ├── observe.test.ts
│   │   │           ├── replay.test.ts
│   │   │           └── start.test.ts
│   │   ├── tsconfig.json
│   │   ├── tsconfig.tests.json
│   │   └── vitest.config.ts
│   └── server-v4/
│       ├── CHANGELOG.md
│       ├── README.md
│       ├── openapi.v4.yaml
│       ├── package.json
│       ├── scripts/
│       │   ├── build-sea.ts
│       │   ├── gen-openapi.ts
│       │   ├── runtimePaths.ts
│       │   └── test-server.ts
│       ├── src/
│       │   ├── routes/
│       │   │   ├── healthcheck.ts
│       │   │   ├── readiness.ts
│       │   │   └── v4/
│       │   │       ├── browsersession/
│       │   │       │   ├── _id/
│       │   │       │   │   ├── end.ts
│       │   │       │   │   └── index.ts
│       │   │       │   ├── action/
│       │   │       │   │   ├── _actionId.ts
│       │   │       │   │   └── index.ts
│       │   │       │   ├── activePage.ts
│       │   │       │   ├── addCookies.ts
│       │   │       │   ├── addInitScript.ts
│       │   │       │   ├── awaitActivePage.ts
│       │   │       │   ├── browserbaseDebugURL.ts
│       │   │       │   ├── browserbaseSessionID.ts
│       │   │       │   ├── browserbaseSessionURL.ts
│       │   │       │   ├── clearCookies.ts
│       │   │       │   ├── configuredViewport.ts
│       │   │       │   ├── connectURL.ts
│       │   │       │   ├── cookies.ts
│       │   │       │   ├── getFullFrameTreeByMainFrameId.ts
│       │   │       │   ├── index.ts
│       │   │       │   ├── newPage.ts
│       │   │       │   ├── pages.ts
│       │   │       │   ├── resolvePageByMainFrameId.ts
│       │   │       │   ├── routes.ts
│       │   │       │   ├── setExtraHTTPHeaders.ts
│       │   │       │   └── shared.ts
│       │   │       ├── page/
│       │   │       │   ├── action/
│       │   │       │   │   ├── _actionId.ts
│       │   │       │   │   └── index.ts
│       │   │       │   ├── addInitScript.ts
│       │   │       │   ├── asProtocolFrameTree.ts
│       │   │       │   ├── click.ts
│       │   │       │   ├── close.ts
│       │   │       │   ├── dragAndDrop.ts
│       │   │       │   ├── enableCursorOverlay.ts
│       │   │       │   ├── evaluate.ts
│       │   │       │   ├── frames.ts
│       │   │       │   ├── getFullFrameTree.ts
│       │   │       │   ├── getOrdinal.ts
│       │   │       │   ├── goBack.ts
│       │   │       │   ├── goForward.ts
│       │   │       │   ├── goto.ts
│       │   │       │   ├── hover.ts
│       │   │       │   ├── keyPress.ts
│       │   │       │   ├── listAllFrameIds.ts
│       │   │       │   ├── mainFrame.ts
│       │   │       │   ├── mainFrameId.ts
│       │   │       │   ├── reload.ts
│       │   │       │   ├── routes.ts
│       │   │       │   ├── screenshot.ts
│       │   │       │   ├── scroll.ts
│       │   │       │   ├── sendCDP.ts
│       │   │       │   ├── setExtraHTTPHeaders.ts
│       │   │       │   ├── setViewportSize.ts
│       │   │       │   ├── shared.ts
│       │   │       │   ├── snapshot.ts
│       │   │       │   ├── targetId.ts
│       │   │       │   ├── title.ts
│       │   │       │   ├── type.ts
│       │   │       │   ├── url.ts
│       │   │       │   ├── waitForLoadState.ts
│       │   │       │   ├── waitForMainLoadState.ts
│       │   │       │   ├── waitForSelector.ts
│       │   │       │   └── waitForTimeout.ts
│       │   │       └── pluginUtils.ts
│       │   ├── schemas/
│       │   │   └── v4/
│       │   │       ├── browserSession.ts
│       │   │       └── page.ts
│       │   ├── sea-entry.ts
│       │   ├── server.ts
│       │   └── types/
│       │       ├── error.ts
│       │       ├── fastify.d.ts
│       │       ├── model.ts
│       │       └── rrweb.ts
│       ├── test/
│       │   └── integration/
│       │       ├── utils.ts
│       │       └── v4/
│       │           ├── browsersession.test.ts
│       │           └── page.test.ts
│       ├── tsconfig.json
│       ├── tsconfig.tests.json
│       └── vitest.config.ts
├── pnpm-workspace.yaml
├── stainless.yml
├── tsconfig.base.json
├── tsconfig.json
└── turbo.json

================================================
FILE CONTENTS
================================================

================================================
FILE: .changeset/config.json
================================================
{
  "$schema": "https://unpkg.com/@changesets/config@2.1.1/schema.json",
  "commit": false,
  "fixed": [],
  "linked": [],
  "baseBranch": "main",
  "updateInternalDependencies": "patch",
  "access": "public",
  "changelog": [
    "@changesets/changelog-github",
    {
      "repo": "browserbase/stagehand"
    }
  ],
  "snapshot": {
    "useCalculatedVersion": true,
    "prereleaseTemplate": "alpha-{commit}",
    "tag": "alpha"
  }
}


================================================
FILE: .changeset/crazy-nights-prove.md
================================================
---
"@browserbasehq/stagehand": patch
---

Apply the user-defined `toolTimeout` to all agent tools (except the wait and think tools).


================================================
FILE: .cursorrules
================================================
# Stagehand Project

This is a project that uses Stagehand V3, a browser automation framework with AI-powered `act`, `extract`, `observe`, and `agent` methods.

The main class can be imported as `Stagehand` from `@browserbasehq/stagehand`.

**Key Classes:**

- `Stagehand`: Main orchestrator class providing `act`, `extract`, `observe`, and `agent` methods
- `context`: A `V3Context` object that manages browser contexts and pages
- `page`: Individual page objects accessed via `stagehand.context.pages()[i]` or created with `stagehand.context.newPage()`

## Initialize

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "LOCAL", // or "BROWSERBASE"
  verbose: 2, // 0, 1, or 2
  model: "openai/gpt-4.1-mini", // or any supported model
});

await stagehand.init();

// Access the browser context and pages
const page = stagehand.context.pages()[0];
const context = stagehand.context;

// Create new pages if needed
const page2 = await stagehand.context.newPage();
```

## Act

Actions are called on the `stagehand` instance (not the page). Use atomic, specific instructions:

```typescript
// Act on the current active page
await stagehand.act("click the sign in button");

// Act on a specific page (when you need to target a page that isn't currently active)
await stagehand.act("click the sign in button", { page: page2 });
```

**Important:** Act instructions should be atomic and specific:

- ✅ Good: "Click the sign in button" or "Type 'hello' into the search input"
- ❌ Bad: "Order me pizza" or "Type in the search bar and hit enter" (multi-step)

### Observe + Act Pattern (Recommended)

Cache the results of `observe` to avoid unexpected DOM changes:

```typescript
const instruction = "Click the sign in button";

// Get candidate actions
const actions = await stagehand.observe(instruction);

// Execute the first action
await stagehand.act(actions[0]);
```

To target a specific page:

```typescript
const actions = await stagehand.observe("select blue as the favorite color", {
  page: page2,
});
await stagehand.act(actions[0], { page: page2 });
```

## Extract

Extract data from pages using natural language instructions. The `extract` method is called on the `stagehand` instance.

### Basic Extraction (with schema)

```typescript
import { z } from "zod";

// Extract with explicit schema
const data = await stagehand.extract(
  "extract all apartment listings with prices and addresses",
  z.object({
    listings: z.array(
      z.object({
        price: z.string(),
        address: z.string(),
      }),
    ),
  }),
);

console.log(data.listings);
```

### Simple Extraction (without schema)

```typescript
// Extract returns a default object with 'extraction' field
const result = await stagehand.extract("extract the sign in button text");

console.log(result);
// Output: { extraction: "Sign in" }

// Or destructure directly
const { extraction } = await stagehand.extract(
  "extract the sign in button text",
);
console.log(extraction); // "Sign in"
```

### Targeted Extraction

Extract data from a specific element using a selector:

```typescript
const reason = await stagehand.extract(
  "extract the reason why script injection fails",
  z.string(),
  { selector: "/html/body/div[2]/div[3]/iframe/html/body/p[2]" },
);
```

### URL Extraction

When extracting links or URLs, use `z.string().url()`:

```typescript
const { links } = await stagehand.extract(
  "extract all navigation links",
  z.object({
    links: z.array(z.string().url()),
  }),
);
```

### Extracting from a Specific Page

```typescript
// Extract from a specific page (when you need to target a page that isn't currently active)
const data = await stagehand.extract(
  "extract the placeholder text on the name field",
  { page: page2 },
);
```

## Observe

Plan actions before executing them. Returns an array of candidate actions:

```typescript
// Get candidate actions on the current active page
const [action] = await stagehand.observe("Click the sign in button");

// Execute the action
await stagehand.act(action);
```

Observing on a specific page:

```typescript
// Target a specific page (when you need to target a page that isn't currently active)
const actions = await stagehand.observe("find the next page button", {
  page: page2,
});
await stagehand.act(actions[0], { page: page2 });
```

## Agent

Use the `agent` method to autonomously execute complex, multi-step tasks.

### Basic Agent Usage

```typescript
const page = stagehand.context.pages()[0];
await page.goto("https://www.google.com");

const agent = stagehand.agent({
  model: "google/gemini-2.0-flash",
  executionModel: "google/gemini-2.0-flash",
});

const result = await agent.execute({
  instruction: "Search for the stock price of NVDA",
  maxSteps: 20,
});

console.log(result.message);
```

### Computer Use Agent (CUA)

For more advanced scenarios using computer-use models:

```typescript
const agent = stagehand.agent({
  mode: "cua", // Enable Computer Use Agent mode
  model: "anthropic/claude-sonnet-4-20250514",
  // or "google/gemini-2.5-computer-use-preview-10-2025"
  systemPrompt: `You are a helpful assistant that can use a web browser.
    Do not ask follow up questions, the user will trust your judgement.`,
});

await agent.execute({
  instruction: "Apply for a library card at the San Francisco Public Library",
  maxSteps: 30,
});
```

### Agent with Custom Model Configuration

```typescript
const agent = stagehand.agent({
  model: {
    modelName: "google/gemini-2.5-computer-use-preview-10-2025",
    apiKey: process.env.GEMINI_API_KEY,
  },
  systemPrompt: `You are a helpful assistant.`,
});
```

### Agent with Integrations (MCP/External Tools)

```typescript
const agent = stagehand.agent({
  integrations: [`https://mcp.exa.ai/mcp?exaApiKey=${process.env.EXA_API_KEY}`],
  systemPrompt: `You have access to the Exa search tool.`,
});
```

## Advanced Features

### DeepLocator (XPath Targeting)

Target specific elements across shadow DOM and iframes:

```typescript
await page
  .deepLocator("/html/body/div[2]/div[3]/iframe/html/body/p")
  .highlight({
    durationMs: 5000,
    contentColor: { r: 255, g: 0, b: 0 },
  });
```

### Multi-Page Workflows

```typescript
const page1 = stagehand.context.pages()[0];
await page1.goto("https://example.com");

const page2 = await stagehand.context.newPage();
await page2.goto("https://example2.com");

// Act/extract/observe operate on the current active page by default
// Pass { page } option to target a specific page
await stagehand.act("click button", { page: page1 });
await stagehand.extract("get title", { page: page2 });
```


================================================
FILE: .github/ISSUE_TEMPLATE/bug_report.md
================================================
---
name: Bug report
about: Detailed descriptions help us resolve issues faster
title: ''
labels: ''
assignees: ''

---

**Before submitting an issue, please:**

- [ ]  Check the [documentation](https://docs.stagehand.dev/) for relevant information
- [ ]  Search existing [issues](https://github.com/browserbase/stagehand/issues) to avoid duplicates

## Environment Information

Please provide the following information to help us reproduce and resolve your issue:

**Stagehand:**

- Language/SDK: [TypeScript, Python, MCP…]
- Stagehand version: [e.g., 1.0.0]

**AI Provider:**

- Provider: [e.g., OpenAI, Anthropic, Azure OpenAI]
- Model: [e.g., gpt-4o, claude-sonnet-4-6]

## Issue Description

```
[Describe the current behavior here]

```

### Steps to Reproduce

1. 
2. 
3. 

### Minimal Reproduction Code

```tsx
// Your minimal reproduction code here
import { Stagehand } from '@browserbasehq/stagehand';

const stagehand = new Stagehand({
  // IMPORTANT: include your stagehand config
});

// Steps that reproduce the issue

```

### Error Messages / Log trace

```
[Paste error messages/logs here]

```

### Screenshots / Videos

```
[Attach screenshots or videos here]

```

### Related Issues

Are there any related issues or PRs?

- Related to: #[issue number]
- Duplicate of: #[issue number]
- Blocks: #[issue number]


================================================
FILE: .github/ISSUE_TEMPLATE/feature_request.md
================================================
---
name: Feature request
about: Suggest an idea for this project
title: ''
labels: ''
assignees: ''

---

**Is your feature request related to a problem? Please describe.**
A clear and concise description of what the problem is. Ex. I'm always frustrated when [...]

**Describe the solution you'd like**
A clear and concise description of what you want to happen.

**Describe alternatives you've considered**
A clear and concise description of any alternative solutions or features you've considered.

**Are you willing to contribute to implementing this feature or fix?**

- [ ]  Yes, I can submit a PR
- [ ]  Yes, but I need guidance
- [ ]  No, I cannot contribute at this time


================================================
FILE: .github/actions/select-browserbase-region/action.yml
================================================
# Composite action: picks one Browserbase region at random, weighted by the
# `distribution` input, and exposes it as the `region` output and as the
# BROWSERBASE_REGION environment variable.
name: Select Browserbase region
description: Select a Browserbase region based on a weighted distribution.
inputs:
  distribution:
    description: Comma-separated region=weight list (e.g. us-west-2=40,us-east-1=20).
    required: true
outputs:
  region:
    description: Selected region.
    value: ${{ steps.select.outputs.region }}
runs:
  using: composite
  steps:
    # Parses `distribution` into parallel region/weight arrays (whitespace is
    # stripped from both sides of each entry). The step fails on an empty
    # input, an entry with an empty region or weight, a region containing
    # characters outside [A-Za-z0-9-], a non-numeric weight, or a total
    # weight of zero. A roll in [0, total) taken from bash $RANDOM is then
    # mapped to the first region whose cumulative weight exceeds it.
    # NOTE(review): weights go into bash arithmetic unchanged, so a zero-padded
    # weight such as "08" would presumably be parsed as octal and error out —
    # confirm callers never pass padded values.
    # NOTE(review): $RANDOM is limited to 0..32767, so a total weight above
    # that range would skew the selection — confirm totals stay small.
    - id: select
      shell: bash
      run: |
        dist="${{ inputs.distribution }}"
        if [ -z "$dist" ]; then
          echo "BROWSERBASE_REGION_DISTRIBUTION is empty"
          exit 1
        fi
        IFS=',' read -r -a entries <<< "$dist"
        total=0
        regions=()
        weights=()
        for entry in "${entries[@]}"; do
          region="${entry%%=*}"
          weight="${entry#*=}"
          region="$(printf '%s' "$region" | tr -d '[:space:]')"
          weight="$(printf '%s' "$weight" | tr -d '[:space:]')"
          if [ -z "$region" ] || [ -z "$weight" ]; then
            echo "Invalid region distribution entry: $entry"
            exit 1
          fi
          if ! [[ "$region" =~ ^[A-Za-z0-9-]+$ ]]; then
            echo "Invalid region value: $region"
            exit 1
          fi
          if ! [[ "$weight" =~ ^[0-9]+$ ]]; then
            echo "Invalid weight for region $region: $weight"
            exit 1
          fi
          regions+=("$region")
          weights+=("$weight")
          total=$((total + weight))
        done
        if [ "$total" -le 0 ]; then
          echo "Invalid total weight: $total"
          exit 1
        fi
        roll=$((RANDOM % total))
        cumulative=0
        chosen=""
        for i in "${!regions[@]}"; do
          cumulative=$((cumulative + weights[i]))
          if [ "$roll" -lt "$cumulative" ]; then
            chosen="${regions[i]}"
            break
          fi
        done
        if [ -z "$chosen" ]; then
          echo "Failed to choose Browserbase region"
          exit 1
        fi
        echo "Selected Browserbase region: $chosen"
        echo "region=$chosen" >> "$GITHUB_OUTPUT"
        echo "BROWSERBASE_REGION=$chosen" >> "$GITHUB_ENV"


================================================
FILE: .github/actions/setup-node-pnpm-turbo/action.yml
================================================
# Composite action: sets up pnpm and Node.js (with setup-node's pnpm cache),
# optionally restores the local Turbo cache, installs dependencies, optionally
# downloads the "build-artifacts" artifact, and creates the CTRF directory plus
# the V8 coverage directory when NODE_V8_COVERAGE is set.
name: Setup Node, pnpm, and Turbo cache
description: Configure pnpm and Node.js with caching, restore Turbo cache, and install dependencies.
inputs:
  node-version:
    description: Node.js version to use.
    required: false
    default: "20.x"
  use-prebuilt-artifacts:
    description: Whether to download pre-built package from build artifacts.
    required: false
    default: "true"
  restore-turbo-cache:
    description: Whether to restore the local .turbo cache.
    required: false
    default: "true"

runs:
  using: composite
  steps:
    # No pnpm version is given here — presumably it is resolved from the
    # repository's package.json "packageManager" field; confirm.
    - uses: pnpm/action-setup@v4

    - name: Set up Node.js
      uses: actions/setup-node@v6
      with:
        node-version: ${{ inputs.node-version }}
        cache: 'pnpm'
        cache-dependency-path: '**/pnpm-lock.yaml'

    # Restore-only step. The primary key ends with the commit SHA; the
    # restore-keys prefix lets a run fall back to a cache saved for the same
    # lockfile/workspace/turbo config hash on a different commit.
    - name: Restore Turbo cache
      if: ${{ inputs.restore-turbo-cache == 'true' }}
      uses: actions/cache/restore@v4
      with:
        path: .turbo
        key: ${{ runner.os }}-turbo-${{ hashFiles('pnpm-lock.yaml', 'pnpm-workspace.yaml', 'package.json', 'turbo.json') }}-${{ github.sha }}
        restore-keys: |
          ${{ runner.os }}-turbo-${{ hashFiles('pnpm-lock.yaml', 'pnpm-workspace.yaml', 'package.json', 'turbo.json') }}-

    # --frozen-lockfile makes the install fail rather than update
    # pnpm-lock.yaml when it is out of sync with package.json.
    - name: Install dependencies
      shell: bash
      run: pnpm install --frozen-lockfile --prefer-offline
  
    # Extracts the "build-artifacts" artifact into the workspace root (path: .).
    - name: Download build artifacts
      if: ${{ inputs.use-prebuilt-artifacts == 'true' }}
      uses: actions/download-artifact@v4
      with:
        name: build-artifacts
        path: .
        merge-multiple: true

    # The coverage directory is only created when the calling job has set
    # NODE_V8_COVERAGE.
    - name: Prepare test output directories
      shell: bash
      run: |
        mkdir -p "${GITHUB_WORKSPACE}/ctrf"
        if [ -n "${NODE_V8_COVERAGE:-}" ]; then
          mkdir -p "$NODE_V8_COVERAGE"
        fi


================================================
FILE: .github/actions/upload-ctrf-report/action.yml
================================================
# Composite action: uploads a CTRF report as a workflow artifact. The artifact
# name is derived from the `name` input; the uploaded path is `path` when
# given, otherwise `name` itself.
name: Upload CTRF report
description: Upload CTRF report artifact.
inputs:
  name:
    description: Report path (used as artifact name when sanitized).
    required: true
  path:
    description: Optional explicit path (defaults to name).
    required: false
    default: ""

runs:
  using: composite
  steps:
    # Replaces every "/" in `name` with "-" for the artifact name — presumably
    # because upload-artifact does not accept slashes in names; confirm.
    # `path` falls back to the unsanitized `name` when the input is empty.
    - name: Normalize inputs
      id: normalize
      shell: bash
      run: |
        name="${{ inputs.name }}"
        echo "name=${name//\//-}" >> "$GITHUB_OUTPUT"
        if [ -n "${{ inputs.path }}" ]; then
          echo "path=${{ inputs.path }}" >> "$GITHUB_OUTPUT"
        else
          echo "path=${{ inputs.name }}" >> "$GITHUB_OUTPUT"
        fi

    - name: Upload CTRF report artifact
      uses: actions/upload-artifact@v4
      with:
        name: ${{ steps.normalize.outputs.name }}
        # package.json anchors uploaded paths to the repository root.
        path: |
          package.json
          ${{ steps.normalize.outputs.path }}


================================================
FILE: .github/actions/upload-v8-coverage/action.yml
================================================
# Composite action: uploads V8 coverage output as a workflow artifact. The
# artifact name is derived from the `name` input; the uploaded path is `path`
# when given, otherwise `name` itself.
name: Upload V8 coverage
description: Upload V8 coverage artifacts.
inputs:
  name:
    description: Artifact name.
    required: true
  path:
    description: Coverage path to upload (defaults to name).
    required: false
    default: ""

runs:
  using: composite
  steps:
    # Replaces every "/" in `name` with "-" for the artifact name — presumably
    # because upload-artifact does not accept slashes in names; confirm.
    # `path` falls back to the unsanitized `name` when the input is empty.
    - name: Normalize artifact name
      id: normalize
      shell: bash
      run: |
        name="${{ inputs.name }}"
        echo "name=${name//\//-}" >> "$GITHUB_OUTPUT"
        if [ -n "${{ inputs.path }}" ]; then
          echo "path=${{ inputs.path }}" >> "$GITHUB_OUTPUT"
        else
          echo "path=${{ inputs.name }}" >> "$GITHUB_OUTPUT"
        fi

    - name: Upload coverage artifact
      uses: actions/upload-artifact@v4
      with:
        name: ${{ steps.normalize.outputs.name }}
        # package.json anchors uploaded paths to the repository root.
        path: |
          package.json
          ${{ steps.normalize.outputs.path }}


================================================
FILE: .github/actions/verify-chromium-launch/action.yml
================================================
name: Verify Chromium launch
description: Validate that Chromium can start, accept a CDP connection, and evaluate a script in a page.
inputs:
  chrome-path:
    description: Path to Chromium/Chrome binary.
    required: false
    default: "/usr/bin/chromium"
  max-attempts:
    description: Number of launch attempts before failing.
    required: false
    default: "3"
  timeout-ms:
    description: Milliseconds to wait for DevTools and CDP per attempt.
    required: false
    default: "30000"
runs:
  using: composite
  steps:
    - shell: bash
      run: |
        set -euo pipefail
        max_attempts="${{ inputs.max-attempts }}"
        attempt=1
        while [ "$attempt" -le "$max_attempts" ]; do
          if [ -n "${{ inputs.chrome-path }}" ]; then
            pkill -f "${{ inputs.chrome-path }}" >/dev/null 2>&1 || true
          fi
          if node - <<'NODE'
        const { spawn } = require("node:child_process");
        const workspace = process.env.GITHUB_WORKSPACE;
        if (workspace) {
          process.chdir(workspace);
        }

        const chrome = "${{ inputs.chrome-path }}";

        const timeoutMs = Number("${{ inputs.timeout-ms }}");
        const wsPrefix = "DevTools listening on ";
        const sleep = (ms) => new Promise((resolve) => setTimeout(resolve, ms));

        let proc;
        let wsUrl;

        // Resolves with the DevTools WebSocket URL once `wsUrl` has been set,
        // checking every 250ms; rejects when `timeoutMs` has elapsed first.
        const waitForWsUrl = async () => {
          const giveUpAt = Date.now() + timeoutMs;
          for (;;) {
            if (wsUrl) {
              return wsUrl;
            }
            if (Date.now() > giveUpAt) {
              throw new Error(
                `❌ Chromium did not expose CDP WS URL within timeout (${timeoutMs}ms)`,
              );
            }
            await sleep(250);
          }
        };

        // Sends SIGKILL to the spawned Chromium process. Does nothing when no
        // process was started or a kill signal has already been delivered.
        const cleanup = () => {
          const nothingToKill = !proc || proc.killed;
          if (nothingToKill) {
            return;
          }
          proc.kill("SIGKILL");
        };

        (async () => {
          try {
            const startTime = Date.now();
            const args = [
              '--ash-no-nudges',
              '--block-new-web-contents',
              '--deny-permission-prompts',
              '--disable-breakpad',
              '--disable-client-side-phishing-detection',
              '--disable-component-update',
              '--disable-components=AcceptCHFrame,OptimizationHints,ProcessPerSiteUpToMainFrameThreshold,InterestFeedContentSuggestions,CalculateNativeWinOcclusion,BackForwardCache,HeavyAdPrivacyMitigations,LazyFrameLoading,ImprovedCookieControls,PrivacySandboxSettings4,AutofillServerCommunication,CertificateTransparencyComponentUpdater,DestroyProfileOnBrowserClose,CrashReporting,OverscrollHistoryNavigation,InfiniteSessionRestore',
              '--disable-datasaver-prompt',
              '--disable-default-apps',
              '--disable-desktop-notifications',
              '--disable-domain-reliability',
              '--disable-external-intent-requests',
              '--disable-hang-monitor',
              '--disable-infobars',
              '--disable-notifications',
              '--disable-popup-blocking',
              '--disable-print-preview',
              '--disable-prompt-on-repost',
              '--disable-search-engine-choice-screen',
              '--disable-session-crashed-bubble',
              '--disable-speech-api',
              '--disable-speech-synthesis-api',
              '--hide-crash-restore-bubble',
              '--metrics-recording-only',
              '--no-default-browser-check',
              '--no-first-run',
              '--no-pings',
              '--noerrdialogs',
              '--safebrowsing-disable-auto-update',
              '--silent-debugger-extension-api',
              '--simulate-outdated-no-au="Tue, 31 Dec 2099 23:59:59 GMT"',
              '--suppress-message-center-popups',
              "--disable-background-networking",
              "--disable-default-apps",
              "--disable-dev-shm-usage",
              "--disable-extensions",
              "--disable-notifications",
              "--disable-setuid-sandbox",
              "--disable-site-isolation-trials",
              "--disable-sync",
              "--disable-web-security",
              "--headless=new",
              "--no-default-browser-check",
              "--no-first-run",
              "--no-sandbox",
              "--no-zygote",
              "--password-store=basic",
              "--remote-debugging-port=0",
              "--test-type=gpu",
              "--use-mock-keychain",
              "about:blank",
            ];
            proc = spawn(chrome, args, { stdio: ["ignore", "pipe", "pipe"] });
            const lineBuffers = { stdout: "", stderr: "" };
            const onData = (stream) => (data) => {
              const text = data.toString();
              if (stream === "stderr") {
                process.stderr.write(text);
              } else {
                process.stdout.write(text);
              }
              lineBuffers[stream] += text;
              const lines = lineBuffers[stream].split(/\r?\n/);
              lineBuffers[stream] = lines.pop() ?? "";
              for (const line of lines) {
                const idx = line.indexOf(wsPrefix);
                if (idx === -1) continue;
                const rest = line.slice(idx + wsPrefix.length).trim();
                const candidate = rest.split(/\s+/)[0];
                if (
                  candidate.startsWith("ws://") ||
                  candidate.startsWith("wss://")
                ) {
                  wsUrl = candidate;
                }
              }
            };
            proc.stdout.on("data", onData("stdout"));
            proc.stderr.on("data", onData("stderr"));

            const url = await waitForWsUrl();
            const wsFoundMs = Date.now() - startTime;
            const wsFoundSec = (wsFoundMs / 1000).toFixed(2);
            const connectStart = Date.now();
            const path = require("node:path");
            const workspaceRoot = process.env.GITHUB_WORKSPACE || process.cwd();
            const playwrightPath = path.join(
              workspaceRoot,
              "packages/core/node_modules/playwright",
            );
            console.log(
              `✅ CDP Url found after ${wsFoundSec}s, connecting with playwright...`,
            );
            const { chromium } = require(playwrightPath);
            const browser = await chromium.connectOverCDP(url, {
              timeout: timeoutMs,
            });
            const context = browser.contexts()[0];
            if (!context) {
              throw new Error("❌ No browser context available after CDP connect");
            }
            const page = context.pages()[0];
            if (!page) {
              throw new Error("❌ No page available after CDP connect");
            }
            const remainingMs = timeoutMs - (Date.now() - connectStart);
            if (remainingMs <= 0) {
              throw new Error(
                `❌ CDP connect + verify timed out after ${timeoutMs}ms`,
              );
            }
            const sum = await Promise.race([
              page.evaluate("1 + 1"),
              new Promise((_, reject) =>
                setTimeout(
                  () =>
                    reject(
                      new Error(
                        `❌ CDP connect + verify timed out after ${timeoutMs}ms`,
                      ),
                    ),
                  remainingMs,
                ),
              ),
            ]);
            if (sum !== 2) {
              throw new Error(`❌ Unexpected eval result: ${sum}`);
            }
            const totalMs = Date.now() - startTime;
            const connectMs = Date.now() - connectStart;
            const totalSec = (totalMs / 1000).toFixed(2);
            const connectSec = (connectMs / 1000).toFixed(2);
            console.log(
              `✅ Chromium launched in ${wsFoundSec}s and CDP connected in ${connectSec}s (total: ${totalSec}s)`,
            );
            await browser.close();
            cleanup();
            process.exit(0);
          } catch (err) {
            cleanup();
            console.error(err instanceof Error ? err.message : String(err));
            process.exit(1);
          }
        })();
        NODE
          then
            if [ "$attempt" -gt 1 ]; then
              echo "⚠️ Chromium launch succeeded after ${attempt} attempts; GitHub Actions runner may be constrained."
            fi
            exit 0
          fi
          echo "⚠️ Chromium launch attempt ${attempt} failed."
          attempt=$((attempt + 1))
          sleep 2
        done
        echo "❌ Failed to launch Chromium before running Stagehand; GitHub Actions runner is likely overloaded."
        exit 1


================================================
FILE: .github/pull_request_template
================================================
# why

# what changed

# test plan


================================================
FILE: .github/workflows/ci.yml
================================================
name: Tests

on:
  pull_request:
    types:
      - opened
      - synchronize
      - labeled
      - unlabeled
    paths-ignore:
      - "packages/docs/**"

permissions:
  contents: read
  actions: write

env:
  BROWSERBASE_FLOW_LOGS: "1"
  LLM_MAX_MS: "15000"
  EVAL_MODELS: "openai/gpt-4.1,google/gemini-2.0-flash,anthropic/claude-haiku-4-5"
  EVAL_AGENT_MODELS: "computer-use-preview-2025-03-11,claude-sonnet-4-6"
  EVAL_CATEGORIES: "observe,act,combination,extract,targeted_extract,agent"
  EVAL_MAX_CONCURRENCY: 25
  EVAL_TRIAL_COUNT: 3
  LOCAL_SESSION_LIMIT_PER_E2E_TEST: 2
  BROWSERBASE_SESSION_LIMIT_PER_E2E_TEST: 3
  BROWSERBASE_REGION_DISTRIBUTION: "us-west-2=30,us-east-1=30,eu-central-1=20,ap-southeast-1=20"  # percentage of load for each region when running e2e tests against prod
  CHROME_PATH: /usr/bin/chromium # GitHub Actions runners ship with stable Chromium by default
  BROWSERBASE_CDP_CONNECT_MAX_MS: "10000"
  BROWSERBASE_SESSION_CREATE_MAX_MS: "60000"
  PUPPETEER_SKIP_DOWNLOAD: "1"
  PLAYWRIGHT_SKIP_DOWNLOAD: "1"
  TURBO_TELEMETRY_DISABLED: "1"

concurrency:
  group: ${{ github.workflow }}-${{ github.ref }}
  cancel-in-progress: true

jobs:
  # Classifies the files changed by the pull request into per-area flags
  # (core, cli, evals, server, docs-only) exposed as job outputs so later jobs
  # can gate on them.
  determine-changes:
    runs-on: ubuntu-latest
    outputs:
      core: ${{ steps.filter.outputs.core }}
      cli: ${{ steps.filter.outputs.cli }}
      evals: ${{ steps.filter.outputs.evals }}
      server: ${{ steps.filter.outputs.server }}
      docs-only: ${{ steps.filter.outputs.docs-only }}
    steps:
      - name: Check out repository code
        uses: actions/checkout@v4

      # Prints the rate-limit response headers and body for debugging. When
      # `.rate.remaining` is 0 the reset time is written to the step summary
      # (Pacific and UTC) and the job fails.
      - name: Log GitHub API rate limit
        env:
          GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
        run: |
          headers_file=$(mktemp)
          body_file=$(mktemp)
          curl -sSL \
            -D "$headers_file" \
            -o "$body_file" \
            -H "Accept: application/vnd.github+json" \
            -H "X-GitHub-Api-Version: 2022-11-28" \
            -H "Authorization: Bearer $GITHUB_TOKEN" \
            https://api.github.com/rate_limit
          cat "$headers_file"
          echo ""
          cat "$body_file"
          remaining=$(jq -r '.rate.remaining' "$body_file")
          if [ "$remaining" -eq 0 ]; then
            reset_epoch=$(jq -r '.rate.reset' "$body_file")
            reset_utc=$(date -u -d "@$reset_epoch" +"%Y-%m-%d %H:%M:%S")
            reset_pacific=$(TZ=America/Los_Angeles date -d "@$reset_epoch" +"%Y-%m-%d %H:%M:%S %Z")
            echo "Github API rate limited until: ${reset_pacific} (${reset_utc} UTC)" >> "$GITHUB_STEP_SUMMARY"
            echo "GitHub API rate limit exhausted."
            exit 1
          fi

      # Each filter becomes a 'true'/'false' output named after its key.
      # NOTE(review): `docs-only` combines positive globs with a negated one
      # ('!packages/**/*.md'). Under paths-filter's default "some" quantifier a
      # negated pattern may match nearly every changed file, which would make
      # this flag true for most PRs — confirm the intended semantics.
      - uses: dorny/paths-filter@v3
        id: filter
        with:
          filters: |
            core:
              - '.github/workflows/ci.yml'
              - 'packages/core/**'
              - 'package.json'
              - 'pnpm-lock.yaml'
              - 'turbo.json'
            cli:
              - 'packages/cli/**'
              - 'packages/core/**'
              - 'package.json'
              - 'pnpm-lock.yaml'
            evals:
              - 'packages/evals/**'
              - 'package.json'
              - 'pnpm-lock.yaml'
            server:
              - 'packages/server-v3/**'
              - 'packages/server-v4/**'
              - 'packages/core/**'
              - 'package.json'
              - 'pnpm-lock.yaml'
              - 'pnpm-workspace.yaml'
              - '.github/workflows/ci.yml'
            docs-only:
              - '**/*.md'
              - 'examples/**'
              - '!packages/**/*.md'

  # Decides which eval categories to run, based on the pull request's labels
  # and the change flags from determine-changes. Outputs `skip-all-evals`
  # ('true'/'false') and `eval-categories` (a JSON array of category names).
  determine-evals:
    needs: [determine-changes]
    runs-on: ubuntu-latest
    outputs:
      skip-all-evals: ${{ steps.check-labels.outputs.skip-all-evals }}
      eval-categories: ${{ steps.check-labels.outputs.eval-categories }}
    steps:
      # Order of checks:
      #   1. `skip-evals` label                      -> skip everything.
      #   2. docs-only is true while core and evals
      #      are both false                          -> skip everything.
      #   3. otherwise "regression" is added unless the
      #      `skip-regression-evals` label is present, followed by one
      #      category per matching label.
      # `add_category` ignores names it has already seen; `emit_categories`
      # builds the JSON array by hand and yields "[]" when nothing was added.
      # Note that the `targeted-extract` label maps to the `targeted_extract`
      # category (hyphen in the label, underscore in the category).
      - id: check-labels
        run: |
          categories=()
          declare -A seen
          add_category() {
            local category="$1"
            if [[ -z "${seen[$category]:-}" ]]; then
              categories+=("$category")
              seen["$category"]=1
            fi
          }

          emit_categories() {
            local json="["
            for category in "${categories[@]}"; do
              json+="\"${category}\","
            done
            json="${json%,}"
            json+="]"
            echo "eval-categories=$json" >> $GITHUB_OUTPUT
          }

          # Check if skip-evals label is present
          if [[ "${{ contains(github.event.pull_request.labels.*.name, 'skip-evals') }}" == "true" ]]; then
            echo "skip-evals label found - skipping all evals"
            echo "skip-all-evals=true" >> $GITHUB_OUTPUT
            emit_categories
            exit 0
          fi

          # Skip evals if only docs/examples changed
          if [[ "${{ needs.determine-changes.outputs.docs-only }}" == "true" && "${{ needs.determine-changes.outputs.core }}" == "false" && "${{ needs.determine-changes.outputs.evals }}" == "false" ]]; then
            echo "Only docs/examples changed - skipping evals"
            echo "skip-all-evals=true" >> $GITHUB_OUTPUT
            emit_categories
            exit 0
          fi

          # Check for skip-regression-evals label
          if [[ "${{ contains(github.event.pull_request.labels.*.name, 'skip-regression-evals') }}" == "true" ]]; then
            echo "skip-regression-evals label found - regression evals will be skipped"
          else
            echo "Regression evals will run by default"
            add_category "regression"
          fi

          # Check for specific labels
          echo "skip-all-evals=false" >> $GITHUB_OUTPUT
          if [[ "${{ contains(github.event.pull_request.labels.*.name, 'combination') }}" == "true" ]]; then
            add_category "combination"
          fi
          if [[ "${{ contains(github.event.pull_request.labels.*.name, 'extract') }}" == "true" ]]; then
            add_category "extract"
          fi
          if [[ "${{ contains(github.event.pull_request.labels.*.name, 'act') }}" == "true" ]]; then
            add_category "act"
          fi
          if [[ "${{ contains(github.event.pull_request.labels.*.name, 'observe') }}" == "true" ]]; then
            add_category "observe"
          fi
          if [[ "${{ contains(github.event.pull_request.labels.*.name, 'targeted-extract') }}" == "true" ]]; then
            add_category "targeted_extract"
          fi
          if [[ "${{ contains(github.event.pull_request.labels.*.name, 'agent') }}" == "true" ]]; then
            add_category "agent"
          fi
          emit_categories
      
  # Runs the `lint` task through Turbo once the build job has finished. Setup
  # downloads the pre-built artifacts and skips restoring the Turbo cache.
  run-lint:
    name: Lint
    runs-on: ubuntu-latest
    needs: [run-build]
    steps:
      - name: Check out repository code
        uses: actions/checkout@v4

      - uses: ./.github/actions/setup-node-pnpm-turbo
        with:
          use-prebuilt-artifacts: "true"
          restore-turbo-cache: "false"
          node-version: 20.x

      - name: Run Lint
        run: pnpm exec turbo run lint

  # Cancels the entire workflow run through the REST API when the lint job
  # fails. `always()` is required so this job is still evaluated after its
  # dependency failed; `continue-on-error` keeps a failed cancel request from
  # being reported as an additional failure. The cancel call relies on the
  # workflow-level `actions: write` permission.
  cancel-after-lint-failure:
    name: Cancel after lint failure
    runs-on: ubuntu-latest
    needs: [run-lint]
    if: ${{ always() && needs.run-lint.result == 'failure' }}
    continue-on-error: true
    steps:
      - name: Cancel workflow run
        env:
          GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
        run: |
          curl -sSfL -X POST \
            -H "Authorization: Bearer ${GITHUB_TOKEN}" \
            -H "Accept: application/vnd.github+json" \
            -H "X-GitHub-Api-Version: 2022-11-28" \
            "https://api.github.com/repos/${GITHUB_REPOSITORY}/actions/runs/${GITHUB_RUN_ID}/cancel"

  # Builds the workspace with Turbo and publishes the outputs as the
  # "build-artifacts" artifact. This job builds from source, so it does not
  # download pre-built artifacts itself.
  run-build:
    name: Build
    runs-on: ubuntu-latest
    steps:
      - name: Check out repository code
        uses: actions/checkout@v4

      - uses: ./.github/actions/setup-node-pnpm-turbo
        with:
          use-prebuilt-artifacts: "false"
          node-version: 20.x

      - name: Run Build
        run: pnpm exec turbo run build

      # `if: always()` saves the .turbo directory even when the build step
      # failed. The key matches the one used by the restore step in the setup
      # action.
      - name: Save Turbo cache
        if: always()
        uses: actions/cache/save@v4
        with:
          path: .turbo
          key: ${{ runner.os }}-turbo-${{ hashFiles('pnpm-lock.yaml', 'pnpm-workspace.yaml', 'package.json', 'turbo.json') }}-${{ github.sha }}

      # The artifact is kept for one day only (retention-days: 1).
      - name: Upload build artifacts
        uses: actions/upload-artifact@v4
        with:
          name: build-artifacts
          include-hidden-files: true
          # package.json is included to anchor artifact paths at repo root.
          path: |
            package.json
            packages/core/dist/**
            packages/core/lib/version.ts
            packages/core/lib/dom/build/**
            packages/core/lib/v3/dom/build/**
            packages/cli/dist/**
            packages/evals/dist/**
            packages/server-v3/dist/**
            packages/server-v3/openapi.v3.yaml
            packages/server-v4/dist/**
            packages/server-v4/openapi.v4.yaml
          retention-days: 1

  # CLI test job: runs only when determine-changes reports CLI changes, and
  # only after the Build job has finished.
  run-cli-tests:
    name: CLI Tests
    if: ${{ needs.determine-changes.outputs.cli == 'true' }}
    needs:
      - run-build
      - determine-changes
    runs-on: ubuntu-latest
    steps:
      - uses: actions/checkout@v4
        with: { fetch-depth: 1 }

      # Shared setup action, asked to use prebuilt artifacts and skip the Turbo
      # cache restore.
      - uses: ./.github/actions/setup-node-pnpm-turbo
        with:
          restore-turbo-cache: 'false'
          use-prebuilt-artifacts: 'true'

      - run: pnpm exec turbo run test:cli --filter=@browserbasehq/browse-cli
        name: Run CLI Tests

  # Discovery job: asks the core package's test:core script for its test list
  # (--list) and publishes it as job outputs; core-unit-tests builds its matrix
  # from them. Runs only when determine-changes reports core changes.
  discover-core-tests:
    runs-on: ubuntu-latest
    needs: [determine-changes]
    if: needs.determine-changes.outputs.core == 'true'
    outputs:
      # Value passed to fromJson() by core-unit-tests.
      core-tests: ${{ steps.set-matrix.outputs.core-tests }}
      # 'false' only when the list is exactly "[]".
      has-core-tests: ${{ steps.set-matrix.outputs.has-core-tests }}

    steps:
      - uses: actions/checkout@v4
        with:
          fetch-depth: 1

      # Does not wait for run-build, so prebuilt artifacts are not requested.
      - uses: ./.github/actions/setup-node-pnpm-turbo
        with:
          use-prebuilt-artifacts: "false"
          restore-turbo-cache: "false"

      # NOTE(review): the list is written to GITHUB_OUTPUT as a single
      # "key=value" line, so the script presumably prints single-line JSON — confirm.
      - name: Discover core test files
        id: set-matrix
        run: |
          core_json=$(pnpm --filter @browserbasehq/stagehand --silent run test:core -- --list)
          echo "core-tests=$core_json" >> $GITHUB_OUTPUT

          if [ "$core_json" = "[]" ]; then
            echo "has-core-tests=false" >> $GITHUB_OUTPUT
          else
            echo "has-core-tests=true" >> $GITHUB_OUTPUT
          fi

          echo "Found core tests: $core_json"

  # Core unit tests: one matrix job per entry discovered by discover-core-tests.
  # Each entry provides `name` (job/report label) and `path` (passed to the
  # test:core task).
  core-unit-tests:
    name: core/${{ matrix.test.name }}
    runs-on: ubuntu-latest
    needs: [run-build, discover-core-tests]
    # Skipped when discovery reported an empty list.
    if: needs.discover-core-tests.outputs.has-core-tests == 'true'
    env:
      STAGEHAND_BROWSER_TARGET: local
      STAGEHAND_SERVER_TARGET: local

    strategy:
      # One failing test file does not cancel the other matrix entries.
      fail-fast: false
      max-parallel: 100
      matrix:
        test: ${{ fromJson(needs.discover-core-tests.outputs.core-tests) }}

    steps:
      - uses: actions/checkout@v4
        with:
          fetch-depth: 1

      - uses: ./.github/actions/setup-node-pnpm-turbo
        with:
          use-prebuilt-artifacts: "true"
          restore-turbo-cache: "false"

      - name: Run Vitest - ${{ matrix.test.name }}
        run: |
          pnpm exec turbo run test:core --only --filter=@browserbasehq/stagehand -- "${{ matrix.test.path }}"

      # Report and coverage uploads run even when the test step failed.
      - uses: ./.github/actions/upload-ctrf-report
        if: always()
        with:
          name: ctrf/core-unit/${{ matrix.test.name }}.json

      - uses: ./.github/actions/upload-v8-coverage
        if: always()
        with:
          name: coverage/core-unit/${{ matrix.test.name }}

  # Discovery job: asks the server-v3 package's test:server script for its
  # integration test list (--list integration) and publishes it as job outputs;
  # server-integration-tests builds its matrix from them. Runs only when
  # determine-changes reports server changes.
  discover-server-tests:
    runs-on: ubuntu-latest
    needs: [determine-changes]
    if: needs.determine-changes.outputs.server == 'true'
    outputs:
      # Value passed to fromJson() by server-integration-tests.
      integration-tests: ${{ steps.set-matrix.outputs.integration-tests }}
      # 'false' only when the list is exactly "[]".
      has-integration-tests: ${{ steps.set-matrix.outputs.has-integration-tests }}

    steps:
      - uses: actions/checkout@v4
        with:
          fetch-depth: 1

      # Does not wait for run-build, so prebuilt artifacts are not requested.
      - uses: ./.github/actions/setup-node-pnpm-turbo
        with:
          use-prebuilt-artifacts: "false"
          restore-turbo-cache: "false"

      # NOTE(review): the list is written to GITHUB_OUTPUT as a single
      # "key=value" line, so the script presumably prints single-line JSON — confirm.
      - name: Discover server test files
        id: set-matrix
        run: |
          int_json=$(pnpm --filter @browserbasehq/stagehand-server-v3 --silent run test:server -- --list integration)
          echo "integration-tests=$int_json" >> $GITHUB_OUTPUT

          if [ "$int_json" = "[]" ]; then
            echo "has-integration-tests=false" >> $GITHUB_OUTPUT
          else
            echo "has-integration-tests=true" >> $GITHUB_OUTPUT
          fi

          echo "Found server integration tests: $int_json"

  # Calls the reusable v3 SEA build workflow after the Build job, passing a JSON
  # list of OS/arch targets plus one extra linux-x64 target with sourcemaps.
  build-server-sea:
    name: Build SEA binary (tests, v3)
    uses: ./.github/workflows/stagehand-server-v3-sea-build.yml
    needs: [run-build]
    with:
      # Passed as a JSON string; each entry names the runner OS, platform, arch,
      # output binary name and whether sourcemaps are included.
      matrix: |
        [
          {"os":"ubuntu-latest","platform":"linux","arch":"x64","binary_name":"stagehand-server-v3-linux-x64","include_sourcemaps":false},
          {"os":"ubuntu-24.04-arm","platform":"linux","arch":"arm64","binary_name":"stagehand-server-v3-linux-arm64","include_sourcemaps":false},
          {"os":"macos-15","platform":"darwin","arch":"arm64","binary_name":"stagehand-server-v3-darwin-arm64","include_sourcemaps":false},
          {"os":"macos-15-intel","platform":"darwin","arch":"x64","binary_name":"stagehand-server-v3-darwin-x64","include_sourcemaps":false},
          {"os":"windows-latest","platform":"win32","arch":"x64","binary_name":"stagehand-server-v3-win32-x64.exe","include_sourcemaps":false},
          {"os":"windows-11-arm","platform":"win32","arch":"arm64","binary_name":"stagehand-server-v3-win32-arm64.exe","include_sourcemaps":false},
          {"os":"ubuntu-latest","platform":"linux","arch":"x64","binary_name":"stagehand-server-v3-linux-x64-sourcemap","include_sourcemaps":true}
        ]
      use-prebuilt-artifacts: "true"
      restore-turbo-cache: "false"
      node-version: "20.x"
      # Same name as the artifact that server-integration-tests downloads.
      # NOTE(review): presumably only this binary is uploaded as an artifact —
      # confirm in the reusable workflow.
      upload-only-binary: stagehand-server-v3-linux-x64-sourcemap

  # Server v3 integration tests: one matrix job per entry discovered by
  # discover-server-tests, run with the linux-x64 sourcemap SEA binary built by
  # build-server-sea (STAGEHAND_SERVER_TARGET=sea).
  server-integration-tests:
    name: server/v3/integration/${{ matrix.test.name }}
    runs-on: ubuntu-latest
    needs: [build-server-sea, discover-server-tests, run-build]
    # Skipped when discovery reported an empty list.
    if: needs.discover-server-tests.outputs.has-integration-tests == 'true'

    strategy:
      # One failing test file does not cancel the other matrix entries.
      fail-fast: false
      matrix:
        test: ${{ fromJson(needs.discover-server-tests.outputs.integration-tests) }}

    env:
      BB_ENV: local
      STAGEHAND_BASE_URL: http://stagehand-api.localhost:3106
      STAGEHAND_BROWSER_TARGET: local
      STAGEHAND_SERVER_TARGET: sea
      OPENAI_API_KEY: ${{ secrets.OPENAI_API_KEY }}
      GEMINI_API_KEY: ${{ secrets.GEMINI_API_KEY }}
      ANTHROPIC_API_KEY: ${{ secrets.ANTHROPIC_API_KEY }}
      # Used only for testing /start with env: BROWSERBASE remote browser
      BROWSERBASE_API_KEY: ${{ secrets.BROWSERBASE_API_KEY }}
      BROWSERBASE_PROJECT_ID: ${{ secrets.BROWSERBASE_PROJECT_ID }}

    steps:
      - uses: actions/checkout@v4
        with:
          fetch-depth: 1

      - uses: ./.github/actions/setup-node-pnpm-turbo
        with:
          use-prebuilt-artifacts: "true"
          restore-turbo-cache: "false"

      # Extracted at the repo root; the next step expects the binary under
      # packages/server-v3/dist/sea/.
      - name: Download SEA binary
        uses: actions/download-artifact@v4
        with:
          name: stagehand-server-v3-linux-x64-sourcemap
          path: .

      # Fails early if the binary is missing, then sets the executable bit.
      - name: Ensure SEA binary is present and executable
        shell: bash
        run: |
          set -euo pipefail
          test -f packages/server-v3/dist/sea/stagehand-server-v3-linux-x64-sourcemap
          chmod +x packages/server-v3/dist/sea/stagehand-server-v3-linux-x64-sourcemap

      - name: Run server integration test - ${{ matrix.test.name }}
        env:
          SEA_BINARY_NAME: stagehand-server-v3-linux-x64-sourcemap
        run: |
          pnpm exec turbo run test:server --only --filter=@browserbasehq/stagehand-server-v3 -- "${{ matrix.test.path }}"

      # Report and coverage uploads run even when the test step failed.
      - uses: ./.github/actions/upload-ctrf-report
        if: always()
        with:
          name: ctrf/server-v3-integration/${{ matrix.test.name }}.json

      - uses: ./.github/actions/upload-v8-coverage
        if: always()
        with:
          name: coverage/server-v3-integration/${{ matrix.test.name }}

  # Discovery job: asks the core package's test:e2e script for its test list
  # (--list) and publishes it as job outputs; both e2e jobs (local and
  # browserbase) build their matrices from them. Runs only when
  # determine-changes reports core changes.
  discover-e2e-tests:
    runs-on: ubuntu-latest
    needs: [determine-changes]
    if: needs.determine-changes.outputs.core == 'true'
    outputs:
      # Value passed to fromJson() by the e2e jobs.
      e2e-tests: ${{ steps.set-matrix.outputs.e2e-tests }}
      # 'false' only when the list is exactly "[]".
      has-e2e-tests: ${{ steps.set-matrix.outputs.has-e2e-tests }}

    steps:
      - uses: actions/checkout@v4
        with:
          fetch-depth: 1

      # Does not wait for run-build, so prebuilt artifacts are not requested.
      - uses: ./.github/actions/setup-node-pnpm-turbo
        with:
          use-prebuilt-artifacts: "false"
          restore-turbo-cache: "false"

      # NOTE(review): the list is written to GITHUB_OUTPUT as a single
      # "key=value" line, so the script presumably prints single-line JSON — confirm.
      - name: Discover e2e test files
        id: set-matrix
        run: |
          e2e_json=$(pnpm --filter @browserbasehq/stagehand --silent run test:e2e -- --list)
          echo "e2e-tests=$e2e_json" >> $GITHUB_OUTPUT

          if [ "$e2e_json" = "[]" ]; then
            echo "has-e2e-tests=false" >> $GITHUB_OUTPUT
          else
            echo "has-e2e-tests=true" >> $GITHUB_OUTPUT
          fi

          echo "Found e2e tests: $e2e_json"

  # Local-browser E2E tests: one matrix job per discovered e2e test, with
  # STAGEHAND_BROWSER_TARGET=local.
  run-e2e-local-tests:
    name: e2e/local/${{ matrix.test.name }}
    needs: [run-build, discover-e2e-tests]
    runs-on: ubuntu-latest
    timeout-minutes: 50
    # Requires discovered tests and a PR whose head branch lives in this
    # repository (fork PRs are skipped).
    # NOTE(review): presumably because the secrets below are unavailable to forks — confirm.
    if: >
      needs.discover-e2e-tests.outputs.has-e2e-tests == 'true' &&
      github.event.pull_request.head.repo.full_name == github.repository
    env:
      OPENAI_API_KEY: ${{ secrets.OPENAI_API_KEY }}
      ANTHROPIC_API_KEY: ${{ secrets.ANTHROPIC_API_KEY }}
      GOOGLE_GENERATIVE_AI_API_KEY: ${{ secrets.GOOGLE_GENERATIVE_AI_API_KEY }}
      BROWSERBASE_API_KEY: ${{ secrets.BROWSERBASE_API_KEY }}
      BROWSERBASE_PROJECT_ID: ${{ secrets.BROWSERBASE_PROJECT_ID }}
      HEADLESS: true
      STAGEHAND_BROWSER_TARGET: local
      STAGEHAND_SERVER_TARGET: local
    strategy:
      # One failing test file does not cancel the other matrix entries.
      fail-fast: false
      max-parallel: 20
      matrix:
        test: ${{ fromJson(needs.discover-e2e-tests.outputs.e2e-tests) }}
    steps:
      - name: Check out repository code
        uses: actions/checkout@v4

      - uses: ./.github/actions/setup-node-pnpm-turbo
        with:
          use-prebuilt-artifacts: "true"
          restore-turbo-cache: "false"

      # Local composite action run before the tests (only in this local-browser job).
      - uses: ./.github/actions/verify-chromium-launch

      - name: Run local E2E Tests - ${{ matrix.test.name }}
        run: |
          pnpm exec turbo run test:e2e --only --filter=@browserbasehq/stagehand -- "${{ matrix.test.path }}"

      # Report and coverage uploads run even when the test step failed.
      - uses: ./.github/actions/upload-ctrf-report
        if: always()
        with:
          name: ctrf/e2e-local/${{ matrix.test.name }}.json

      - uses: ./.github/actions/upload-v8-coverage
        if: always()
        with:
          name: coverage/e2e-local/${{ matrix.test.name }}

  # Browserbase E2E tests: same discovered test matrix as the local E2E job,
  # but with STAGEHAND_BROWSER_TARGET=browserbase.
  run-e2e-bb-tests:
    name: e2e/bb/${{ matrix.test.name }}
    needs: [run-build, discover-e2e-tests]
    runs-on: ubuntu-latest
    timeout-minutes: 50
    # Requires discovered tests and a PR whose head branch lives in this
    # repository (fork PRs are skipped).
    # NOTE(review): presumably because the secrets below are unavailable to forks — confirm.
    if: >
      needs.discover-e2e-tests.outputs.has-e2e-tests == 'true' &&
      github.event.pull_request.head.repo.full_name == github.repository
    env:
      OPENAI_API_KEY: ${{ secrets.OPENAI_API_KEY }}
      ANTHROPIC_API_KEY: ${{ secrets.ANTHROPIC_API_KEY }}
      GOOGLE_GENERATIVE_AI_API_KEY: ${{ secrets.GOOGLE_GENERATIVE_AI_API_KEY }}
      BROWSERBASE_API_KEY: ${{ secrets.BROWSERBASE_API_KEY }}
      BROWSERBASE_PROJECT_ID: ${{ secrets.BROWSERBASE_PROJECT_ID }}
      HEADLESS: true
      STAGEHAND_BROWSER_TARGET: browserbase
      STAGEHAND_SERVER_TARGET: local
    strategy:
      # One failing test file does not cancel the other matrix entries.
      fail-fast: false
      max-parallel: 100
      matrix:
        test: ${{ fromJson(needs.discover-e2e-tests.outputs.e2e-tests) }}
    steps:
      - name: Check out repository code
        uses: actions/checkout@v4

      - uses: ./.github/actions/setup-node-pnpm-turbo
        with:
          use-prebuilt-artifacts: "true"
          restore-turbo-cache: "false"

      # NOTE(review): BROWSERBASE_REGION_DISTRIBUTION is not set in this job's
      # env; presumably defined at workflow level — confirm.
      - name: Select Browserbase region
        uses: ./.github/actions/select-browserbase-region
        with:
          distribution: ${{ env.BROWSERBASE_REGION_DISTRIBUTION }}

      - name: Run E2E Tests (browserbase) - ${{ matrix.test.name }}
        run: |
          pnpm exec turbo run test:e2e --only --filter=@browserbasehq/stagehand -- "${{ matrix.test.path }}"

      # Report and coverage uploads run even when the test step failed.
      - uses: ./.github/actions/upload-ctrf-report
        if: always()
        with:
          name: ctrf/e2e-bb/${{ matrix.test.name }}.json

      - uses: ./.github/actions/upload-v8-coverage
        if: always()
        with:
          name: coverage/e2e-bb/${{ matrix.test.name }}

  # Eval job: one matrix entry per category selected by determine-evals. Runs
  # the eval suite against Browserbase, surfaces the printed summary in the job
  # summary, and fails CI when the category score is below 80%.
  run-evals:
    name: evals/${{ matrix.category }}
    needs: [run-build, determine-evals, run-e2e-bb-tests]
    # always() lets evals run when run-e2e-bb-tests was skipped. They are still
    # blocked when that job failed or was cancelled, when evals are skipped
    # globally, or when no categories were selected.
    if: >-
      ${{
        always() &&
        needs.run-build.result == 'success' &&
        needs.determine-evals.result == 'success' &&
        needs.run-e2e-bb-tests.result != 'failure' &&
        needs.run-e2e-bb-tests.result != 'cancelled' &&
        needs.determine-evals.outputs.skip-all-evals != 'true' &&
        needs.determine-evals.outputs.eval-categories != '[]'
      }}
    runs-on: ubuntu-latest
    timeout-minutes: 90
    strategy:
      # One failing category does not cancel the others.
      fail-fast: false
      matrix:
        category: ${{ fromJson(needs.determine-evals.outputs.eval-categories) }}
    env:
      OPENAI_API_KEY: ${{ secrets.OPENAI_API_KEY }}
      ANTHROPIC_API_KEY: ${{ secrets.ANTHROPIC_API_KEY }}
      GOOGLE_GENERATIVE_AI_API_KEY: ${{ secrets.GOOGLE_GENERATIVE_AI_API_KEY }}
      BRAINTRUST_API_KEY: ${{ secrets.BRAINTRUST_API_KEY }}
      BROWSERBASE_API_KEY: ${{ secrets.BROWSERBASE_API_KEY }}
      BROWSERBASE_PROJECT_ID: ${{ secrets.BROWSERBASE_PROJECT_ID }}
      STAGEHAND_BROWSER_TARGET: browserbase
      STAGEHAND_SERVER_TARGET: local
    steps:
      - name: Check out repository code
        uses: actions/checkout@v4

      - uses: ./.github/actions/setup-node-pnpm-turbo
        with:
          use-prebuilt-artifacts: "true"
          restore-turbo-cache: "false"

      # NOTE(review): BROWSERBASE_REGION_DISTRIBUTION is not set in this job's
      # env; presumably defined at workflow level — confirm.
      - name: Select Browserbase region
        uses: ./.github/actions/select-browserbase-region
        with:
          distribution: ${{ env.BROWSERBASE_REGION_DISTRIBUTION }}

      # NOTE(review): EVAL_TRIAL_COUNT and EVAL_MAX_CONCURRENCY are not set in
      # this job; presumably defined at workflow level — confirm.
      - name: Run Evals - ${{ matrix.category }}
        id: run-evals
        env:
          NODE_V8_COVERAGE: coverage/evals/${{ matrix.category }}
        run: |
          log_file="$(mktemp)"
          # Disable errexit so the summary can still be extracted when the eval
          # run fails. PIPESTATUS[0] is the exit code of the eval command, not tee.
          set +e
          pnpm exec turbo run test:evals --only --filter=@browserbasehq/stagehand-evals -- "${{ matrix.category }}" -t "${EVAL_TRIAL_COUNT}" -c "${EVAL_MAX_CONCURRENCY}" 2>&1 | tee "$log_file"
          eval_status=${PIPESTATUS[0]}
          set -e

          # Capture everything from the SUMMARY banner through the
          # "Evaluation summary written to" line.
          summary_block="$(
            awk '
              /^=========================SUMMARY=========================$/ { capture=1 }
              capture { print }
              /^Evaluation summary written to / { capture=0 }
            ' "$log_file"
          )"

          # Expose the multi-line summary as a step output (heredoc syntax).
          if [ -n "$summary_block" ]; then
            {
              echo "summary_text<<EOF"
              echo "$summary_block"
              echo "EOF"
            } >> "$GITHUB_OUTPUT"
          fi

          # Propagate the eval command's exit status as the step result.
          exit "$eval_status"

      - name: Log Evals Performance - ${{ matrix.category }}
        env:
          EVAL_STDOUT_SUMMARY: ${{ steps.run-evals.outputs.summary_text }}
        run: |
          if [ -n "${EVAL_STDOUT_SUMMARY:-}" ]; then
            echo "### Evals Summary (${{ matrix.category }})" >> "$GITHUB_STEP_SUMMARY"
            echo '```' >> "$GITHUB_STEP_SUMMARY"
            printf '%s\n' "$EVAL_STDOUT_SUMMARY" >> "$GITHUB_STEP_SUMMARY"
            echo '```' >> "$GITHUB_STEP_SUMMARY"
          fi
          # Read eval-summary.json only after confirming it exists. Reading it
          # first made jq abort the step (default shell is bash -e) before the
          # explicit "Eval summary not found" message could be printed.
          if [ -f eval-summary.json ]; then
            experimentName=$(jq -r '.experimentName' eval-summary.json)
            echo "View results at https://www.braintrust.dev/app/Browserbase/p/stagehand/experiments/${experimentName}"
            category_score=$(jq ".categories[\"${{ matrix.category }}\"]" eval-summary.json)
            echo "${{ matrix.category }} category score: $category_score%"
            # bc handles non-integer scores; the gate is a fixed 80% threshold.
            if (( $(echo "$category_score < 80" | bc -l) )); then
              echo "${{ matrix.category }} category score is below 80%. Failing CI."
              exit 1
            fi
          else
            echo "Eval summary not found for ${{ matrix.category }} category. Failing CI."
            exit 1
          fi

      # Report and coverage uploads run even when an earlier step failed.
      - uses: ./.github/actions/upload-ctrf-report
        if: always()
        with:
          name: ctrf/evals/${{ matrix.category }}.json

      - uses: ./.github/actions/upload-v8-coverage
        if: always()
        with:
          name: coverage/evals/${{ matrix.category }}

  # Coverage/report aggregation job: downloads the per-job V8 coverage and CTRF
  # artifacts, merges them, publishes summaries and posts a non-blocking
  # "Measured coverage" commit status. Currently disabled via `if: false`.
  merge-coverage:
    name: Code Coverage Report
    runs-on: ubuntu-latest
    needs:
      - core-unit-tests
      - run-e2e-local-tests
      - run-e2e-bb-tests
      - run-evals
      - server-integration-tests
    # Job is switched off; restore `if: always()` to re-enable it.
    # if: always()
    if: false
    steps:
      - uses: actions/checkout@v4
        with:
          fetch-depth: 1

      - uses: ./.github/actions/setup-node-pnpm-turbo
        with:
          use-prebuilt-artifacts: "true"
          restore-turbo-cache: "false"

      # Downloads are best-effort: missing artifacts must not fail the report.
      - name: Download V8 coverage artifacts
        uses: actions/download-artifact@v4
        continue-on-error: true
        with:
          pattern: coverage-*
          path: .
          merge-multiple: true

      - name: Download CTRF artifacts
        uses: actions/download-artifact@v4
        continue-on-error: true
        with:
          pattern: ctrf-*
          path: .
          merge-multiple: true

      - name: Generate merged coverage report
        run: |
          pnpm run coverage:merge

      - name: Upload merged coverage report
        if: always()
        id: upload-coverage-artifact
        uses: actions/upload-artifact@v4
        with:
          name: coverage-merged
          # package.json is included to anchor artifact paths at repo root.
          path: |
            package.json
            coverage/merged

      # Writes the text summary (when present) and a link to the uploaded
      # artifact into the job summary.
      - name: Add coverage summary to job summary
        if: always()
        shell: bash
        run: |
          echo "### Code Coverage" >> "$GITHUB_STEP_SUMMARY"
          echo "" >> "$GITHUB_STEP_SUMMARY"
          if [ -f coverage/merged/coverage-summary.txt ]; then
            echo '```' >> "$GITHUB_STEP_SUMMARY"
            cat coverage/merged/coverage-summary.txt >> "$GITHUB_STEP_SUMMARY"
            echo '```' >> "$GITHUB_STEP_SUMMARY"
          else
            echo "Coverage summary not available." >> "$GITHUB_STEP_SUMMARY"
          fi
          if [ -n "${{ steps.upload-coverage-artifact.outputs.artifact-url }}" ]; then
            echo "" >> "$GITHUB_STEP_SUMMARY"
            echo "[Download full HTML coverage report](${{ steps.upload-coverage-artifact.outputs.artifact-url }})" >> "$GITHUB_STEP_SUMMARY"
          fi

      - name: Publish merged CTRF report
        if: always()
        uses: ctrf-io/github-test-reporter@v1
        with:
          report-path: './ctrf/**/*.json'
          summary: true
          summary-report: false
          summary-delta-report: true
          test-report: false
          failed-report: false
          insights-report: true
          flaky-rate-report: true
          fail-rate-report: true
          slowest-report: true
          previous-results-report: true
          fetch-previous-results: true
          baseline: 1
          previous-results-max: 1
          max-workflow-runs-to-check: 5
          max-previous-runs-to-fetch: 1
          upload-artifact: true
          artifact-name: ctrf-report-merged
        env:
          GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}

      # Sums the failed-test counts across all CTRF reports and reads the
      # "Lines" percentage from the merged coverage summary; both default to 0.
      - name: Compute coverage status metrics
        if: always()
        id: coverage-status
        shell: bash
        run: |
          set -euo pipefail
          shopt -s globstar nullglob
          tests_failed=0
          ctrf_files=(ctrf/**/*.json)
          if [ "${#ctrf_files[@]}" -gt 0 ]; then
            tests_failed=$(jq -s '[.[].results.summary.failed // 0] | add' "${ctrf_files[@]}")
          fi
          total_coverage=0
          if [ -f coverage/merged/coverage-summary.txt ]; then
            total_coverage=$(awk '/^Lines/ {gsub(/%/,"",$3); print $3}' coverage/merged/coverage-summary.txt)
          fi
          echo "tests_failed=${tests_failed}" >> "$GITHUB_OUTPUT"
          echo "total_coverage=${total_coverage}" >> "$GITHUB_OUTPUT"

      # Posts an always-"success" commit status carrying the metrics above.
      - name: Set coverage status
        if: always()
        continue-on-error: true
        shell: bash
        env:
          GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
          RUN_ID: ${{ github.run_id }}
          PULL_NUMBER: ${{ github.event.pull_request.number }}
          # On pull_request events GITHUB_SHA is the temporary merge commit, so
          # a status posted there never appears on the PR. Target the PR head
          # commit when available and fall back to github.sha for other events.
          STATUS_SHA: ${{ github.event.pull_request.head.sha || github.sha }}
          TESTS_FAILED: ${{ steps.coverage-status.outputs.tests_failed }}
          TOTAL_COVERAGE: ${{ steps.coverage-status.outputs.total_coverage }}
        run: |
          set -euo pipefail
          repo="${GITHUB_REPOSITORY}"
          sha="${STATUS_SHA:-${GITHUB_SHA}}"
          tests_failed="${TESTS_FAILED:-0}"
          total_coverage="${TOTAL_COVERAGE:-0}"
          # Report only: the status never blocks the commit.
          state="success"
          if [ -n "${PULL_NUMBER:-}" ]; then
            target_url="https://github.com/${repo}/pull/${PULL_NUMBER}/checks?check_run_id=${RUN_ID}"
          else
            target_url="https://github.com/${repo}/actions/runs/${RUN_ID}"
          fi
          description="non-blocking report: ${tests_failed} tests failed. ${total_coverage}% coverage"
          # Build the JSON body with jq so values are escaped correctly.
          payload=$(jq -n \
            --arg state "$state" \
            --arg target_url "$target_url" \
            --arg description "$description" \
            --arg context "Measured coverage" \
            '{state: $state, target_url: $target_url, description: $description, context: $context}')
          curl -sSfL -X POST \
            -H "Authorization: Bearer ${GITHUB_TOKEN}" \
            -H "Accept: application/vnd.github+json" \
            -H "X-GitHub-Api-Version: 2022-11-28" \
            "https://api.github.com/repos/${repo}/statuses/${sha}" \
            -d "$payload"


================================================
FILE: .github/workflows/claude.yml
================================================
# Workflow that runs the Claude Code action when "@claude" is mentioned in an
# issue, an issue comment, a PR review or a PR review comment.
name: Claude Code

on:
  issue_comment:
    types: [created]
  pull_request_review_comment:
    types: [created]
  issues:
    types: [opened, assigned]
  pull_request_review:
    types: [submitted]

env:
  BROWSERBASE_FLOW_LOGS: "1"

jobs:
  claude:
    # One clause per trigger: each checks the text field that event carries
    # (comment body, review body, or issue body/title) for "@claude".
    if: |
      (github.event_name == 'issue_comment' && contains(github.event.comment.body, '@claude')) ||
      (github.event_name == 'pull_request_review_comment' && contains(github.event.comment.body, '@claude')) ||
      (github.event_name == 'pull_request_review' && contains(github.event.review.body, '@claude')) ||
      (github.event_name == 'issues' && (contains(github.event.issue.body, '@claude') || contains(github.event.issue.title, '@claude')))
    runs-on: ubuntu-latest
    permissions:
      contents: write
      pull-requests: write
      issues: write
      id-token: write
      actions: write # Required for Claude to read CI results on PRs / rerun actions that failed
    steps:
      - name: Checkout repository
        uses: actions/checkout@v6
        with:
          fetch-depth: 1

      # Builds from source here; no prebuilt artifacts exist in this workflow.
      - uses: ./.github/actions/setup-node-pnpm-turbo
        with:
          use-prebuilt-artifacts: "false"
          restore-turbo-cache: "false"
          node-version: 20.x

      # The workspace is built before the Claude Code step runs.
      - name: Run Build
        run: |
          pnpm exec turbo run build

      - name: Run Claude Code
        id: claude
        uses: anthropics/claude-code-action@v1
        with:
          anthropic_api_key: ${{ secrets.ANTHROPIC_API_KEY }}

          # This is an optional setting that allows Claude to read CI results on PRs
          additional_permissions: |
            actions: read

          track_progress: true

          # Optional: Give a custom prompt to Claude. If this is not specified, Claude will perform the instructions specified in the comment that tagged it.
          prompt: 'Make sure "turbo run lint" and "turbo run build" pass before pushing and make sure to check present CI status for the branch and fix any easy failures. Prefer using the Github MCP tools over bash for Github operations, fall back to Bash(gh) for anything not supported by the MCP tools.'

          # Value passed to the action's branch_prefix input.
          branch_prefix: 'claude-'
          # Optional: Add claude_args to customize behavior and configuration
          # See https://github.com/anthropics/claude-code-action/blob/main/docs/usage.md
          # or https://code.claude.com/docs/en/cli-reference for available options
          claude_args: |
            --allowed-tools mcp__github_inline_comment__create_inline_comment,Bash,View,Glob,GlobTool,GrepTool,Grep,BatchTool,WebSearch,LS,Edit,MultiEdit,Write,Read

# consider adding in the future:
# - https://github.com/anthropics/claude-code-action/blob/main/examples/test-failure-analysis.yml
# - https://github.com/anthropics/claude-code-action/blob/main/examples/ci-failure-auto-fix.yml
# - https://github.com/anthropics/claude-code-action/blob/main/examples/issue-deduplication.yml


================================================
FILE: .github/workflows/external-contributor-pr-approval-handoff.yml
================================================
# Read-only workflow that records each submitted PR review as a small JSON
# artifact. The "External Contributor PR" workflow is triggered (workflow_run)
# when this workflow completes.
name: External Contributor PR Approval Handoff

on:
  pull_request_review:
    types:
      - submitted

# Only read scopes are granted to this workflow.
permissions:
  contents: read
  pull-requests: read

jobs:
  capture-approved-review:
    runs-on: ubuntu-latest
    steps:
      # Writes approval-handoff.json with: shouldClaim (true only for an
      # approving review on a PR whose head repo differs from this repository),
      # the PR number, reviewer login, review id and the approved commit SHA
      # (falling back to the PR head SHA).
      - name: Write approval handoff payload
        uses: actions/github-script@v7
        with:
          github-token: ${{ secrets.GITHUB_TOKEN }}
          script: |
            const fs = require('fs');
            const pr = context.payload.pull_request;
            const review = context.payload.review;
            const shouldClaim =
              review.state === 'approved' &&
              pr.head.repo.full_name !== context.payload.repository.full_name;

            const payload = {
              shouldClaim,
              prNumber: pr.number,
              reviewer: review.user?.login || '',
              reviewId: review.id,
              approvedSha: review.commit_id || pr.head.sha,
            };

            fs.writeFileSync('approval-handoff.json', JSON.stringify(payload));

      # Short-lived (1 day) artifact named "approved-review".
      # NOTE(review): presumably downloaded by the workflow_run-triggered
      # workflow — confirm there.
      - name: Upload approval handoff artifact
        uses: actions/upload-artifact@v4
        with:
          name: approved-review
          path: approval-handoff.json
          retention-days: 1


================================================
FILE: .github/workflows/external-contributor-pr.yml
================================================
# Workflow for pull requests from external contributors. Triggered by PR
# lifecycle events (via pull_request_target) and by completion of the
# "External Contributor PR Approval Handoff" workflow.
name: External Contributor PR

on:
  pull_request_target:
    types:
      - opened
      - reopened
      - synchronize
      - closed
  # Fires whenever the approval-handoff workflow finishes.
  workflow_run:
    workflows:
      - External Contributor PR Approval Handoff
    types:
      - completed

# Write scopes on contents, pull requests and issues; read-only on actions.
permissions:
  actions: read
  contents: write
  pull-requests: write
  issues: write

env:
  ECPR_LIB: |
    (() => {
      // Labels used by the external contributor flow; each entry carries the
      // name, color and description passed to the label-creation call.
      const LABELS = [
        { name: 'external-contributor', color: '8b949e', description: 'Tracks PRs mirrored from external contributor forks.' },
        { name: 'external-contributor:awaiting-approval', color: 'd29922', description: 'Waiting for a stagehand team member to approve the latest external commit.' },
        { name: 'external-contributor:mirrored', color: '1f6feb', description: 'An internal mirrored PR currently exists for this external contributor PR.' },
        { name: 'external-contributor:stale', color: 'db6d28', description: 'The mirrored PR is stale and waiting for a fresh approval to refresh.' },
        { name: 'external-contributor:completed', color: '2da44e', description: 'The mirrored PR has been merged and the external contributor flow is complete.' },
      ];
      // Names of the labels above, for fast membership checks.
      const MANAGED_LABELS = new Set(LABELS.map((label) => label.name));
      // Only comments authored by this login are treated as written by the workflow.
      const MANAGED_COMMENT_AUTHOR = 'github-actions[bot]';
      // Hidden HTML-comment marker for a claim. Captures: owned PR number,
      // 40-hex source SHA, claimer login, branch name.
      const CLAIM_RE = /<!-- external-contributor-pr:claim owned-pr=(\d+) source-sha=([0-9a-f]{40}) claimer=([A-Za-z0-9-]+) branch=([^ ]+) -->/;
      // Hidden HTML-comment marker for an owned PR. Captures: source PR number,
      // 40-hex source SHA, claimer login.
      const OWNED_RE = /<!-- external-contributor-pr:owned source-pr=(\d+) source-sha=([0-9a-f]{40}) claimer=([A-Za-z0-9-]+) -->/;
      // Marker that identifies the notice comment so it can be found and updated in place.
      const NOTICE_MARKER = '<!-- external-contributor-pr:notice -->';
      // Body lines of the notice comment posted on external contributor PRs.
      const NOTICE_LINES = [
        'This PR is from an external contributor and must be approved by a stagehand team member with write access before CI can run.',
        'Approving the latest commit mirrors it into an internal PR owned by the approver.',
        'If new commits are pushed later, the internal PR stays open but is marked stale until someone approves the latest external commit and refreshes it.',
      ];

      // Make sure every label in LABELS exists in the repository. A label is
      // created only when the lookup returns 404; a 422 from the create call
      // is ignored. Any other error is rethrown.
      async function ensureLabels(github, context) {
        for (const { name, color, description } of LABELS) {
          let missing = false;
          try {
            await github.rest.issues.getLabel({ owner: context.repo.owner, repo: context.repo.repo, name });
          } catch (lookupError) {
            if (lookupError.status !== 404) throw lookupError;
            missing = true;
          }
          if (!missing) continue;

          try {
            await github.rest.issues.createLabel({
              owner: context.repo.owner,
              repo: context.repo.repo,
              name,
              color,
              description,
            });
          } catch (createError) {
            if (createError.status !== 422) throw createError;
          }
        }
      }

      // Return all comments on the given issue/PR, paginating 100 per page.
      async function listComments(github, context, issueNumber) {
        const { owner, repo } = context.repo;
        const query = { owner, repo, issue_number: issueNumber, per_page: 100 };
        return github.paginate(github.rest.issues.listComments, query);
      }

      // True when the comment's author login is MANAGED_COMMENT_AUTHOR.
      function isManagedComment(comment) {
        const authorLogin = comment.user?.login;
        return authorLogin === MANAGED_COMMENT_AUTHOR;
      }

      // Default branch name for a PR number: "external-contributor-pr-<number>".
      function defaultManagedBranch(prNumber) {
        return 'external-contributor-pr-'.concat(prNumber);
      }

      // Accept `branch` only if it is the default managed branch for this PR,
      // optionally followed by "-" and a suffix of letters, digits, ".", "_"
      // or "-". Anything else (including an empty value) yields the default.
      function sanitizeManagedBranch(prNumber, branch) {
        const fallback = defaultManagedBranch(prNumber);
        if (branch) {
          const allowed = new RegExp(`^external-contributor-pr-${prNumber}(?:-[A-Za-z0-9._-]+)?$`);
          if (allowed.test(branch)) return branch;
        }
        return fallback;
      }

      // Create or update the single managed comment identified by `marker`.
      // The body is the marker followed by `lines`, newline-joined. An existing
      // managed comment containing the marker is edited only when its body
      // differs; otherwise a new comment is created.
      async function upsertComment(github, context, issueNumber, marker, lines) {
        const allComments = await listComments(github, context, issueNumber);
        const body = [marker, ...lines].join('\n');
        const previous = allComments.find((candidate) => isManagedComment(candidate) && candidate.body?.includes(marker));

        if (previous) {
          if (previous.body !== body) {
            await github.rest.issues.updateComment({ owner: context.repo.owner, repo: context.repo.repo, comment_id: previous.id, body });
          }
          return;
        }

        await github.rest.issues.createComment({ owner: context.repo.owner, repo: context.repo.repo, issue_number: issueNumber, body });
      }

      // Replace the managed labels on an issue/PR with `desiredLabels`, keeping
      // every label that is not in MANAGED_LABELS.
      async function syncLabels(github, context, issueNumber, desiredLabels) {
        const response = await github.rest.issues.get({
          owner: context.repo.owner,
          repo: context.repo.repo,
          issue_number: issueNumber,
        });

        // Label entries may be plain strings or objects with a `name`.
        const unmanaged = [];
        for (const entry of response.data.labels) {
          const labelName = typeof entry === 'string' ? entry : entry.name;
          if (labelName && !MANAGED_LABELS.has(labelName)) {
            unmanaged.push(labelName);
          }
        }

        await github.rest.issues.setLabels({
          owner: context.repo.owner,
          repo: context.repo.repo,
          issue_number: issueNumber,
          labels: [...unmanaged, ...desiredLabels],
        });
      }

      // Scan the issue's comments from newest to oldest and return the first
      // managed comment that carries a claim marker, parsed into
      // { ownedPrNumber, sourceSha, claimer, branch }. Returns undefined when
      // no such comment exists.
      async function findLatestClaim(github, context, issueNumber) {
        const comments = await listComments(github, context, issueNumber);
        for (let index = comments.length - 1; index >= 0; index -= 1) {
          const candidate = comments[index];
          if (!isManagedComment(candidate)) continue;

          const parsed = candidate.body?.match(CLAIM_RE);
          if (!parsed) continue;

          const [, ownedPr, sourceSha, claimer, rawBranch] = parsed;
          return {
            ownedPrNumber: Number(ownedPr),
            sourceSha,
            claimer,
            // The branch from the comment is re-validated against this PR number.
            branch: sanitizeManagedBranch(issueNumber, rawBranch),
          };
        }
        return undefined;
      }

      /**
       * React to `opened`, `reopened` and other (e.g. `synchronize`) events on an
       * external contributor PR.
       *
       * - opened / reopened: post the notice comment. If a reopened PR still sits
       *   at the SHA of its latest claim and the mirrored PR is open, label it
       *   mirrored, explain, and close it again; otherwise label it as awaiting
       *   approval.
       * - any other action: when the head SHA moved past the latest claim and the
       *   mirrored PR is still open, mark the mirrored PR stale, mark this PR as
       *   awaiting approval, reopen this PR if it is closed, and comment on both.
       *
       * @param github Octokit client handed in by the caller.
       * @param context Workflow context; reads `payload.pull_request` and `payload.action`.
       */
      async function externalLifecycle({ github, context }) {
        const pr = context.payload.pull_request;
        const repoRef = { owner: context.repo.owner, repo: context.repo.repo };

        // Thin wrappers so each step below reads as a single intent.
        const fetchPull = async (number) => {
          const response = await github.rest.pulls.get({ ...repoRef, pull_number: number });
          return response.data;
        };
        const postComment = (number, body) =>
          github.rest.issues.createComment({ ...repoRef, issue_number: number, body });
        const setPullState = (number, state) =>
          github.rest.pulls.update({ ...repoRef, pull_number: number, state });
        const markAwaitingApproval = () =>
          syncLabels(github, context, pr.number, ['external-contributor', 'external-contributor:awaiting-approval']);

        await ensureLabels(github, context);

        const wasReopened = context.payload.action === 'reopened';
        if (context.payload.action === 'opened' || wasReopened) {
          await upsertComment(github, context, pr.number, NOTICE_MARKER, NOTICE_LINES);
          const latestClaim = await findLatestClaim(github, context, pr.number);

          const reopenedAtClaimedSha = wasReopened && latestClaim && latestClaim.sourceSha === pr.head.sha;
          if (reopenedAtClaimedSha) {
            const ownedPr = await fetchPull(latestClaim.ownedPrNumber);
            if (ownedPr.state === 'open') {
              await syncLabels(github, context, pr.number, ['external-contributor', 'external-contributor:mirrored']);
              await postComment(
                pr.number,
                `This external contributor PR is already mirrored to ${ownedPr.html_url}. Closing it again so discussion stays on the internal PR until fresh commits require another approval.`,
              );
              await setPullState(pr.number, 'closed');
              return;
            }
          }

          await markAwaitingApproval();
          return;
        }

        const latestClaim = await findLatestClaim(github, context, pr.number);
        const headMovedPastClaim = latestClaim && latestClaim.sourceSha !== pr.head.sha;
        if (!headMovedPastClaim) return;

        const ownedPr = await fetchPull(latestClaim.ownedPrNumber);
        if (ownedPr.state !== 'open') return;

        await markAwaitingApproval();
        await syncLabels(github, context, ownedPr.number, ['external-contributor', 'external-contributor:stale']);
        await upsertComment(github, context, ownedPr.number, '<!-- external-contributor-pr:owned-status -->', [
          `This mirrored PR is stale because the original external contributor PR #${pr.number} received new commits (\`${latestClaim.sourceSha}\` -> \`${pr.head.sha}\`).`,
          `Original PR: ${pr.html_url}`,
          '',
          'Approve the latest external commit to refresh this same internal PR in place.',
        ]);

        if (pr.state === 'closed') {
          await setPullState(pr.number, 'open');
        }

        await postComment(
          ownedPr.number,
          `New commits landed on external contributor PR #${pr.number} (\`${latestClaim.sourceSha}\` -> \`${pr.head.sha}\`). This mirrored PR stays open but is now stale until the latest external commit is approved and copied over.`,
        );
        await postComment(
          pr.number,
          `New commits were pushed to this external contributor PR (\`${latestClaim.sourceSha}\` -> \`${pr.head.sha}\`). The mirrored PR ${ownedPr.html_url} remains open but is marked stale. A stagehand team member with write access must approve the latest commit to refresh that internal PR.`,
        );
      }

      /**
       * Validate an approval handoff artifact and publish the step outputs that
       * the branch-refresh and finalize steps consume.
       *
       * `should-claim` is set to `'false'` up front and only flipped to `'true'`
       * once every check has passed:
       *   1. the artifact carries `shouldClaim`, `prNumber`, `reviewer`, `approvedSha`;
       *   2. the PR is open and its head is not this repository;
       *   3. the reviewer has admin/maintain/write permission (otherwise a comment
       *      explaining the refusal is posted on the PR);
       *   4. the PR head SHA still equals the approved SHA.
       *
       * Outputs on success: `should-claim`, `claimer`, `pr-number`, `source-sha`,
       * `previous-source-sha`, `branch`, `title`, `body`, `owned-pr-number`,
       * `owned-pr-merged`.
       *
       * @param github Octokit client handed in by the caller.
       * @param context Workflow context; reads `repo` and `payload.repository`.
       * @param core Actions core helper used for `setOutput`.
       * @param artifactPath Path to the JSON handoff file written by the approval workflow.
       */
      async function prepareClaim({ github, context, core, artifactPath }) {
        const fs = require('fs');
        const handoff = JSON.parse(fs.readFileSync(artifactPath, 'utf8'));
        core.setOutput('should-claim', 'false');
        if (!handoff.shouldClaim || !handoff.prNumber || !handoff.reviewer || !handoff.approvedSha) return;

        const { data: pr } = await github.rest.pulls.get({
          owner: context.repo.owner,
          repo: context.repo.repo,
          pull_number: Number(handoff.prNumber),
        });
        // `head.repo` is null when the contributor's fork has been deleted; such a
        // PR is still external, so use optional chaining instead of crashing on
        // the property access.
        if (pr.head.repo?.full_name === context.payload.repository.full_name || pr.state !== 'open') return;

        const { data: permission } = await github.rest.repos.getCollaboratorPermissionLevel({
          owner: context.repo.owner,
          repo: context.repo.repo,
          username: handoff.reviewer,
        });
        if (!new Set(['admin', 'maintain', 'write']).has(permission.permission)) {
          await github.rest.issues.createComment({
            owner: context.repo.owner,
            repo: context.repo.repo,
            issue_number: pr.number,
            body: `@${handoff.reviewer} submitted an approving review, but only stagehand team members with write access can claim external contributor PRs. A maintainer with write access must approve the latest commit to proceed.`,
          });
          return;
        }
        // The approval only counts for the exact commit that was reviewed.
        if (pr.head.sha !== handoff.approvedSha) return;

        // Reuse the branch recorded by an earlier claim, if any, so the same
        // mirrored PR is refreshed in place.
        const latestClaim = await findLatestClaim(github, context, pr.number);
        const branch = sanitizeManagedBranch(pr.number, latestClaim?.branch);
        const title = `[Claimed #${pr.number}] ${pr.title}`;
        const body = [
          `Mirrored from external contributor PR #${pr.number} after approval by @${handoff.reviewer}.`,
          '',
          `Original author: @${pr.user.login}`,
          `Original PR: ${pr.html_url}`,
          `Approved source head SHA: \`${pr.head.sha}\``,
          '',
          `@${pr.user.login}, please continue any follow-up discussion on this mirrored PR. When the external PR gets new commits, this same internal PR will be marked stale until the latest external commit is approved and refreshed here.`,
          '',
          '## Original description',
          pr.body?.trim() || '_No description provided._',
          '',
          `<!-- external-contributor-pr:owned source-pr=${pr.number} source-sha=${pr.head.sha} claimer=${handoff.reviewer} -->`,
        ].join('\n');

        // Look for an existing PR (open, closed or merged) from the managed branch.
        const { data: ownedPrs } = await github.rest.pulls.list({
          owner: context.repo.owner,
          repo: context.repo.repo,
          state: 'all',
          head: `${context.repo.owner}:${branch}`,
          base: 'main',
          per_page: 100,
        });

        core.setOutput('should-claim', 'true');
        core.setOutput('claimer', handoff.reviewer);
        core.setOutput('pr-number', String(pr.number));
        core.setOutput('source-sha', pr.head.sha);
        core.setOutput('previous-source-sha', latestClaim?.sourceSha || '');
        core.setOutput('branch', branch);
        core.setOutput('title', title);
        core.setOutput('body', body);
        core.setOutput('owned-pr-number', ownedPrs[0] ? String(ownedPrs[0].number) : '');
        core.setOutput('owned-pr-merged', ownedPrs[0]?.merged_at ? 'true' : 'false');
      }

      /**
       * Finish a claim after the branch-refresh step has run.
       *
       * When `refreshStatus` is not `'updated'`, the existing mirrored PR (if any)
       * is labelled stale with an explanatory status comment, the external PR is
       * labelled as awaiting approval and receives a comment, and nothing else
       * happens.
       *
       * Otherwise the mirrored PR is updated in place (or created when none exists
       * or the previous one was merged), the claimer is assigned, both PRs are
       * labelled mirrored, the status comment is refreshed, a claim marker comment
       * is recorded on the external PR, and the external PR is closed.
       *
       * @param github Octokit client handed in by the caller.
       * @param context Workflow context; reads `repo` and `serverUrl`.
       * @param input Values produced by the prepare and refresh steps:
       *   `prNumber` (number), `sourceSha`, `branch`, `claimer`, `title`, `body`,
       *   `existingNumber` (string, empty when no mirrored PR exists),
       *   `existingMerged` (boolean), `refreshStatus`, `refreshReason`.
       */
      async function finalizeClaim({ github, context, input }) {
        await ensureLabels(github, context);
        const {
          prNumber,
          sourceSha,
          branch,
          claimer,
          title,
          body,
          existingNumber,
          existingMerged,
          refreshStatus,
          refreshReason,
        } = input;

        if (refreshStatus !== 'updated') {
          if (existingNumber) {
            await syncLabels(github, context, Number(existingNumber), ['external-contributor', 'external-contributor:stale']);
            await upsertComment(github, context, Number(existingNumber), '<!-- external-contributor-pr:owned-status -->', [
              `This mirrored PR could not be refreshed automatically after approval by @${claimer}.`,
              '',
              `Refresh reason: \`${refreshReason || 'unknown'}\``,
              'Resolve the branch manually, then keep using this same mirrored PR.',
            ]);
          }
          await syncLabels(github, context, prNumber, ['external-contributor', 'external-contributor:awaiting-approval']);
          await github.rest.issues.createComment({
            owner: context.repo.owner,
            repo: context.repo.repo,
            issue_number: prNumber,
            body: `The latest approval by @${claimer} could not refresh the mirrored PR automatically (${refreshReason || 'unknown reason'}). The external PR stays open, and the mirrored PR should be updated manually before work continues.`,
          });
          return;
        }

        let ownedPr;
        if (existingNumber && !existingMerged) {
          // Reuse (and reopen, if needed) the mirrored PR that already exists.
          const { data } = await github.rest.pulls.update({
            owner: context.repo.owner,
            repo: context.repo.repo,
            pull_number: Number(existingNumber),
            title,
            body,
            base: 'main',
            state: 'open',
          });
          ownedPr = data;
        } else {
          // No mirrored PR yet, or the previous one was merged: open a new one.
          const { data } = await github.rest.pulls.create({
            owner: context.repo.owner,
            repo: context.repo.repo,
            title,
            body,
            head: branch,
            base: 'main',
          });
          ownedPr = data;
        }

        await github.rest.issues.addAssignees({
          owner: context.repo.owner,
          repo: context.repo.repo,
          issue_number: ownedPr.number,
          assignees: [claimer],
        });
        await syncLabels(github, context, prNumber, ['external-contributor', 'external-contributor:mirrored']);
        await syncLabels(github, context, ownedPr.number, ['external-contributor', 'external-contributor:mirrored']);
        await upsertComment(github, context, ownedPr.number, '<!-- external-contributor-pr:owned-status -->', [
          `This mirrored PR tracks external contributor PR #${prNumber} at source SHA \`${sourceSha}\`, approved by @${claimer}.`,
          `Original PR: ${context.serverUrl}/${context.repo.owner}/${context.repo.repo}/pull/${prNumber}`,
          '',
          'When the external PR gets new commits, this same internal PR will be refreshed in place after the latest external commit is approved.',
        ]);

        const marker = `<!-- external-contributor-pr:claim owned-pr=${ownedPr.number} source-sha=${sourceSha} claimer=${claimer} branch=${branch} -->`;
        const comments = await listComments(github, context, prNumber);
        // Only a managed comment counts as an existing claim record. This matches
        // findLatestClaim, which ignores non-managed comments; without the check a
        // marker pasted by anyone else would suppress the real claim comment and
        // later lookups would find no claim at all.
        const alreadyRecorded = comments.some(
          (comment) => isManagedComment(comment) && comment.body?.includes(marker),
        );
        if (!alreadyRecorded) {
          await github.rest.issues.createComment({
            owner: context.repo.owner,
            repo: context.repo.repo,
            issue_number: prNumber,
            body: [marker, `This PR was approved by @${claimer} and mirrored to ${ownedPr.html_url}. All further discussion should happen on that PR.`].join('\n'),
          });
        }

        // Close the external PR so discussion moves to the mirrored PR.
        const { data: externalPr } = await github.rest.pulls.get({
          owner: context.repo.owner,
          repo: context.repo.repo,
          pull_number: prNumber,
        });
        if (externalPr.state !== 'closed') {
          await github.rest.pulls.update({ owner: context.repo.owner, repo: context.repo.repo, pull_number: prNumber, state: 'closed' });
        }
      }

      /**
       * Keep an external PR in step with its mirrored (internal) PR when the
       * mirrored PR is closed, merged or reopened.
       *
       * Does nothing unless the mirrored PR body matches `OWNED_RE`, which yields
       * the source PR number and source SHA.
       *
       * - reopened: label both PRs mirrored and close the external PR if open.
       * - merged: label both PRs completed and leave completion comments on both.
       * - closed without merge: label the mirrored PR stale and the external PR
       *   awaiting approval; if the external head moved, only note the staleness,
       *   otherwise reopen the external PR and comment on both.
       *
       * @param github Octokit client handed in by the caller.
       * @param context Workflow context; reads `payload.pull_request` and `payload.action`.
       */
      async function syncOwnedPr({ github, context }) {
        const pr = context.payload.pull_request;
        const ownedMarker = pr.body?.match(OWNED_RE);
        if (!ownedMarker) return;

        const [, rawSourceNumber, sourceSha] = ownedMarker;
        const sourcePrNumber = Number(rawSourceNumber);
        const repoRef = { owner: context.repo.owner, repo: context.repo.repo };
        const STATUS_MARKER = '<!-- external-contributor-pr:owned-status -->';

        // Label the mirrored PR first, then the external PR.
        const relabelPair = async (ownedStateLabel, sourceStateLabel) => {
          await syncLabels(github, context, pr.number, ['external-contributor', ownedStateLabel]);
          await syncLabels(github, context, sourcePrNumber, ['external-contributor', sourceStateLabel]);
        };
        const setSourceState = (state) =>
          github.rest.pulls.update({ ...repoRef, pull_number: sourcePrNumber, state });

        await ensureLabels(github, context);

        const { data: externalPr } = await github.rest.pulls.get({ ...repoRef, pull_number: sourcePrNumber });

        if (context.payload.action === 'reopened') {
          await relabelPair('external-contributor:mirrored', 'external-contributor:mirrored');
          if (externalPr.state !== 'closed') {
            await setSourceState('closed');
          }
          return;
        }

        if (pr.merged) {
          await relabelPair('external-contributor:completed', 'external-contributor:completed');
          await upsertComment(github, context, pr.number, STATUS_MARKER, [
            `This mirrored PR has been merged into \`main\`. The original external PR ${externalPr.html_url} is now completed.`,
          ]);
          await upsertComment(github, context, sourcePrNumber, `<!-- external-contributor-pr:completed owned-pr=${pr.number} -->`, [
            `The mirrored PR ${pr.html_url} has been merged into \`main\`. This original external contributor PR will stay closed as completed.`,
          ]);
          return;
        }

        // Closed without merge from here on.
        await relabelPair('external-contributor:stale', 'external-contributor:awaiting-approval');

        const sourceHeadMoved = externalPr.head.sha !== sourceSha;
        if (sourceHeadMoved) {
          await upsertComment(github, context, pr.number, STATUS_MARKER, [
            `This mirrored PR is stale because the original external PR ${externalPr.html_url} now points at a different source SHA.`,
            'Approve the latest external commit to refresh this same internal PR.',
          ]);
          return;
        }

        if (externalPr.state === 'closed') {
          await setSourceState('open');
        }
        await upsertComment(github, context, sourcePrNumber, `<!-- external-contributor-pr:owned-closed owned-pr=${pr.number} -->`, [
          `The mirrored PR ${pr.html_url} was closed without merge. This original PR has been reopened and is awaiting a fresh approving review from a stagehand team member with write access.`,
        ]);
        await upsertComment(github, context, pr.number, STATUS_MARKER, [
          `This mirrored PR was closed without merge. The original external PR ${externalPr.html_url} has been reopened and relabeled as awaiting approval.`,
        ]);
      }

      return { externalLifecycle, prepareClaim, finalizeClaim, syncOwnedPr };
    })()

concurrency:
  group: ${{ github.workflow }}-${{ github.event.pull_request.number || github.event.workflow_run.id }}
  cancel-in-progress: false

jobs:
  # Handles pull_request_target events for PRs whose head repository is not this
  # repository (i.e. external contributor PRs).
  manage-external-pr:
    if: github.event_name == 'pull_request_target' && github.event.pull_request.head.repo.full_name != github.repository
    runs-on: ubuntu-latest
    steps:
      # Only opened / reopened / synchronize actions are processed. The script
      # evaluates the shared library from the ECPR_LIB environment variable and
      # delegates to its externalLifecycle entry point.
      - name: Sync external PR lifecycle
        if: github.event.action == 'opened' || github.event.action == 'reopened' || github.event.action == 'synchronize'
        uses: actions/github-script@v7
        with:
          github-token: ${{ secrets.GITHUB_TOKEN }}
          script: |
            const lib = eval(process.env.ECPR_LIB);
            await lib.externalLifecycle({ github, context });

  # Runs after a successful workflow_run: consumes the approval handoff artifact,
  # refreshes the internal branch from the external PR head, and then creates or
  # updates the mirrored PR.
  claim-approved-pr:
    if: github.event_name == 'workflow_run' && github.event.workflow_run.conclusion == 'success'
    runs-on: ubuntu-latest
    steps:
      # Pulls the `approved-review` artifact from the triggering run into
      # ./approval-handoff.
      - name: Download approval handoff artifact
        uses: actions/download-artifact@v4
        with:
          name: approved-review
          path: approval-handoff
          github-token: ${{ secrets.GITHUB_TOKEN }}
          repository: ${{ github.repository }}
          run-id: ${{ github.event.workflow_run.id }}

      # Validates the handoff and emits the outputs used by every later step;
      # all later steps are gated on `should-claim == 'true'`.
      - name: Prepare approved claim
        id: prepare-claim
        uses: actions/github-script@v7
        with:
          github-token: ${{ secrets.GITHUB_TOKEN }}
          script: |
            const lib = eval(process.env.ECPR_LIB);
            await lib.prepareClaim({ github, context, core, artifactPath: 'approval-handoff/approval-handoff.json' });

      # Full history is fetched because the refresh step below rebases.
      - name: Checkout repository for branch operations
        if: steps.prepare-claim.outputs.should-claim == 'true'
        uses: actions/checkout@v4
        with:
          fetch-depth: 0
          persist-credentials: true

      # Creates the internal branch from the external PR head when it does not
      # exist yet; otherwise rebases the internal branch's commits made on top of
      # PREVIOUS_SOURCE_SHA onto the new external head.
      #
      # Outputs (written by an EXIT trap so they are always emitted):
      #   refresh-status: "updated" on success, "conflict" otherwise
      #   reason:         short failure code; omitted when empty
      # Every failure path exits 0 and the step is continue-on-error, so the
      # finalize step decides what to do based on these outputs.
      - name: Refresh internal branch
        if: steps.prepare-claim.outputs.should-claim == 'true'
        id: refresh-branch
        continue-on-error: true
        env:
          INTERNAL_BRANCH: ${{ steps.prepare-claim.outputs.branch }}
          PR_NUMBER: ${{ steps.prepare-claim.outputs.pr-number }}
          PREVIOUS_SOURCE_SHA: ${{ steps.prepare-claim.outputs.previous-source-sha }}
          GH_TOKEN: ${{ secrets.GITHUB_TOKEN }}
        run: |
          set -uo pipefail

          refresh_status="conflict"
          refresh_reason="unknown"

          write_outputs() {
            echo "refresh-status=${refresh_status}" >> "$GITHUB_OUTPUT"
            if [ -n "${refresh_reason}" ]; then
              echo "reason=${refresh_reason}" >> "$GITHUB_OUTPUT"
            fi
          }

          trap write_outputs EXIT

          if ! git config user.name "github-actions[bot]"; then
            refresh_reason="git-config-failed"
            exit 0
          fi

          if ! git config user.email "41898282+github-actions[bot]@users.noreply.github.com"; then
            refresh_reason="git-config-failed"
            exit 0
          fi

          if ! git remote set-url origin "https://x-access-token:${GH_TOKEN}@github.com/${GITHUB_REPOSITORY}.git"; then
            refresh_reason="remote-auth-failed"
            exit 0
          fi

          if ! git fetch origin "pull/${PR_NUMBER}/head:refs/remotes/origin/external-pr-head-${PR_NUMBER}"; then
            refresh_reason="fetch-external-failed"
            exit 0
          fi

          external_ref="refs/remotes/origin/external-pr-head-${PR_NUMBER}"
          branch_exists=false
          if git ls-remote --exit-code --heads origin "${INTERNAL_BRANCH}" >/dev/null 2>&1; then
            branch_exists=true
            if ! git fetch origin "${INTERNAL_BRANCH}:refs/remotes/origin/${INTERNAL_BRANCH}"; then
              refresh_reason="fetch-internal-failed"
              exit 0
            fi
          fi

          if [ "${branch_exists}" = false ]; then
            if ! git checkout -B "${INTERNAL_BRANCH}" "${external_ref}"; then
              refresh_reason="checkout-failed"
              exit 0
            fi

            if ! git push --force-with-lease origin "HEAD:refs/heads/${INTERNAL_BRANCH}"; then
              refresh_reason="push-failed"
              exit 0
            fi

            refresh_status="updated"
            refresh_reason=""
            exit 0
          fi

          if ! git checkout -B "${INTERNAL_BRANCH}" "refs/remotes/origin/${INTERNAL_BRANCH}"; then
            refresh_reason="checkout-failed"
            exit 0
          fi

          if [ -z "${PREVIOUS_SOURCE_SHA}" ]; then
            refresh_reason="missing-previous-source"
            exit 0
          fi

          if git rebase --onto "${external_ref}" "${PREVIOUS_SOURCE_SHA}" "${INTERNAL_BRANCH}"; then
            if ! git push --force-with-lease origin "HEAD:refs/heads/${INTERNAL_BRANCH}"; then
              refresh_reason="push-failed"
              exit 0
            fi

            refresh_status="updated"
            refresh_reason=""
            exit 0
          fi

          git rebase --abort || true
          refresh_reason="rebase-conflict"

      # Runs even when earlier steps failed (always()), as long as the claim was
      # accepted. String outputs are injected through toJson so they arrive as
      # quoted JavaScript string literals.
      - name: Finalize approved claim
        if: always() && steps.prepare-claim.outputs.should-claim == 'true'
        uses: actions/github-script@v7
        with:
          github-token: ${{ secrets.GITHUB_TOKEN }}
          script: |
            const lib = eval(process.env.ECPR_LIB);
            await lib.finalizeClaim({
              github,
              context,
              input: {
                prNumber: Number('${{ steps.prepare-claim.outputs.pr-number }}'),
                sourceSha: ${{ toJson(steps.prepare-claim.outputs.source-sha) }},
                branch: ${{ toJson(steps.prepare-claim.outputs.branch) }},
                claimer: ${{ toJson(steps.prepare-claim.outputs.claimer) }},
                title: ${{ toJson(steps.prepare-claim.outputs.title) }},
                body: ${{ toJson(steps.prepare-claim.outputs.body) }},
                existingNumber: ${{ toJson(steps.prepare-claim.outputs.owned-pr-number) }},
                existingMerged: '${{ steps.prepare-claim.outputs.owned-pr-merged }}' === 'true',
                refreshStatus: ${{ toJson(steps.refresh-branch.outputs.refresh-status) }},
                refreshReason: ${{ toJson(steps.refresh-branch.outputs.reason) }},
              },
            });

  # Handles closed / reopened pull_request_target events for PRs whose head
  # repository is this repository. The library function returns early unless the
  # PR body carries the owned-PR marker.
  sync-owned-pr:
    if: github.event_name == 'pull_request_target' && github.event.pull_request.head.repo.full_name == github.repository && (github.event.action == 'closed' || github.event.action == 'reopened')
    runs-on: ubuntu-latest
    steps:
      # Evaluates the shared library from ECPR_LIB and delegates to syncOwnedPr.
      - name: Sync mirrored PR lifecycle
        uses: actions/github-script@v7
        with:
          github-token: ${{ secrets.GITHUB_TOKEN }}
          script: |
            const lib = eval(process.env.ECPR_LIB);
            await lib.syncOwnedPr({ github, context });


================================================
FILE: .github/workflows/feature-parity.yml
================================================
name: Feature Parity

on:
  pull_request:
    types:
      - opened
      - synchronize
      - labeled
      - unlabeled
    paths-ignore:
      - "packages/docs/**"

jobs:
  # Runs only when the `parity` label is added to a PR. Verifies that the actor
  # has write access, then files a tracking issue in the Python SDK repository
  # and links it back on the PR.
  check-parity-label:
    runs-on: ubuntu-latest
    if: github.event.action == 'labeled' && github.event.label.name == 'parity'
    permissions:
      contents: read
      pull-requests: write
      issues: write
    steps:
      - name: Check out repository code
        uses: actions/checkout@v4

      # Looks up the actor's collaborator permission. Without admin/write access
      # the label is removed, an explanatory comment is posted, and the step
      # throws so the remaining steps do not run.
      - name: Check user permissions
        uses: actions/github-script@v7
        with:
          github-token: ${{ secrets.GITHUB_TOKEN }}
          script: |
            const { data: permission } = await github.rest.repos.getCollaboratorPermissionLevel({
              owner: context.repo.owner,
              repo: context.repo.repo,
              username: context.actor
            });

            const hasWriteAccess = ['admin', 'write'].includes(permission.permission);

            if (!hasWriteAccess) {
              // Remove the parity label if user doesn't have write access
              await github.rest.issues.removeLabel({
                owner: context.repo.owner,
                repo: context.repo.repo,
                issue_number: context.issue.number,
                name: 'parity'
              });

              // Add a comment explaining why the label was removed
              await github.rest.issues.createComment({
                owner: context.repo.owner,
                repo: context.repo.repo,
                issue_number: context.issue.number,
                body: `❌ **Parity Label Removed**\n\n@${context.actor}, you do not have sufficient permissions to add the 'parity' label. Only users with write access can trigger feature parity issues.\n\nIf you believe this feature should be implemented in the Python SDK, please ask a maintainer to add the label.`
              });

              throw new Error(`User ${context.actor} does not have write access to add parity label`);
            }

            console.log(`User ${context.actor} has ${permission.permission} access - proceeding with parity workflow`);

      # NOTE(review): the token is requested for the `stagehand` repository only,
      # while the next step creates an issue in `browserbase/stagehand-python`.
      # Confirm the generated token can actually access that repository.
      - name: Generate GitHub App token
        id: generate-token
        uses: actions/create-github-app-token@v1
        with:
          app-id: ${{ secrets.PARITY_APP_ID }}
          private-key: ${{ secrets.PARITY_APP_PRIVATE_KEY }}
          owner: browserbase
          repositories: stagehand

      # Builds the issue body from the PR title/description, the changed file
      # list and the last three comments returned (each truncated to 500
      # characters), creates the issue, then comments on the PR with its URL.
      # NOTE(review): listComments and listFiles are called without pagination,
      # so only the first page of results is considered — confirm this is
      # acceptable for PRs with many comments or files.
      - name: Create issue in Python SDK repository
        uses: actions/github-script@v7
        with:
          github-token: ${{ steps.generate-token.outputs.token }}
          script: |
            const { data: pullRequest } = await github.rest.pulls.get({
              owner: context.repo.owner,
              repo: context.repo.repo,
              pull_number: context.issue.number,
            });

            // Get PR comments for additional context
            const { data: comments } = await github.rest.issues.listComments({
              owner: context.repo.owner,
              repo: context.repo.repo,
              issue_number: context.issue.number,
            });

            // Format comments for the issue description
            let commentsSection = '';
            if (comments.length > 0) {
              commentsSection = '\n\n## Recent Comments\n\n';
              comments.slice(-3).forEach(comment => {
                commentsSection += `**@${comment.user.login}** commented:\n`;
                commentsSection += `${comment.body.substring(0, 500)}${comment.body.length > 500 ? '...' : ''}\n\n`;
              });
            }

            // Get list of changed files for context
            const { data: files } = await github.rest.pulls.listFiles({
              owner: context.repo.owner,
              repo: context.repo.repo,
              pull_number: context.issue.number,
            });

            const changedFiles = files.map(file => `- \`${file.filename}\``).join('\n');

            const issueTitle = `[Feature Parity] ${pullRequest.title}`;
            const issueBody = `## Feature Parity Request

            This issue was automatically created from a pull request in the TypeScript Stagehand repository that was labeled with 'parity'.

            ### Original PR Details
            - **PR**: #${context.issue.number} - ${pullRequest.title}
            - **Author**: @${pullRequest.user.login}
            - **Link**: ${pullRequest.html_url}

            ### Description
            ${pullRequest.body || 'No description provided.'}

            ### Changed Files
            ${changedFiles}

            ${commentsSection}

            ### Action Required
            Please review the changes in the original PR and implement equivalent functionality in the Python SDK if applicable.

            ---
            *This issue was automatically generated by the Feature Parity workflow.*`;

            // Create the issue in the Python repository
            const { data: issue } = await github.rest.issues.create({
              owner: 'browserbase',
              repo: 'stagehand-python',
              title: issueTitle,
              body: issueBody,
              labels: ['parity']
            });

            console.log(`Created issue: ${issue.html_url}`);

            // Add a comment to the original PR confirming the issue was created
            await github.rest.issues.createComment({
              owner: context.repo.owner,
              repo: context.repo.repo,
              issue_number: context.issue.number,
              body: `🔄 **Feature Parity Issue Created**\n\nAn issue has been automatically created in the Python SDK repository to track parity implementation:\n${issue.html_url}`
            });


================================================
FILE: .github/workflows/release.yml
================================================
name: Release

on:
  push:
    branches:
      - main

permissions:
  contents: write
  pull-requests: write
  id-token: write

concurrency: ${{ github.workflow }}-${{ github.ref }}

jobs:
  # Lints and builds the workspace, then lets changesets/action either open a
  # release pull request or run `pnpm run release`, and finally runs the canary
  # release script.
  release:
    name: Release
    runs-on: ubuntu-latest
    steps:
      # Full history (fetch-depth 0) is checked out.
      - name: Checkout Repo
        uses: actions/checkout@v6
        with:
          fetch-depth: 0

      - uses: ./.github/actions/setup-node-pnpm-turbo
        with:
          use-prebuilt-artifacts: "false"

      # Points npm at the public registry; the workflow grants `id-token: write`.
      - name: Configure npm registry for Trusted Publishing
        uses: actions/setup-node@v6
        with:
          node-version: 20.x
          registry-url: "https://registry.npmjs.org"

      - name: Update npm for Trusted Publishing
        run: npm install -g npm@latest

      - name: Run Lint & Build
        run: pnpm exec turbo run lint && pnpm exec turbo run build

      - name: Create Release Pull Request or Publish to npm
        id: changesets
        uses: changesets/action@v1
        with:
          publish: pnpm run release
        env:
          GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}

      # Guarded on the main ref; re-checks out `main` before running the canary
      # release script.
      - name: Publish Canary
        if: github.ref == 'refs/heads/main'
        run: |
          git checkout main
          pnpm run release-canary
        env:
          GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}


================================================
FILE: .github/workflows/stagehand-server-v3-release.yml
================================================
name: Release stagehand/server-v3

on:
  push:
    branches:
      - main
    paths:
      - .changeset/**
  workflow_dispatch:

permissions:
  contents: write

concurrency: ${{ github.workflow }}-${{ github.ref }}

env:
  OAS_PATH: packages/server-v3/openapi.v3.yaml

jobs:
  detect:
    name: Detect server-v3 release (changesets)
    runs-on: ubuntu-latest
    outputs:
      release: ${{ steps.meta.outputs.release }}
      version: ${{ steps.meta.outputs.version }}
      tag: ${{ steps.meta.outputs.tag }}
    steps:
      - name: Checkout repository
        uses: actions/checkout@v4
        with:
          fetch-depth: 1
          fetch-tags: true

      - uses: ./.github/actions/setup-node-pnpm-turbo
        env:
          PLAYWRIGHT_SKIP_BROWSER_DOWNLOAD: "1"
        with:
          use-prebuilt-artifacts: "false"

      # Decides whether @browserbasehq/stagehand-server-v3 has a pending release
      # and publishes `release`, `version` and `tag` as step outputs.
      - name: Determine release metadata
        id: meta
        shell: bash
        run: |
          set -euo pipefail

          # Highest existing server-v3 tag by version sort; empty when none exists.
          latest_tag="$(git tag -l 'stagehand-server-v3/v*' --sort=-v:refname | head -n 1 || true)"
          rm -f changeset-status.json
          if [ -n "${latest_tag}" ]; then
            pnpm changeset status --since "${latest_tag}" --output changeset-status.json
          else
            pnpm changeset status --output changeset-status.json
          fi

          node <<'NODE'
          const fs = require('fs');

          const PACKAGE_NAME = '@browserbasehq/stagehand-server-v3';

          const status = JSON.parse(fs.readFileSync('changeset-status.json', 'utf8'));
          const changesets = Array.isArray(status.changesets) ? status.changesets : [];
          const releases = Array.isArray(status.releases) ? status.releases : [];

          // Release only when at least one changeset names the server package itself.
          const shouldRelease = changesets.some((cs) =>
            (cs.releases || []).some((r) => r?.name === PACKAGE_NAME)
          );

          const serverRelease = releases.find((r) => r?.name === PACKAGE_NAME);
          if (shouldRelease && !serverRelease?.newVersion) {
            throw new Error(
              'Expected @browserbasehq/stagehand-server-v3 to have a computed newVersion in changeset-status.json.'
            );
          }

          const release = shouldRelease ? 'true' : 'false';
          const version = shouldRelease ? serverRelease.newVersion : '';
          // Keep the tag empty when nothing is released instead of emitting the
          // malformed value "stagehand-server-v3/v".
          const tag = shouldRelease ? `stagehand-server-v3/v${version}` : '';

          const out = process.env.GITHUB_OUTPUT;
          fs.appendFileSync(out, `release=${release}\n`);
          fs.appendFileSync(out, `version=${version}\n`);
          fs.appendFileSync(out, `tag=${tag}\n`);
          NODE

      # Creates and pushes the annotated release tag at the triggering commit,
      # unless a tag with that name already exists locally or on the remote.
      - name: Create stagehand/server-v3 tag
        if: steps.meta.outputs.release == 'true'
        env:
          GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
          # Expression values reach the script as environment variables instead
          # of being interpolated into the shell source.
          TAG: ${{ steps.meta.outputs.tag }}
          VERSION: ${{ steps.meta.outputs.version }}
          TARGET_SHA: ${{ github.sha }}
        shell: bash
        run: |
          set -euo pipefail

          git config user.name "github-actions[bot]"
          git config user.email "41898282+github-actions[bot]@users.noreply.github.com"

          # Try to fetch the tag if it exists on remote; ignore failure for new tags
          git fetch --force origin "refs/tags/${TAG}:refs/tags/${TAG}" 2>/dev/null || true
          if git rev-parse -q --verify "refs/tags/${TAG}" >/dev/null; then
            echo "Tag already exists: ${TAG}"
            exit 0
          fi

          git tag -a "${TAG}" "${TARGET_SHA}" -m "stagehand/server-v3 v${VERSION}"
          git push origin "${TAG}"

  # Delegates to the reusable SEA build workflow; skipped unless `detect`
  # reported a pending release.
  build_binaries:
    name: Build SEA binaries
    if: needs.detect.outputs.release == 'true'
    needs: [detect]
    uses: ./.github/workflows/stagehand-server-v3-sea-build.yml
    with:
      # One entry per binary: runner image, target platform/arch, output file name.
      matrix: |
        [
          {"os":"ubuntu-latest","platform":"linux","arch":"x64","binary_name":"stagehand-server-v3-linux-x64","include_sourcemaps":false},
          {"os":"ubuntu-24.04-arm","platform":"linux","arch":"arm64","binary_name":"stagehand-server-v3-linux-arm64","include_sourcemaps":false},
          {"os":"macos-15","platform":"darwin","arch":"arm64","binary_name":"stagehand-server-v3-darwin-arm64","include_sourcemaps":false},
          {"os":"macos-15-intel","platform":"darwin","arch":"x64","binary_name":"stagehand-server-v3-darwin-x64","include_sourcemaps":false},
          {"os":"windows-latest","platform":"win32","arch":"x64","binary_name":"stagehand-server-v3-win32-x64.exe","include_sourcemaps":false},
          {"os":"windows-11-arm","platform":"win32","arch":"arm64","binary_name":"stagehand-server-v3-win32-arm64.exe","include_sourcemaps":false}
        ]

  # Gathers the OpenAPI spec and the built SEA binaries into `release-assets/`,
  # writes a checksum file, and publishes them as a GitHub release on the tag
  # produced by `detect`.
  release:
    name: Publish GitHub Release
    runs-on: ubuntu-latest
    needs: [detect, build_binaries]
    if: needs.detect.outputs.release == 'true'
    steps:
      - name: Checkout repository
        uses: actions/checkout@v4
        with:
          fetch-tags: false
          fetch-depth: 1

      - name: Prepare release assets directory
        run: mkdir -p release-assets

      # Copy the OpenAPI spec under a version-stamped file name.
      - name: Prepare stagehand/server-v3 release assets
        run: |
          set -euo pipefail
          spec_src="${{ env.OAS_PATH }}"
          spec_dst="release-assets/openapi.v3.stagehand-server-v3-${{ needs.detect.outputs.version }}.yaml"
          cp "${spec_src}" "${spec_dst}"

      # Artifacts are merged into the workspace root, so each binary lands at
      # the repo-relative path it was uploaded from.
      - name: Download SEA binary artifacts
        uses: actions/download-artifact@v4
        with:
          path: .
          pattern: stagehand-server-v3-*
          merge-multiple: true

      - name: Collect SEA binaries
        shell: bash
        run: |
          set -euo pipefail
          # nullglob: an unmatched pattern expands to nothing, so the loop is skipped.
          shopt -s nullglob
          for sea_bin in packages/server-v3/dist/sea/stagehand-server-v3-*; do
            cp "${sea_bin}" release-assets/
          done

      - name: Create checksums
        shell: bash
        run: |
          set -euo pipefail
          cd release-assets
          # Only checksum binaries (exclude openapi yaml). Avoid failing if no matches.
          shopt -s nullglob
          bins=()
          for candidate in stagehand-server-v3-*; do
            if [[ "${candidate}" == *openapi* ]]; then
              continue
            fi
            if [[ -f "${candidate}" ]]; then
              bins+=("${candidate}")
            fi
          done
          # Always create the file so the upload list below has something to match.
          : > checksums.sha256
          if (( ${#bins[@]} > 0 )); then
            shasum -a 256 "${bins[@]}" > checksums.sha256
          fi

      - name: Publish stagehand/server-v3 GitHub release
        uses: softprops/action-gh-release@v2
        with:
          name: stagehand/server-v3 v${{ needs.detect.outputs.version }}
          tag_name: ${{ needs.detect.outputs.tag }}
          generate_release_notes: true
          files: |
            release-assets/openapi.v3.stagehand-server-v3-${{ needs.detect.outputs.version }}.yaml
            release-assets/stagehand-server-v3-*
            release-assets/checksums.sha256


================================================
FILE: .github/workflows/stagehand-server-v3-sea-build.yml
================================================
name: Stagehand Server v3 SEA Build

on:
  # Reusable-workflow entry point (invoked from other workflows via `uses:`).
  workflow_call:
    inputs:
      matrix:
        type: string
        required: false
        description: 'JSON matrix include list for SEA binaries.'
        default: |
          [
            {"os":"ubuntu-latest","platform":"linux","arch":"x64","binary_name":"stagehand-server-v3-linux-x64","include_sourcemaps":false},
            {"os":"ubuntu-24.04-arm","platform":"linux","arch":"arm64","binary_name":"stagehand-server-v3-linux-arm64","include_sourcemaps":false},
            {"os":"macos-15","platform":"darwin","arch":"arm64","binary_name":"stagehand-server-v3-darwin-arm64","include_sourcemaps":false},
            {"os":"macos-15-intel","platform":"darwin","arch":"x64","binary_name":"stagehand-server-v3-darwin-x64","include_sourcemaps":false},
            {"os":"windows-latest","platform":"win32","arch":"x64","binary_name":"stagehand-server-v3-win32-x64.exe","include_sourcemaps":false},
            {"os":"windows-11-arm","platform":"win32","arch":"arm64","binary_name":"stagehand-server-v3-win32-arm64.exe","include_sourcemaps":false}
          ]
      use-prebuilt-artifacts:
        type: string
        required: false
        description: 'Whether to download pre-built package artifacts.'
        default: 'false'
      restore-turbo-cache:
        type: string
        required: false
        description: 'Whether to restore local .turbo cache.'
        default: 'true'
      node-version:
        type: string
        required: false
        description: 'Node.js version for setup.'
        default: '20.x'
      upload-only-binary:
        type: string
        required: false
        description: 'Upload only this binary (empty => upload all).'
        default: ''
  # Manual entry point; declares the same inputs and defaults as workflow_call.
  workflow_dispatch:
    inputs:
      matrix:
        required: false
        description: 'JSON matrix include list for SEA binaries.'
        default: |
          [
            {"os":"ubuntu-latest","platform":"linux","arch":"x64","binary_name":"stagehand-server-v3-linux-x64","include_sourcemaps":false},
            {"os":"ubuntu-24.04-arm","platform":"linux","arch":"arm64","binary_name":"stagehand-server-v3-linux-arm64","include_sourcemaps":false},
            {"os":"macos-15","platform":"darwin","arch":"arm64","binary_name":"stagehand-server-v3-darwin-arm64","include_sourcemaps":false},
            {"os":"macos-15-intel","platform":"darwin","arch":"x64","binary_name":"stagehand-server-v3-darwin-x64","include_sourcemaps":false},
            {"os":"windows-latest","platform":"win32","arch":"x64","binary_name":"stagehand-server-v3-win32-x64.exe","include_sourcemaps":false},
            {"os":"windows-11-arm","platform":"win32","arch":"arm64","binary_name":"stagehand-server-v3-win32-arm64.exe","include_sourcemaps":false}
          ]
      use-prebuilt-artifacts:
        type: string
        required: false
        description: 'Whether to download pre-built package artifacts.'
        default: 'false'
      restore-turbo-cache:
        type: string
        required: false
        description: 'Whether to restore local .turbo cache.'
        default: 'true'
      node-version:
        type: string
        required: false
        description: 'Node.js version for setup.'
        default: '20.x'
      upload-only-binary:
        type: string
        required: false
        description: 'Upload only this binary (empty => upload all).'
        default: ''

jobs:
  # Builds one SEA binary per matrix entry, checks that it exists and serves
  # /healthz, then uploads it as an artifact named after the binary.
  build_binaries:
    name: Build SEA binaries (${{ matrix.binary_name }})
    runs-on: ${{ matrix.os }}
    strategy:
      # Let the remaining matrix entries finish when one of them fails.
      fail-fast: false
      matrix:
        include: ${{ fromJson(inputs.matrix) }}

    steps:
      - name: Checkout repository
        uses: actions/checkout@v6
        with:
          fetch-depth: 1
          fetch-tags: false

      - uses: ./.github/actions/setup-node-pnpm-turbo
        env:
          PLAYWRIGHT_SKIP_BROWSER_DOWNLOAD: "1"
          PLAYWRIGHT_SKIP_DOWNLOAD: "1"
          PUPPETEER_SKIP_DOWNLOAD: "1"
        with:
          use-prebuilt-artifacts: ${{ inputs.use-prebuilt-artifacts }}
          restore-turbo-cache: ${{ inputs.restore-turbo-cache }}
          node-version: ${{ inputs.node-version }}

      # The build script is configured through SEA_* environment variables.
      - name: Build SEA binary (ESM)
        env:
          SEA_TARGET_PLATFORM: ${{ matrix.platform }}
          SEA_TARGET_ARCH: ${{ matrix.arch }}
          SEA_BINARY_NAME: ${{ matrix.binary_name }}
          SEA_INCLUDE_SOURCEMAPS: ${{ matrix.include_sourcemaps && '1' || '0' }}
        run: pnpm exec turbo run build:sea:esm --filter=@browserbasehq/stagehand-server-v3

      - name: Verify SEA binary exists
        shell: bash
        env:
          # Matrix values come from a workflow input; pass them through the
          # environment instead of interpolating them into the script text.
          BINARY_NAME: ${{ matrix.binary_name }}
        run: |
          test -f "packages/server-v3/dist/sea/${BINARY_NAME}"

      # Starts the binary on a random port and polls /healthz once per second,
      # for at most 30 attempts.
      - name: Verify SEA binary launches cleanly
        shell: bash
        env:
          RUNNER_ARCH: ${{ runner.arch }}
          BINARY_NAME: ${{ matrix.binary_name }}
          MATRIX_ARCH: ${{ matrix.arch }}
          MATRIX_PLATFORM: ${{ matrix.platform }}
        run: |
          set -euo pipefail

          binary="packages/server-v3/dist/sea/${BINARY_NAME}"
          matrix_arch="${MATRIX_ARCH}"
          # runner.arch is upper-case (e.g. X64, ARM64); matrix arch is lower-case.
          runner_arch="$(echo "${RUNNER_ARCH}" | tr '[:upper:]' '[:lower:]')"

          if [[ "${matrix_arch}" != "${runner_arch}" ]]; then
            echo "Runner arch (${runner_arch}) does not match matrix arch (${matrix_arch})."
            echo "Launch verification must run on same-arch runners."
            exit 1
          fi

          if [[ "${MATRIX_PLATFORM}" != "win32" ]]; then
            chmod +x "${binary}"
          fi

          port="$((30000 + RANDOM % 10000))"
          log_file="$(mktemp)"
          launched="false"

          # Stop the background server on every exit path.
          cleanup() {
            if [[ -n "${pid:-}" ]] && kill -0 "${pid}" 2>/dev/null; then
              kill "${pid}" 2>/dev/null || true
              wait "${pid}" 2>/dev/null || true
            fi
          }
          trap cleanup EXIT

          PORT="${port}" "${binary}" >"${log_file}" 2>&1 &
          pid=$!

          for _ in {1..30}; do
            # Fail fast if the process died instead of waiting out the loop.
            if ! kill -0 "${pid}" 2>/dev/null; then
              wait "${pid}" 2>/dev/null || true
              echo "SEA binary exited before becoming healthy."
              cat "${log_file}"
              exit 1
            fi

            # --max-time bounds each probe so an accepted-but-unanswered
            # connection cannot stall the loop indefinitely.
            if curl --silent --show-error --fail --max-time 5 "http://127.0.0.1:${port}/healthz" >/dev/null; then
              launched="true"
              break
            fi

            sleep 1
          done

          if [[ "${launched}" != "true" ]]; then
            echo "SEA binary did not become healthy within 30 seconds."
            cat "${log_file}"
            exit 1
          fi

      - name: Upload artifact
        uses: actions/upload-artifact@v4
        if: ${{ inputs.upload-only-binary == '' || matrix.binary_name == inputs.upload-only-binary }}
        with:
          name: ${{ matrix.binary_name }}
          # package.json is included to anchor artifact paths at repo root.
          path: |
            package.json
            packages/server-v3/dist/sea/${{ matrix.binary_name }}
          retention-days: 7


================================================
FILE: .github/workflows/stagehand-server-v4-release.yml
================================================
name: Release stagehand/server-v4

# Runs when a push to main touches .changeset/, or on manual dispatch.
on:
  push:
    branches: [main]
    paths:
      - '.changeset/**'
  workflow_dispatch:

# Write access is needed to push the release tag and publish the release.
permissions:
  contents: write

concurrency:
  group: ${{ github.workflow }}-${{ github.ref }}

env:
  OAS_PATH: packages/server-v4/openapi.v4.yaml

jobs:
  # Decides whether @browserbasehq/stagehand-server-v4 has a pending release,
  # exposes `release`, `version` and `tag` as job outputs, and creates the
  # release tag when one is due.
  detect:
    name: Detect server-v4 release (changesets)
    runs-on: ubuntu-latest
    outputs:
      release: ${{ steps.meta.outputs.release }}
      version: ${{ steps.meta.outputs.version }}
      tag: ${{ steps.meta.outputs.tag }}
    steps:
      # Tags are fetched because the metadata step lists existing release tags.
      - name: Checkout repository
        uses: actions/checkout@v4
        with:
          fetch-depth: 1
          fetch-tags: true

      - uses: ./.github/actions/setup-node-pnpm-turbo
        env:
          PLAYWRIGHT_SKIP_BROWSER_DOWNLOAD: "1"
        with:
          use-prebuilt-artifacts: "false"

      - name: Determine release metadata
        id: meta
        shell: bash
        run: |
          set -euo pipefail

          # Highest existing server-v4 tag by version sort; empty when none exists.
          latest_tag="$(git tag -l 'stagehand-server-v4/v*' --sort=-v:refname | head -n 1 || true)"
          rm -f changeset-status.json
          if [ -n "${latest_tag}" ]; then
            pnpm changeset status --since "${latest_tag}" --output changeset-status.json
          else
            pnpm changeset status --output changeset-status.json
          fi

          node <<'NODE'
          const fs = require('fs');

          const PACKAGE_NAME = '@browserbasehq/stagehand-server-v4';

          const status = JSON.parse(fs.readFileSync('changeset-status.json', 'utf8'));
          const changesets = Array.isArray(status.changesets) ? status.changesets : [];
          const releases = Array.isArray(status.releases) ? status.releases : [];

          // Release only when at least one changeset names the server package itself.
          const shouldRelease = changesets.some((cs) =>
            (cs.releases || []).some((r) => r?.name === PACKAGE_NAME)
          );

          const serverRelease = releases.find((r) => r?.name === PACKAGE_NAME);
          if (shouldRelease && !serverRelease?.newVersion) {
            throw new Error(
              'Expected @browserbasehq/stagehand-server-v4 to have a computed newVersion in changeset-status.json.'
            );
          }

          const release = shouldRelease ? 'true' : 'false';
          const version = shouldRelease ? serverRelease.newVersion : '';
          // Keep the tag empty when nothing is released instead of emitting the
          // malformed value "stagehand-server-v4/v".
          const tag = shouldRelease ? `stagehand-server-v4/v${version}` : '';

          const out = process.env.GITHUB_OUTPUT;
          fs.appendFileSync(out, `release=${release}\n`);
          fs.appendFileSync(out, `version=${version}\n`);
          fs.appendFileSync(out, `tag=${tag}\n`);
          NODE

      # Creates and pushes the annotated tag at the triggering commit, unless a
      # tag with that name already exists locally or on the remote.
      - name: Create stagehand/server-v4 tag
        if: steps.meta.outputs.release == 'true'
        env:
          GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
          # Expression values reach the script as environment variables instead
          # of being interpolated into the shell source.
          TAG: ${{ steps.meta.outputs.tag }}
          VERSION: ${{ steps.meta.outputs.version }}
          TARGET_SHA: ${{ github.sha }}
        shell: bash
        run: |
          set -euo pipefail

          git config user.name "github-actions[bot]"
          git config user.email "41898282+github-actions[bot]@users.noreply.github.com"

          # Try to fetch the tag if it exists on remote; ignore failure for new tags
          git fetch --force origin "refs/tags/${TAG}:refs/tags/${TAG}" 2>/dev/null || true
          if git rev-parse -q --verify "refs/tags/${TAG}" >/dev/null; then
            echo "Tag already exists: ${TAG}"
            exit 0
          fi

          git tag -a "${TAG}" "${TARGET_SHA}" -m "stagehand/server-v4 v${VERSION}"
          git push origin "${TAG}"

  # Delegates to the reusable SEA build workflow; skipped unless `detect`
  # reported a pending release.
  build_binaries:
    name: Build SEA binaries
    if: needs.detect.outputs.release == 'true'
    needs: [detect]
    uses: ./.github/workflows/stagehand-server-v4-sea-build.yml
    with:
      # One entry per binary: runner image, target platform/arch, output file name.
      matrix: |
        [
          {"os":"ubuntu-latest","platform":"linux","arch":"x64","binary_name":"stagehand-server-v4-linux-x64","include_sourcemaps":false},
          {"os":"ubuntu-24.04-arm","platform":"linux","arch":"arm64","binary_name":"stagehand-server-v4-linux-arm64","include_sourcemaps":false},
          {"os":"macos-15","platform":"darwin","arch":"arm64","binary_name":"stagehand-server-v4-darwin-arm64","include_sourcemaps":false},
          {"os":"macos-15-intel","platform":"darwin","arch":"x64","binary_name":"stagehand-server-v4-darwin-x64","include_sourcemaps":false},
          {"os":"windows-latest","platform":"win32","arch":"x64","binary_name":"stagehand-server-v4-win32-x64.exe","include_sourcemaps":false},
          {"os":"windows-11-arm","platform":"win32","arch":"arm64","binary_name":"stagehand-server-v4-win32-arm64.exe","include_sourcemaps":false}
        ]

  # Gathers the OpenAPI spec and the built SEA binaries into `release-assets/`,
  # writes a checksum file, and publishes them as a GitHub release on the tag
  # produced by `detect`.
  release:
    name: Publish GitHub Release
    runs-on: ubuntu-latest
    needs: [detect, build_binaries]
    if: needs.detect.outputs.release == 'true'
    steps:
      - name: Checkout repository
        uses: actions/checkout@v4
        with:
          fetch-tags: false
          fetch-depth: 1

      - name: Prepare release assets directory
        run: mkdir -p release-assets

      # Copy the OpenAPI spec under a version-stamped file name.
      - name: Prepare stagehand/server-v4 release assets
        run: |
          set -euo pipefail
          spec_src="${{ env.OAS_PATH }}"
          spec_dst="release-assets/openapi.v4.stagehand-server-v4-${{ needs.detect.outputs.version }}.yaml"
          cp "${spec_src}" "${spec_dst}"

      # Artifacts are merged into the workspace root, so each binary lands at
      # the repo-relative path it was uploaded from.
      - name: Download SEA binary artifacts
        uses: actions/download-artifact@v4
        with:
          path: .
          pattern: stagehand-server-v4-*
          merge-multiple: true

      - name: Collect SEA binaries
        shell: bash
        run: |
          set -euo pipefail
          # nullglob: an unmatched pattern expands to nothing, so the loop is skipped.
          shopt -s nullglob
          for sea_bin in packages/server-v4/dist/sea/stagehand-server-v4-*; do
            cp "${sea_bin}" release-assets/
          done

      - name: Create checksums
        shell: bash
        run: |
          set -euo pipefail
          cd release-assets
          # Only checksum binaries (exclude openapi yaml). Avoid failing if no matches.
          shopt -s nullglob
          bins=()
          for candidate in stagehand-server-v4-*; do
            if [[ "${candidate}" == *openapi* ]]; then
              continue
            fi
            if [[ -f "${candidate}" ]]; then
              bins+=("${candidate}")
            fi
          done
          # Always create the file so the upload list below has something to match.
          : > checksums.sha256
          if (( ${#bins[@]} > 0 )); then
            shasum -a 256 "${bins[@]}" > checksums.sha256
          fi

      - name: Publish stagehand/server-v4 GitHub release
        uses: softprops/action-gh-release@v2
        with:
          name: stagehand/server-v4 v${{ needs.detect.outputs.version }}
          tag_name: ${{ needs.detect.outputs.tag }}
          generate_release_notes: true
          files: |
            release-assets/openapi.v4.stagehand-server-v4-${{ needs.detect.outputs.version }}.yaml
            release-assets/stagehand-server-v4-*
            release-assets/checksums.sha256


================================================
FILE: .github/workflows/stagehand-server-v4-sea-build.yml
================================================
name: Stagehand Server v4 SEA Build

on:
  # Reusable-workflow entry point (invoked from other workflows via `uses:`).
  workflow_call:
    inputs:
      matrix:
        type: string
        required: false
        description: 'JSON matrix include list for SEA binaries.'
        default: |
          [
            {"os":"ubuntu-latest","platform":"linux","arch":"x64","binary_name":"stagehand-server-v4-linux-x64","include_sourcemaps":false},
            {"os":"ubuntu-24.04-arm","platform":"linux","arch":"arm64","binary_name":"stagehand-server-v4-linux-arm64","include_sourcemaps":false},
            {"os":"macos-15","platform":"darwin","arch":"arm64","binary_name":"stagehand-server-v4-darwin-arm64","include_sourcemaps":false},
            {"os":"macos-15-intel","platform":"darwin","arch":"x64","binary_name":"stagehand-server-v4-darwin-x64","include_sourcemaps":false},
            {"os":"windows-latest","platform":"win32","arch":"x64","binary_name":"stagehand-server-v4-win32-x64.exe","include_sourcemaps":false},
            {"os":"windows-11-arm","platform":"win32","arch":"arm64","binary_name":"stagehand-server-v4-win32-arm64.exe","include_sourcemaps":false}
          ]
      use-prebuilt-artifacts:
        type: string
        required: false
        description: 'Whether to download pre-built package artifacts.'
        default: 'false'
      restore-turbo-cache:
        type: string
        required: false
        description: 'Whether to restore local .turbo cache.'
        default: 'true'
      node-version:
        type: string
        required: false
        description: 'Node.js version for setup.'
        default: '20.x'
      upload-only-binary:
        type: string
        required: false
        description: 'Upload only this binary (empty => upload all).'
        default: ''
  # Manual entry point; declares the same inputs and defaults as workflow_call.
  workflow_dispatch:
    inputs:
      matrix:
        required: false
        description: 'JSON matrix include list for SEA binaries.'
        default: |
          [
            {"os":"ubuntu-latest","platform":"linux","arch":"x64","binary_name":"stagehand-server-v4-linux-x64","include_sourcemaps":false},
            {"os":"ubuntu-24.04-arm","platform":"linux","arch":"arm64","binary_name":"stagehand-server-v4-linux-arm64","include_sourcemaps":false},
            {"os":"macos-15","platform":"darwin","arch":"arm64","binary_name":"stagehand-server-v4-darwin-arm64","include_sourcemaps":false},
            {"os":"macos-15-intel","platform":"darwin","arch":"x64","binary_name":"stagehand-server-v4-darwin-x64","include_sourcemaps":false},
            {"os":"windows-latest","platform":"win32","arch":"x64","binary_name":"stagehand-server-v4-win32-x64.exe","include_sourcemaps":false},
            {"os":"windows-11-arm","platform":"win32","arch":"arm64","binary_name":"stagehand-server-v4-win32-arm64.exe","include_sourcemaps":false}
          ]
      use-prebuilt-artifacts:
        type: string
        required: false
        description: 'Whether to download pre-built package artifacts.'
        default: 'false'
      restore-turbo-cache:
        type: string
        required: false
        description: 'Whether to restore local .turbo cache.'
        default: 'true'
      node-version:
        type: string
        required: false
        description: 'Node.js version for setup.'
        default: '20.x'
      upload-only-binary:
        type: string
        required: false
        description: 'Upload only this binary (empty => upload all).'
        default: ''

jobs:
  # Builds one SEA binary per matrix entry, checks that it exists and serves
  # /healthz, then uploads it as an artifact named after the binary.
  build_binaries:
    name: Build SEA binaries (${{ matrix.binary_name }})
    runs-on: ${{ matrix.os }}
    strategy:
      # Let the remaining matrix entries finish when one of them fails.
      fail-fast: false
      matrix:
        include: ${{ fromJson(inputs.matrix) }}

    steps:
      - name: Checkout repository
        uses: actions/checkout@v6
        with:
          fetch-depth: 1
          fetch-tags: false

      - uses: ./.github/actions/setup-node-pnpm-turbo
        env:
          PLAYWRIGHT_SKIP_BROWSER_DOWNLOAD: "1"
          PLAYWRIGHT_SKIP_DOWNLOAD: "1"
          PUPPETEER_SKIP_DOWNLOAD: "1"
        with:
          use-prebuilt-artifacts: ${{ inputs.use-prebuilt-artifacts }}
          restore-turbo-cache: ${{ inputs.restore-turbo-cache }}
          node-version: ${{ inputs.node-version }}

      # The build script is configured through SEA_* environment variables.
      - name: Build SEA binary (ESM)
        env:
          SEA_TARGET_PLATFORM: ${{ matrix.platform }}
          SEA_TARGET_ARCH: ${{ matrix.arch }}
          SEA_BINARY_NAME: ${{ matrix.binary_name }}
          SEA_INCLUDE_SOURCEMAPS: ${{ matrix.include_sourcemaps && '1' || '0' }}
        run: pnpm exec turbo run build:sea:esm --filter=@browserbasehq/stagehand-server-v4

      - name: Verify SEA binary exists
        shell: bash
        env:
          # Matrix values come from a workflow input; pass them through the
          # environment instead of interpolating them into the script text.
          BINARY_NAME: ${{ matrix.binary_name }}
        run: |
          test -f "packages/server-v4/dist/sea/${BINARY_NAME}"

      # Starts the binary on a random port and polls /healthz once per second,
      # for at most 30 attempts.
      - name: Verify SEA binary launches cleanly
        shell: bash
        env:
          RUNNER_ARCH: ${{ runner.arch }}
          BINARY_NAME: ${{ matrix.binary_name }}
          MATRIX_ARCH: ${{ matrix.arch }}
          MATRIX_PLATFORM: ${{ matrix.platform }}
        run: |
          set -euo pipefail

          binary="packages/server-v4/dist/sea/${BINARY_NAME}"
          matrix_arch="${MATRIX_ARCH}"
          # runner.arch is upper-case (e.g. X64, ARM64); matrix arch is lower-case.
          runner_arch="$(echo "${RUNNER_ARCH}" | tr '[:upper:]' '[:lower:]')"

          if [[ "${matrix_arch}" != "${runner_arch}" ]]; then
            echo "Runner arch (${runner_arch}) does not match matrix arch (${matrix_arch})."
            echo "Launch verification must run on same-arch runners."
            exit 1
          fi

          if [[ "${MATRIX_PLATFORM}" != "win32" ]]; then
            chmod +x "${binary}"
          fi

          port="$((30000 + RANDOM % 10000))"
          log_file="$(mktemp)"
          launched="false"

          # Stop the background server on every exit path.
          cleanup() {
            if [[ -n "${pid:-}" ]] && kill -0 "${pid}" 2>/dev/null; then
              kill "${pid}" 2>/dev/null || true
              wait "${pid}" 2>/dev/null || true
            fi
          }
          trap cleanup EXIT

          PORT="${port}" "${binary}" >"${log_file}" 2>&1 &
          pid=$!

          for _ in {1..30}; do
            # Fail fast if the process died instead of waiting out the loop.
            if ! kill -0 "${pid}" 2>/dev/null; then
              wait "${pid}" 2>/dev/null || true
              echo "SEA binary exited before becoming healthy."
              cat "${log_file}"
              exit 1
            fi

            # --max-time bounds each probe so an accepted-but-unanswered
            # connection cannot stall the loop indefinitely.
            if curl --silent --show-error --fail --max-time 5 "http://127.0.0.1:${port}/healthz" >/dev/null; then
              launched="true"
              break
            fi

            sleep 1
          done

          if [[ "${launched}" != "true" ]]; then
            echo "SEA binary did not become healthy within 30 seconds."
            cat "${log_file}"
            exit 1
          fi

      - name: Upload artifact
        uses: actions/upload-artifact@v4
        if: ${{ inputs.upload-only-binary == '' || matrix.binary_name == inputs.upload-only-binary }}
        with:
          name: ${{ matrix.binary_name }}
          # package.json is included to anchor artifact paths at repo root.
          path: |
            package.json
            packages/server-v4/dist/sea/${{ matrix.binary_name }}
          retention-days: 7


================================================
FILE: .github/workflows/stainless.yml
================================================
name: Build SDKs for pull request

on:
  pull_request:
    types: [opened, synchronize, reopened, closed]

# One active run per pull request; a newer event cancels the run in progress.
concurrency:
  cancel-in-progress: true
  group: ${{ github.workflow }}-${{ github.event.pull_request.number }}

env:
  OAS_PATH: packages/server-v3/openapi.v3.yaml
  STAINLESS_ORG: ${{ vars.STAINLESS_ORG }}
  STAINLESS_PROJECT: ${{ vars.STAINLESS_PROJECT }}

jobs:
  # Runs the Stainless preview action for every pull-request event except `closed`.
  preview:
    runs-on: ubuntu-latest
    if: github.event.action != 'closed'
    permissions:
      pull-requests: write
      contents: read
    steps:
      - name: Checkout repository
        uses: actions/checkout@v4
        with:
          fetch-depth: 2

      - name: Run preview builds
        uses: stainless-api/upload-openapi-spec-action/preview@v1
        with:
          org: ${{ env.STAINLESS_ORG }}
          project: ${{ env.STAINLESS_PROJECT }}
          stainless_api_key: ${{ secrets.STAINLESS_API_KEY }}
          config_path: stainless.yml
          oas_path: ${{ env.OAS_PATH }}

  # Runs the Stainless merge action only when a pull request targeting `main`
  # is closed as merged.
  merge:
    runs-on: ubuntu-latest
    if: github.event.action == 'closed' && github.event.pull_request.merged == true && github.event.pull_request.base.ref == 'main'
    permissions:
      pull-requests: write
      contents: read
    steps:
      - name: Checkout repository
        uses: actions/checkout@v4
        with:
          fetch-depth: 2
      - name: Run merge build
        uses: stainless-api/upload-openapi-spec-action/merge@v1
        with:
          org: ${{ env.STAINLESS_ORG }}
          project: ${{ env.STAINLESS_PROJECT }}
          stainless_api_key: ${{ secrets.STAINLESS_API_KEY }}
          config_path: stainless.yml
          oas_path: ${{ env.OAS_PATH }}


================================================
FILE: .gitignore
================================================
node_modules/
/test-results/
/playwright-report/
/blob-report/
/playwright/.cache/
screenshot.png
# macOS Finder metadata. `.DS_Store` is the spelling macOS writes; the
# upper-case entry is kept as well because patterns are matched
# case-sensitively unless core.ignoreCase is enabled.
.DS_Store
.DS_STORE
.cache/
.env
downloads/
dist/
.browserbase/
packages/evals/**/public
packages/core/lib/dom/build/
packages/core/lib/v3/dom/build/
packages/evals/public
*.tgz
evals/playground.ts
tmp/
eval-summary.json
# Other package managers' lockfiles (.prettierignore lists pnpm-lock.yaml as
# the lockfile in use).
package-lock.json
evals/deterministic/tests/BrowserContext/tmp-test.har
packages/core/lib/version.ts
packages/core/test-results/
/examples/inference_summary
/inference_summary
.turbo
.idea
coverage/
ctrf/
.stagehand-sea/


================================================
FILE: .prettierignore
================================================
# Lockfile, data files and documentation
pnpm-lock.yaml
**/*.json
README.md
docs/
packages/docs/

# CI configuration
.github/

# Dependencies and build output
node_modules/
dist/
packages/core/dist/
packages/cli/dist/
packages/evals/dist/
lib/dom/build/
lib/v3/dom/build/
packages/core/lib/dom/build/
packages/core/lib/v3/dom/build/
*.min.js

# .browserbase directories at any depth
.browserbase/
.browserbase/**
**/.browserbase/
**/.browserbase/**

# API tooling configuration and OpenAPI specs
stainless.yml
openapi.*.yaml


================================================
FILE: .prettierrc
================================================
{}


================================================
FILE: .vscode/settings.json
================================================
{
  "editor.defaultFormatter": "esbenp.prettier-vscode",
  "editor.formatOnSave": true
}


================================================
FILE: CHANGELOG.md
================================================
# @browserbasehq/stagehand

## 3.0.0

### Major Changes

- Removes internal Playwright dependency
- A generous 20-40% speed increase across `act`, `extract`, & `observe` calls
- Compatibility with Playwright, Puppeteer, and Patchright
- Automatic action caching (`agent`, `stagehand.act`). Go from CUA → deterministic scripts without inference
- A suite of non AI primitives:
  - `page`
  - `locator` (built-in closed-mode shadow root traversal, with XPath & CSS selectors)
  - `frameLocator`
  - `deepLocator` (crosses iframes & shadow roots)
- Bun compatibility
- Simplified extract schemas
- CSS selector support (id-based support coming soon)
- Targeted extract and observe across iframes & shadow roots
- More intuitive type names (observeResult is now action, act accepts an instruction string instead of an action string, solidified ModelConfiguration)

Check the [migration guide](https://docs.stagehand.dev/v3/migrations/v2) for more information.

## 2.5.0

### Minor Changes

- [#981](https://github.com/browserbase/stagehand/pull/981) [`8244ab2`](https://github.com/browserbase/stagehand/commit/8244ab247cd679962685ae2f7c54e874ce1fa614) Thanks [@sameelarif](https://github.com/sameelarif)! - Added support for `stagehand.agent` to interact with MCP servers as well as custom tools to be passed in. For more information, reference the [MCP integrations documentation](https://docs.stagehand.dev/best-practices/mcp-integrations)

### Patch Changes

- [#959](https://github.com/browserbase/stagehand/pull/959) [`09b5e1e`](https://github.com/browserbase/stagehand/commit/09b5e1e9c23c845903686db6665cc968ac34efbb) Thanks [@filip-michalsky](https://github.com/filip-michalsky)! - add webvoyager evals

- [#1049](https://github.com/browserbase/stagehand/pull/1049) [`e3734b9`](https://github.com/browserbase/stagehand/commit/e3734b9c98352d5f0a4eca49791b0bbf2130ab41) Thanks [@miguelg719](https://github.com/miguelg719)! - Support local MCP server connections

- [#1025](https://github.com/browserbase/stagehand/pull/1025) [`be85b19`](https://github.com/browserbase/stagehand/commit/be85b19679a826f19702e00f0aae72fce1118ec8) Thanks [@tkattkat](https://github.com/tkattkat)! - add support for custom baseUrl within openai provider

- [#1040](https://github.com/browserbase/stagehand/pull/1040) [`88d1565`](https://github.com/browserbase/stagehand/commit/88d1565c65bb65a104fea2d5f5e862bbbda69677) Thanks [@miguelg719](https://github.com/miguelg719)! - Allow OpenAI CUA to take in an optional baseURL

- [#1046](https://github.com/browserbase/stagehand/pull/1046) [`ab5d6ed`](https://github.com/browserbase/stagehand/commit/ab5d6ede19aabc059badc4247f1cb2c6c9e71bae) Thanks [@tkattkat](https://github.com/tkattkat)! - Add support for gpt-5 in operator agent

## 2.4.4

### Patch Changes

- [#1012](https://github.com/browserbase/stagehand/pull/1012) [`9e8c173`](https://github.com/browserbase/stagehand/commit/9e8c17374fdc8fbe7f26e6cf802c36bd14f11039) Thanks [@miguelg719](https://github.com/miguelg719)! - Fix disabling api validation whenever a customLLM client is provided

## 2.4.3

### Patch Changes

- [#951](https://github.com/browserbase/stagehand/pull/951) [`f45afdc`](https://github.com/browserbase/stagehand/commit/f45afdccc8680650755fee66ffbeac32b41e075d) Thanks [@miguelg719](https://github.com/miguelg719)! - Patch GPT-5 new api format

- [#954](https://github.com/browserbase/stagehand/pull/954) [`261bba4`](https://github.com/browserbase/stagehand/commit/261bba43fa79ac3af95328e673ef3e9fced3279b) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - add support for shadow DOMs (open & closed mode) when experimental: true

- [#944](https://github.com/browserbase/stagehand/pull/944) [`8de7bd8`](https://github.com/browserbase/stagehand/commit/8de7bd8635c2051cd8025e365c6c8aa83d81c7e7) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - Bump zod version compatibility and add pathing spec

- [#919](https://github.com/browserbase/stagehand/pull/919) [`3d80421`](https://github.com/browserbase/stagehand/commit/3d804210a106a6828c7fa50f8b765b10afd4cc6a) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - enable scrolling inside of iframes

- [#963](https://github.com/browserbase/stagehand/pull/963) [`0ead63d`](https://github.com/browserbase/stagehand/commit/0ead63d6526f6c286362b74b6407c8bebc900e69) Thanks [@tkattkat](https://github.com/tkattkat)! - Properly handle images in evaluator + clean up response parsing logic

- [#961](https://github.com/browserbase/stagehand/pull/961) [`8422828`](https://github.com/browserbase/stagehand/commit/8422828c4cd5fd5ebcf348cfbdb40c768bb76dd9) Thanks [@tkattkat](https://github.com/tkattkat)! - Add more evals for stagehand agent

- [#946](https://github.com/browserbase/stagehand/pull/946) [`b769206`](https://github.com/browserbase/stagehand/commit/b7692060f98a2f49aeeefb90d8789ed034b08ec2) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - fix: unable to act on/get content from some same process iframes

- [#962](https://github.com/browserbase/stagehand/pull/962) [`72d2683`](https://github.com/browserbase/stagehand/commit/72d2683202af7e578d98367893964b33e0828de5) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - handle namespaced elements in xpath build step

## 2.4.2

### Patch Changes

- [#865](https://github.com/browserbase/stagehand/pull/865) [`6b4e6e3`](https://github.com/browserbase/stagehand/commit/6b4e6e3f31d5496cf15728e9018eddeb04839542) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - improve type safety for trimTrailingTextNode

- [#897](https://github.com/browserbase/stagehand/pull/897) [`e77d018`](https://github.com/browserbase/stagehand/commit/e77d0188683ebf596dfb78dfafbbca1dc32993f0) Thanks [@miguelg719](https://github.com/miguelg719)! - Fix selfHeal to remember initially received arguments

- [#920](https://github.com/browserbase/stagehand/pull/920) [`c20adb9`](https://github.com/browserbase/stagehand/commit/c20adb95539fed8c56a4aa413262a9c65a8e6474) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - fix: tab handling on API

- [#882](https://github.com/browserbase/stagehand/pull/882) [`b86df93`](https://github.com/browserbase/stagehand/commit/b86df93b9136aae96292121a29c25f3d74d84bf7) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - remove elements that don't have xpaths from observe response

- [#905](https://github.com/browserbase/stagehand/pull/905) [`023c2c2`](https://github.com/browserbase/stagehand/commit/023c2c273b46d3792d7e5d3c902089487b16b531) Thanks [@tkattkat](https://github.com/tkattkat)! - Delete old images from anthropic cua client

- [#925](https://github.com/browserbase/stagehand/pull/925) [`8c28647`](https://github.com/browserbase/stagehand/commit/8c2864755ecd05c8f7de235d4198deec0dd5f78e) Thanks [@miguelg719](https://github.com/miguelg719)! - Remove \_refreshPageFromApi()

- [#887](https://github.com/browserbase/stagehand/pull/887) [`87e09c6`](https://github.com/browserbase/stagehand/commit/87e09c618940f364ec8af00455a19a17ec63cbd3) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - fix: allow xpaths with prepended 'xpath=' for targeted extract

- [#864](https://github.com/browserbase/stagehand/pull/864) [`a611115`](https://github.com/browserbase/stagehand/commit/a61111525d70b450bdfc43f112380f44899c9e97) Thanks [@miguelg719](https://github.com/miguelg719)! - Temporarily patch custom clients serialization error on api

- [#881](https://github.com/browserbase/stagehand/pull/881) [`69913fe`](https://github.com/browserbase/stagehand/commit/69913fe1dfb8201ae2aeffa5f049fb46ab02cbc2) Thanks [@miguelg719](https://github.com/miguelg719)! - Pass sdk version number to API for debugging

- [#913](https://github.com/browserbase/stagehand/pull/913) [`b1b83a1`](https://github.com/browserbase/stagehand/commit/b1b83a1d334fe76e5f5f9dd32dc92c16b7d40ce6) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - move iframe out of 'experimental'

- [#891](https://github.com/browserbase/stagehand/pull/891) [`be8497c`](https://github.com/browserbase/stagehand/commit/be8497cb6b142cc893cea9692b8c47bd19514c60) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - fix: nested iframe xpath bug

- [#883](https://github.com/browserbase/stagehand/pull/883) [`98704c9`](https://github.com/browserbase/stagehand/commit/98704c9ed225ca25bbde4bb3dc286936e9c54471) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - add timeout for JS click

- [#907](https://github.com/browserbase/stagehand/pull/907) [`04978bd`](https://github.com/browserbase/stagehand/commit/04978bdd30d2edcbc69eb9fd91358a16975ea2eb) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - store mapping of CDP frame ID -> page

## 2.4.1

### Patch Changes

- [#856](https://github.com/browserbase/stagehand/pull/856) [`8a43c5a`](https://github.com/browserbase/stagehand/commit/8a43c5a86d4da40cfaedd9cf2e42186928bdf946) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - set download behaviour by default

- [#857](https://github.com/browserbase/stagehand/pull/857) [`890ffcc`](https://github.com/browserbase/stagehand/commit/890ffccac5e0a60ade64a46eb550c981ffb3e84a) Thanks [@miguelg719](https://github.com/miguelg719)! - return "not-supported" for elements inside the shadow-dom

- [#844](https://github.com/browserbase/stagehand/pull/844) [`64c1072`](https://github.com/browserbase/stagehand/commit/64c10727bda50470483a3eb175c02842db0923a1) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - don't automatically close tabs

- [#860](https://github.com/browserbase/stagehand/pull/860) [`b077d3f`](https://github.com/browserbase/stagehand/commit/b077d3f48a97f47a71ccc79ae39b41e7f07f9c04) Thanks [@miguelg719](https://github.com/miguelg719)! - Set default schema on extract options with no schema

- [#842](https://github.com/browserbase/stagehand/pull/842) [`8bcb5d7`](https://github.com/browserbase/stagehand/commit/8bcb5d77debf6bf7601fd5c090efd7fde75c5d5e) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - improved handling for OS level dropdowns

- [#846](https://github.com/browserbase/stagehand/pull/846) [`7bf10c5`](https://github.com/browserbase/stagehand/commit/7bf10c55b267078fe847c1d7f7a60d604f9c7c94) Thanks [@miguelg719](https://github.com/miguelg719)! - Filter attaching to target worker / shared_worker

## 2.4.0

### Minor Changes

- [#819](https://github.com/browserbase/stagehand/pull/819) [`6a18c1e`](https://github.com/browserbase/stagehand/commit/6a18c1ee1e46d55c6e90c4d5572e17ed8daa140c) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - try playwright click and fall back to JS click event

### Patch Changes

- [#826](https://github.com/browserbase/stagehand/pull/826) [`124e0d3`](https://github.com/browserbase/stagehand/commit/124e0d3bb54ddb6738ede6d7aa99a945ef1cacd1) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - fix issue where we are unable to take actions on text nodes

- [#818](https://github.com/browserbase/stagehand/pull/818) [`1660751`](https://github.com/browserbase/stagehand/commit/1660751cd14cb5b27d44f8167216afb8d1c3c45c) Thanks [@miguelg719](https://github.com/miguelg719)! - Added CUA support for Claude 4 models

- [#821](https://github.com/browserbase/stagehand/pull/821) [`cadac9d`](https://github.com/browserbase/stagehand/commit/cadac9da09123d12e5d496a0e8b12660964c1b33) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - use playwright instead of playwright test

- [#832](https://github.com/browserbase/stagehand/pull/832) [`759da55`](https://github.com/browserbase/stagehand/commit/759da55775eb2df81d56ae18c0f386fd9b02a9f0) Thanks [@miguelg719](https://github.com/miguelg719)! - Fix \_refreshPageFromAPI to use parametrized apiKey

- [#810](https://github.com/browserbase/stagehand/pull/810) [`a175a51`](https://github.com/browserbase/stagehand/commit/a175a519b8c14300db6f1ed30709e113d18e99db) Thanks [@miguelg719](https://github.com/miguelg719)! - Update logos

- [#822](https://github.com/browserbase/stagehand/pull/822) [`8527a80`](https://github.com/browserbase/stagehand/commit/8527a80522c3eedb9516a6caa1a0e4e4be981a3d) Thanks [@miguelg719](https://github.com/miguelg719)! - Add model with date tag for OpenAI CUA

- [#833](https://github.com/browserbase/stagehand/pull/833) [`55fca2f`](https://github.com/browserbase/stagehand/commit/55fca2f7da63cc0ef6e27b45a33f63c666cdce7e) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - adjust stagehandLogger.warn() level to be 1 instead of 0

## 2.3.1

### Patch Changes

- [#796](https://github.com/browserbase/stagehand/pull/796) [`12a99b3`](https://github.com/browserbase/stagehand/commit/12a99b398d8a4c3eea3ca69a3cf793faaaf4aea3) Thanks [@miguelg719](https://github.com/miguelg719)! - Added an experimental flag to enable the newest and most experimental features

- [#807](https://github.com/browserbase/stagehand/pull/807) [`2451797`](https://github.com/browserbase/stagehand/commit/2451797f64c0efa4a72fd70265110003c8d0a6cd) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - include version number in StagehandDefaultError message

- [#803](https://github.com/browserbase/stagehand/pull/803) [`1d631a5`](https://github.com/browserbase/stagehand/commit/1d631a57a197390f672b718ae5199991ab27cfb1) Thanks [@miguelg719](https://github.com/miguelg719)! - Enable session affinity for cache optimization

- [#804](https://github.com/browserbase/stagehand/pull/804) [`9c398bb`](https://github.com/browserbase/stagehand/commit/9c398bb9ec2d10bdb53ad5aa7e3b58cce24fdb2b) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - update operatorResponseSchema based on new openai spec

- [#786](https://github.com/browserbase/stagehand/pull/786) [`c19ad7f`](https://github.com/browserbase/stagehand/commit/c19ad7f1e082e91fdeaa9c2ef63767a5a2b3a195) Thanks [@miguelg719](https://github.com/miguelg719)! - Handle reroute to account for rollout

## 2.3.0

### Minor Changes

- [#737](https://github.com/browserbase/stagehand/pull/737) [`6ef6073`](https://github.com/browserbase/stagehand/commit/6ef60730cab0ad9025f44b6eeb2c83751d1dcd35) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - deprecate useTextExtract and remove functionality

### Patch Changes

- [#741](https://github.com/browserbase/stagehand/pull/741) [`5680d25`](https://github.com/browserbase/stagehand/commit/5680d2509352c383ad502c9f4fabde01fa638833) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - use safeparse for zod validation

- [#783](https://github.com/browserbase/stagehand/pull/783) [`4de92a8`](https://github.com/browserbase/stagehand/commit/4de92a8af461fc95063faf39feee1d49259f58ba) Thanks [@miguelg719](https://github.com/miguelg719)! - Fix the readme logo link

## 2.2.1

### Patch Changes

- [#721](https://github.com/browserbase/stagehand/pull/721) [`be8652e`](https://github.com/browserbase/stagehand/commit/be8652e770b57fdb3299fa0b2efa4eb0e816434e) Thanks [@miguelg719](https://github.com/miguelg719)! - Fix stagehand.close() functionality to include calling browser.close()

- [#724](https://github.com/browserbase/stagehand/pull/724) [`6b413b7`](https://github.com/browserbase/stagehand/commit/6b413b7ad00b13ca0bd53ee2e7393023821408b6) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - rm refine step in extract

- [#712](https://github.com/browserbase/stagehand/pull/712) [`7eafbd9`](https://github.com/browserbase/stagehand/commit/7eafbd9b1a73b37effa444929767df7c592caf02) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - deprecated `onlyVisible` param and remove its functionality

- [#725](https://github.com/browserbase/stagehand/pull/725) [`1b50aa6`](https://github.com/browserbase/stagehand/commit/1b50aa61cf0a429dd6cb2760a08f7f698a50454b) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - don't overwrite .describe() when user defines a zod schema with z.string().url().describe()

- [#717](https://github.com/browserbase/stagehand/pull/717) [`f2b7f1f`](https://github.com/browserbase/stagehand/commit/f2b7f1f284eef1f96753319b66c7d0b273a6f8cd) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - don't publish uncompiled ts to npm

- [#719](https://github.com/browserbase/stagehand/pull/719) [`c8d672f`](https://github.com/browserbase/stagehand/commit/c8d672f7c410c256defbc2e87ead99239837aa28) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - fix `Invalid schema for response_format` error when extracting links

- [#722](https://github.com/browserbase/stagehand/pull/722) [`bebf204`](https://github.com/browserbase/stagehand/commit/bebf2044502333c694743078c5b0c9deae11fb79) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - replace NBSP with regular space & remove special characters from dom+a11y tree

- [#714](https://github.com/browserbase/stagehand/pull/714) [`37d6810`](https://github.com/browserbase/stagehand/commit/37d6810a704773d0383a86f98f5f17c7d5b21975) Thanks [@miguelg719](https://github.com/miguelg719)! - Fix the native AI SDK client implementation to optionally take in an API key

## 2.2.0

### Minor Changes

- [#655](https://github.com/browserbase/stagehand/pull/655) [`8814af9`](https://github.com/browserbase/stagehand/commit/8814af9ece99fddc3dd9fb32671d0513a3a00c67) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - extract links

- [#675](https://github.com/browserbase/stagehand/pull/675) [`35c55eb`](https://github.com/browserbase/stagehand/commit/35c55ebf6c2867801a0a6f6988a883c8cb90cf9a) Thanks [@tkattkat](https://github.com/tkattkat)! - Added Gemini 2.5 Flash to Google supported models

- [#668](https://github.com/browserbase/stagehand/pull/668) [`5c6d2cf`](https://github.com/browserbase/stagehand/commit/5c6d2cf89c9fbf198485506ed9ed75e07aec5cd4) Thanks [@miguelg719](https://github.com/miguelg719)! - Added a new class - Stagehand Evaluator - that wraps around a Stagehand object to determine whether a task is successful or not. Currently used for agent evals

### Patch Changes

- [#706](https://github.com/browserbase/stagehand/pull/706) [`18ac6fb`](https://github.com/browserbase/stagehand/commit/18ac6fba30f45b7557cecb890f4e84c75de8383c) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - remove unused fillInVariables fn

- [#692](https://github.com/browserbase/stagehand/pull/692) [`6b95248`](https://github.com/browserbase/stagehand/commit/6b95248d6e02e5304ce4dd60499e31fc42af57eb) Thanks [@miguelg719](https://github.com/miguelg719)! - Updated the list of OpenAI models (4.1, o3...)

- [#688](https://github.com/browserbase/stagehand/pull/688) [`7d81b3c`](https://github.com/browserbase/stagehand/commit/7d81b3c951c1f3dfc46845aefcc26ff175299bca) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - wrap page.evaluate to make sure we have injected browser side scripts before calling them

- [#664](https://github.com/browserbase/stagehand/pull/664) [`b5ca00a`](https://github.com/browserbase/stagehand/commit/b5ca00a25ad0c33a5f4d3198e1bc59edb9956e7c) Thanks [@miguelg719](https://github.com/miguelg719)! - remove unnecessary log

- [#683](https://github.com/browserbase/stagehand/pull/683) [`8f0f97b`](https://github.com/browserbase/stagehand/commit/8f0f97bc491e23ff0078c802aaf509fd04173c37) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - use JavaScript click instead of playwright

- [#705](https://github.com/browserbase/stagehand/pull/705) [`346ef5d`](https://github.com/browserbase/stagehand/commit/346ef5d0132dc1418dac18d26640a8df0435af57) Thanks [@miguelg719](https://github.com/miguelg719)! - Fixed removing a hanging observation map that is no longer used

- [#698](https://github.com/browserbase/stagehand/pull/698) [`c145bc1`](https://github.com/browserbase/stagehand/commit/c145bc1d90ffd0d71c412de3af1c26c121e0b101) Thanks [@sameelarif](https://github.com/sameelarif)! - Fixing LLM client support to natively integrate with AI SDK

- [#687](https://github.com/browserbase/stagehand/pull/687) [`edd6d3f`](https://github.com/browserbase/stagehand/commit/edd6d3feb47aac9f312a5edad78bf850ae1541db) Thanks [@miguelg719](https://github.com/miguelg719)! - Fixed the schema input for Gemini's response model

- [#678](https://github.com/browserbase/stagehand/pull/678) [`5ec43d8`](https://github.com/browserbase/stagehand/commit/5ec43d8b9568c0f86b3e24bd83d1826c837656ed) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - allow form filling when form is not top-most element

- [#694](https://github.com/browserbase/stagehand/pull/694) [`b8cc164`](https://github.com/browserbase/stagehand/commit/b8cc16405b712064a54c8cd591750368a47f35ea) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - add telemetry for cua agents to stagehand.metrics

- [#699](https://github.com/browserbase/stagehand/pull/699) [`d9f4243`](https://github.com/browserbase/stagehand/commit/d9f4243f6a8c8d4f3003ad6589f7eb4da6d23d0f) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - rm deprecated primitives from stagehand object

- [#710](https://github.com/browserbase/stagehand/pull/710) [`9f4ab76`](https://github.com/browserbase/stagehand/commit/9f4ab76a0c1f0c2171290765c48c3bcea5b50e0f) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - support targeted extract for domExtract

- [#677](https://github.com/browserbase/stagehand/pull/677) [`bc5a731`](https://github.com/browserbase/stagehand/commit/bc5a731241f7f4c5040dd672d8e3787555766421) Thanks [@miguelg719](https://github.com/miguelg719)! - Fixes a redundant unnecessary log

## 2.1.0

### Minor Changes

- [#659](https://github.com/browserbase/stagehand/pull/659) [`f9a435e`](https://github.com/browserbase/stagehand/commit/f9a435e938daccfb2e54ca23fad8ef75128a4486) Thanks [@miguelg719](https://github.com/miguelg719)! - Added native support for Google Generative models (Gemini)

### Patch Changes

- [#647](https://github.com/browserbase/stagehand/pull/647) [`ca5467d`](https://github.com/browserbase/stagehand/commit/ca5467de7d31bfb270b6b625224a926c52c97900) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - collapse redundant text nodes into parent elements

- [#636](https://github.com/browserbase/stagehand/pull/636) [`9037430`](https://github.com/browserbase/stagehand/commit/903743097367ba6bb12baa9f0fa8f7985f543fdc) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - fix token act metrics and inference logging being misplaced as observe metrics and inference logging

- [#648](https://github.com/browserbase/stagehand/pull/648) [`169e7ea`](https://github.com/browserbase/stagehand/commit/169e7ea9e229503ae5958eaa4511531578ee3841) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - add mapping of node id -> url

- [#654](https://github.com/browserbase/stagehand/pull/654) [`57a9853`](https://github.com/browserbase/stagehand/commit/57a98538381e0e54fbb734b43c50d61fd0d567df) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - fix repeated up & down scrolling bug for clicks inside `act`

- [#624](https://github.com/browserbase/stagehand/pull/624) [`cf167a4`](https://github.com/browserbase/stagehand/commit/cf167a437865e8e8bdb8739d22c3b3bb84e185de) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - export stagehand error classes so they can be referenced from @dist

- [#640](https://github.com/browserbase/stagehand/pull/640) [`178f5f0`](https://github.com/browserbase/stagehand/commit/178f5f0a8fecd876adfb4e29983853bdf7ec72fd) Thanks [@yash1744](https://github.com/yash1744)! - Added support for stagehand agents to automatically redirect to https://google.com when the page URL is empty or set to about:blank, preventing empty screenshots and saving tokens.

- [#661](https://github.com/browserbase/stagehand/pull/661) [`bf823a3`](https://github.com/browserbase/stagehand/commit/bf823a36930b0686b416a42302ef8c021b4aba75) Thanks [@kamath](https://github.com/kamath)! - fix press enter

- [#633](https://github.com/browserbase/stagehand/pull/633) [`86724f6`](https://github.com/browserbase/stagehand/commit/86724f6fb0abc7292423ac5bd0bebcd352f95940) Thanks [@miguelg719](https://github.com/miguelg719)! - Fix the getBrowser logic for redundant api calls and throw informed errors

- [#656](https://github.com/browserbase/stagehand/pull/656) [`c630373`](https://github.com/browserbase/stagehand/commit/c630373dede4c775875834bfb860436ba2ea48d2) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - parse out % signs from variables in act

- [#637](https://github.com/browserbase/stagehand/pull/637) [`944bbbf`](https://github.com/browserbase/stagehand/commit/944bbbfe8bfb357b4910584447a93f6f402c3826) Thanks [@kamath](https://github.com/kamath)! - Fix: forward along the stack trace in StagehandDefaultError

## 2.0.0

### Major Changes

- [#591](https://github.com/browserbase/stagehand/pull/591) [`e234a0f`](https://github.com/browserbase/stagehand/commit/e234a0f80bf4c07bcc57265da216cbc4ab3bd19d) Thanks [@miguelg719](https://github.com/miguelg719)! - Announcing **Stagehand 2.0**! 🎉

  We're thrilled to announce the release of Stagehand 2.0, bringing significant improvements to make browser automation more powerful, faster, and easier to use than ever before.

  ### 🚀 New Features

  - **Introducing `stagehand.agent`**: A powerful new way to integrate SOTA Computer use models or Browserbase's [Open Operator](https://operator.browserbase.com) into Stagehand with one line of code! Perfect for multi-step workflows and complex interactions. [Learn more](https://docs.stagehand.dev/concepts/agent)
  - **Lightning-fast `act` and `extract`**: Major performance improvements to make your automations run significantly faster.
  - **Enhanced Logging**: Better visibility into what's happening during automation with improved logging and debugging capabilities.
  - **Comprehensive Documentation**: A completely revamped documentation site with better examples, guides, and best practices.
  - **Improved Error Handling**: More descriptive errors and better error recovery to help you debug issues faster.

  ### 🛠️ Developer Experience

  - **Better TypeScript Support**: Enhanced type definitions and better IDE integration
  - **Better Error Messages**: Clearer, more actionable error messages to help you debug faster
  - **Improved Caching**: More reliable action caching for better performance

  We're excited to see what you build with Stagehand 2.0! For questions or support, join our [Slack community](https://stagehand.dev/slack).

  For more details, check out our [documentation](https://docs.stagehand.dev).

### Minor Changes

- [#588](https://github.com/browserbase/stagehand/pull/588) [`ba9efc5`](https://github.com/browserbase/stagehand/commit/ba9efc5580a536bc3c158e507a6c6695825c2834) Thanks [@sameelarif](https://github.com/sameelarif)! - Added support for offloading agent tasks to the API.

- [#600](https://github.com/browserbase/stagehand/pull/600) [`11e015d`](https://github.com/browserbase/stagehand/commit/11e015daac56dc961b8c8d54ce360fd00d4fee38) Thanks [@sameelarif](https://github.com/sameelarif)! - Added a `stagehand.history` array which stores an array of `act`, `extract`, `observe`, and `goto` calls made. Since this history array is stored on the `StagehandPage` level, it will capture methods even if indirectly called by an agent.

- [#601](https://github.com/browserbase/stagehand/pull/601) [`1d22604`](https://github.com/browserbase/stagehand/commit/1d2260401e27bae25779a55bb2ed7b7153c34fd0) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - add custom error classes

- [#599](https://github.com/browserbase/stagehand/pull/599) [`75d8fb3`](https://github.com/browserbase/stagehand/commit/75d8fb36a67cd84eb55b509bf959edc7b05059da) Thanks [@miguelg719](https://github.com/miguelg719)! - cleaner logging with pino

- [#609](https://github.com/browserbase/stagehand/pull/609) [`c92295d`](https://github.com/browserbase/stagehand/commit/c92295d8424dac1a4f81066ca260ade2d5fce80b) Thanks [@kamath](https://github.com/kamath)! - Removed deprecated fields and methods from Stagehand constructor and added cdpUrl to localBrowserLaunchOptions for custom CDP URLs support.

- [#571](https://github.com/browserbase/stagehand/pull/571) [`73d6736`](https://github.com/browserbase/stagehand/commit/73d67368b88002c17814e46e75a99456bf355c4e) Thanks [@miguelg719](https://github.com/miguelg719)! - You can now use Computer Using Agents (CUA) natively in Stagehand for both Anthropic and OpenAI models! This unlocks a brand new frontier of applications for Stagehand users 🤘

- [#619](https://github.com/browserbase/stagehand/pull/619) [`7b0b996`](https://github.com/browserbase/stagehand/commit/7b0b9969a58014ae3e99b2054e4463b785073cfd) Thanks [@sameelarif](https://github.com/sameelarif)! - add disablePino flag to stagehand constructor params

- [#620](https://github.com/browserbase/stagehand/pull/620) [`566e587`](https://github.com/browserbase/stagehand/commit/566e5877a1861e0eae5a118d34efe09d43a37098) Thanks [@kamath](https://github.com/kamath)! - You can now pass in an OpenAI instance as an `llmClient` to the Stagehand constructor! This allows you to use Stagehand with any OpenAI-compatible model, like Ollama, Gemini, etc., as well as OpenAI wrappers like Braintrust.

- [#586](https://github.com/browserbase/stagehand/pull/586) [`c57dc19`](https://github.com/browserbase/stagehand/commit/c57dc19c448b8c2aab82953291f4e38f202c4729) Thanks [@sameelarif](https://github.com/sameelarif)! - Added native Stagehand agentic loop functionality. This allows you to build agentic workflows with a single prompt without using a computer-use model. To try it out, create a `stagehand.agent` without passing in a provider.

### Patch Changes

- [#580](https://github.com/browserbase/stagehand/pull/580) [`179e17c`](https://github.com/browserbase/stagehand/commit/179e17c2d1c9837de49c776d9850a330a759e73f) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - refactor \_performPlaywrightMethod

- [#608](https://github.com/browserbase/stagehand/pull/608) [`71ee10d`](https://github.com/browserbase/stagehand/commit/71ee10d50cb46e83d43fd783e1404569e6f317cf) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - added support for "scrolling to next/previous chunk"

- [#594](https://github.com/browserbase/stagehand/pull/594) [`e483484`](https://github.com/browserbase/stagehand/commit/e48348412a6e651967ba22d097d5308af0e8d0a8) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - pass observeHandler into actHandler

- [#569](https://github.com/browserbase/stagehand/pull/569) [`17e8b40`](https://github.com/browserbase/stagehand/commit/17e8b40f94b30f6e253443a4bbb8a3e364e58e38) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - you can now call stagehand.metrics to get token usage metrics. you can also set logInferenceToFile in stagehand config to log the entire call/response history from stagehand & the LLM.

- [#617](https://github.com/browserbase/stagehand/pull/617) [`affa564`](https://github.com/browserbase/stagehand/commit/affa5646658399ab71ed08c1b9ce0fd776b46fca) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - use a11y tree for default extract

- [#589](https://github.com/browserbase/stagehand/pull/589) [`0c4b1e7`](https://github.com/browserbase/stagehand/commit/0c4b1e7e6ff4b8a60af4a2d0d2056bff847227d5) Thanks [@miguelg719](https://github.com/miguelg719)! - Added CDP support for screenshots, find more about the benefits here: https://docs.browserbase.com/features/screenshots#why-use-cdp-for-screenshots%3F

- [#584](https://github.com/browserbase/stagehand/pull/584) [`c7c1a80`](https://github.com/browserbase/stagehand/commit/c7c1a8066be33188ba1e900828045db61410025c) Thanks [@miguelg719](https://github.com/miguelg719)! - Fix to remove unnecessary healthcheck ping on sdk

- [#616](https://github.com/browserbase/stagehand/pull/616) [`2a27e1c`](https://github.com/browserbase/stagehand/commit/2a27e1c8e967befbbbb05ea71369878ac1573658) Thanks [@miguelg719](https://github.com/miguelg719)! - Fixed new opened tab handling for CUA models

- [#582](https://github.com/browserbase/stagehand/pull/582) [`dfd24e6`](https://github.com/browserbase/stagehand/commit/dfd24e638ef3723d3a8a3a33ff7942af0ac4745f) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - support api usage for extract with no args

- [#563](https://github.com/browserbase/stagehand/pull/563) [`98166d7`](https://github.com/browserbase/stagehand/commit/98166d76d30bc67d6b04b3d5c39f78f92c254b49) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - support scrolling in `act`

- [#598](https://github.com/browserbase/stagehand/pull/598) [`53889d4`](https://github.com/browserbase/stagehand/commit/53889d4b6e772098beaba2e1ee5a24e6f07706bb) Thanks [@miguelg719](https://github.com/miguelg719)! - Fix the open operator handler to work with anthropic

- [#605](https://github.com/browserbase/stagehand/pull/605) [`b8beaec`](https://github.com/browserbase/stagehand/commit/b8beaec451a03eaa5d12281fe7c8d4eb9c9d7e81) Thanks [@sameelarif](https://github.com/sameelarif)! - Added support for resuming a Stagehand session created on the API.

- [#612](https://github.com/browserbase/stagehand/pull/612) [`cd36068`](https://github.com/browserbase/stagehand/commit/cd3606854c465747c78b44763469dfdfa16db1b0) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - remove all logic related to dom based act

- [#577](https://github.com/browserbase/stagehand/pull/577) [`4fdbf63`](https://github.com/browserbase/stagehand/commit/4fdbf6324a0dc68568bba73ea4d9018b2ed67849) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - remove debugDom

- [#603](https://github.com/browserbase/stagehand/pull/603) [`2a14a60`](https://github.com/browserbase/stagehand/commit/2a14a607f3e7fa3ca9a02670afdc7e60ccfbfb3f) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - rm unused handlePossiblePageNavigation

- [#614](https://github.com/browserbase/stagehand/pull/614) [`a59eaef`](https://github.com/browserbase/stagehand/commit/a59eaef67c2f4a0cb07bb0046fe7e93e2ba4dc41) Thanks [@kamath](https://github.com/kamath)! - override whatwg-url to avoid punycode warning

- [#573](https://github.com/browserbase/stagehand/pull/573) [`c24f3c9`](https://github.com/browserbase/stagehand/commit/c24f3c9a58873c3920fab0f9891c2bf5245c9b5e) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - return act result in actFromObserve

## 1.14.0

### Minor Changes

- [#518](https://github.com/browserbase/stagehand/pull/518) [`516725f`](https://github.com/browserbase/stagehand/commit/516725fc1c5d12d22caac0078a118c77bfe033a8) Thanks [@sameelarif](https://github.com/sameelarif)! - `act()` can now use `observe()` under the hood, resulting in significant performance improvements. To opt-in to this change, set `slowDomBasedAct: false` in `ActOptions`.

- [#483](https://github.com/browserbase/stagehand/pull/483) [`8c9445f`](https://github.com/browserbase/stagehand/commit/8c9445fde9724ae33eeeb1234fd5b9bbd418bfdb) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - When using `textExtract`, you can now do targeted extraction by passing an xpath string into extract via the `selector` parameter. This limits the dom processing step to a target element, reducing tokens and increasing speed. For example:

  ```typescript
  const weatherData = await stagehand.page.extract({
    instruction: "extract the weather data for Sun, Feb 23 at 11PM",
    schema: z.object({
      temperature: z.string(),
      weather_description: z.string(),
      wind: z.string(),
      humidity: z.string(),
      barometer: z.string(),
      visibility: z.string(),
    }),
    modelName,
    useTextExtract,
    selector: xpath, // xpath of the element to extract from
  });
  ```

- [#556](https://github.com/browserbase/stagehand/pull/556) [`499a72d`](https://github.com/browserbase/stagehand/commit/499a72dc56009791ce065270b854b12fc5570050) Thanks [@kamath](https://github.com/kamath)! - You can now set a timeout for dom-based stagehand act! Do this in `act` with `timeoutMs` as a parameter, or set a global param to `actTimeoutMs` in Stagehand config.

- [#544](https://github.com/browserbase/stagehand/pull/544) [`55c9673`](https://github.com/browserbase/stagehand/commit/55c9673c5948743b804d70646f425a61818c7789) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - you can now deterministically get the full text representation of a webpage by calling `extract()` (with no arguments)

- [#538](https://github.com/browserbase/stagehand/pull/538) [`d898d5b`](https://github.com/browserbase/stagehand/commit/d898d5b9e1c3b80e62e72d36d1754b3e50d5a2b4) Thanks [@sameelarif](https://github.com/sameelarif)! - Added `gpt-4.5-preview` and `claude-3-7-sonnet-latest` as supported models.

- [#523](https://github.com/browserbase/stagehand/pull/523) [`44cf7cc`](https://github.com/browserbase/stagehand/commit/44cf7cc9ac1209c97d9153281970899b10a2ddc9) Thanks [@kwt00](https://github.com/kwt00)! - You can now natively run Cerebras LLMs! `cerebras-llama-3.3-70b` and `cerebras-llama-3.1-8b` are now supported models as long as `CEREBRAS_API_KEY` is set in your environment.

- [#542](https://github.com/browserbase/stagehand/pull/542) [`cf7fe66`](https://github.com/browserbase/stagehand/commit/cf7fe665e6d1eeda97582ee2816f1dc3a66c6152) Thanks [@sankalpgunturi](https://github.com/sankalpgunturi)! - You can now natively run Groq LLMs! `groq-llama-3.3-70b-versatile` and `groq-llama-3.3-70b-specdec` are now supported models as long as `GROQ_API_KEY` is set in your environment.

### Patch Changes

- [#506](https://github.com/browserbase/stagehand/pull/506) [`e521645`](https://github.com/browserbase/stagehand/commit/e5216455ce3fc2a4f4f7aa5614ecc92354eb670c) Thanks [@miguelg719](https://github.com/miguelg719)! - fixing 5s timeout on actHandler

- [#535](https://github.com/browserbase/stagehand/pull/535) [`3782054`](https://github.com/browserbase/stagehand/commit/3782054734dcd0346f84003ddd8e0e484b379459) Thanks [@miguelg719](https://github.com/miguelg719)! - Adding backwards compatibility to new act->observe pipeline by accepting actOptions

- [#508](https://github.com/browserbase/stagehand/pull/508) [`270f666`](https://github.com/browserbase/stagehand/commit/270f6669f1638f52fd5cd3f133f76446ced6ef9f) Thanks [@miguelg719](https://github.com/miguelg719)! - Fixed stagehand to support multiple pages with an enhanced context

- [#559](https://github.com/browserbase/stagehand/pull/559) [`18533ad`](https://github.com/browserbase/stagehand/commit/18533ad824722e4e699323248297e184bae9254e) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - fix: continuously adjusting chunk size inside `act`

- [#554](https://github.com/browserbase/stagehand/pull/554) [`5f1868b`](https://github.com/browserbase/stagehand/commit/5f1868bd95478b3eb517319ebca7b0af4e91d144) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - fix targeted extract issue with scrollintoview and not chunking correctly

- [#555](https://github.com/browserbase/stagehand/pull/555) [`fc5e8b6`](https://github.com/browserbase/stagehand/commit/fc5e8b6c5a606da96e6ed572dc8ffc6caef57576) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - fix issue where processAllOfDom doesn't scroll to end of page when there is dynamic content

- [#552](https://github.com/browserbase/stagehand/pull/552) [`a25a4cb`](https://github.com/browserbase/stagehand/commit/a25a4cb538d64f50b5bd834dd88e8e6086a73078) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - accept xpaths with 'xpath=' prepended to the front in addition to xpaths without

- [#534](https://github.com/browserbase/stagehand/pull/534) [`f0c162a`](https://github.com/browserbase/stagehand/commit/f0c162a6b4d1ac72c42f26462d7241a08b5c4e0a) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - call this.end() if the process exists

- [#528](https://github.com/browserbase/stagehand/pull/528) [`c820bfc`](https://github.com/browserbase/stagehand/commit/c820bfcfc9571fea90afd1595775c5946118cfaf) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - handle attempt to close session that has already been closed when using the api

- [#520](https://github.com/browserbase/stagehand/pull/520) [`f49eebd`](https://github.com/browserbase/stagehand/commit/f49eebd98c1d61413a3ea4c798595db601d55da8) Thanks [@miguelg719](https://github.com/miguelg719)! - Performing act from a 'not-supported' ObserveResult will now throw an informed error

## 1.13.1

### Patch Changes

- [#509](https://github.com/browserbase/stagehand/pull/509) [`a7d345e`](https://github.com/browserbase/stagehand/commit/a7d345e75434aebb656e1aa5aa61caed00dc99a8) Thanks [@miguelg719](https://github.com/miguelg719)! - Bun runs will now throw a more informed error

## 1.13.0

### Minor Changes

- [#486](https://github.com/browserbase/stagehand/pull/486) [`33f2b3f`](https://github.com/browserbase/stagehand/commit/33f2b3f8deff86ac2073b6d35b7413b0aeaba2f9) Thanks [@sameelarif](https://github.com/sameelarif)! - [Unreleased] Parameterized offloading Stagehand method calls to the Stagehand API. In the future, this will allow for better observability and debugging experience.

- [#494](https://github.com/browserbase/stagehand/pull/494) [`9ba4b0b`](https://github.com/browserbase/stagehand/commit/9ba4b0b563cbc77d40cac31c11e17e365a9d1749) Thanks [@pkiv](https://github.com/pkiv)! - Added LocalBrowserLaunchOptions to provide comprehensive configuration options for local browser instances. Deprecated the top-level headless option in favor of using localBrowserLaunchOptions.headless

- [#500](https://github.com/browserbase/stagehand/pull/500) [`a683fab`](https://github.com/browserbase/stagehand/commit/a683fab9ca90c45d78f6602a228c2d3219b776dc) Thanks [@miguelg719](https://github.com/miguelg719)! - Including Iframes in ObserveResults. This appends any iframe(s) found in the page to the end of observe results on any observe call.

- [#504](https://github.com/browserbase/stagehand/pull/504) [`577662e`](https://github.com/browserbase/stagehand/commit/577662e985a6a6b0477815853d98610f3a6b567d) Thanks [@sameelarif](https://github.com/sameelarif)! - Enabled support for Browserbase captcha solving after page navigations. This can be enabled with the new constructor parameter: `waitForCaptchaSolves`.

- [#496](https://github.com/browserbase/stagehand/pull/496) [`28ca9fb`](https://github.com/browserbase/stagehand/commit/28ca9fbc6f3cdc88437001108a9a6c4388ba0303) Thanks [@sameelarif](https://github.com/sameelarif)! - Fixed browserbaseSessionCreateParams not being passed in to the API initialization payload.

### Patch Changes

- [#459](https://github.com/browserbase/stagehand/pull/459) [`62a29ee`](https://github.com/browserbase/stagehand/commit/62a29eea982bbb855e2f885c09ac4c1334f3e0dc) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - create a11y + dom hybrid input for observe

- [#463](https://github.com/browserbase/stagehand/pull/463) [`e40bf6f`](https://github.com/browserbase/stagehand/commit/e40bf6f517331fc9952c3c9f2683b7e02ffb9735) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - include 'Scrollable' annotations in a11y-dom hybrid

- [#480](https://github.com/browserbase/stagehand/pull/480) [`4c07c44`](https://github.com/browserbase/stagehand/commit/4c07c444f0e71faf54413b2eeab760c7916a36e3) Thanks [@miguelg719](https://github.com/miguelg719)! - Adding a fallback try on actFromObserveResult to use the description from observe and call regular act.

- [#487](https://github.com/browserbase/stagehand/pull/487) [`2c855cf`](https://github.com/browserbase/stagehand/commit/2c855cffdfa2b0af9924612b9c59df7b65df6443) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - update refine extraction prompt to ensure correct schema is used

- [#497](https://github.com/browserbase/stagehand/pull/497) [`945ed04`](https://github.com/browserbase/stagehand/commit/945ed0426d34d2cb833aec8ba67bd4cba6c3b660) Thanks [@kamath](https://github.com/kamath)! - add gpt 4o november snapshot

## 1.12.0

### Minor Changes

- [#426](https://github.com/browserbase/stagehand/pull/426) [`bbbcee7`](https://github.com/browserbase/stagehand/commit/bbbcee7e7d86f5bf90cbb93f2ac9ad5935f15896) Thanks [@miguelg719](https://github.com/miguelg719)! - Observe got a major upgrade. Now it will return a suggested playwright method with any necessary arguments for the generated candidate elements. It also includes a major speedup when using a11y tree processing for context.

- [#452](https://github.com/browserbase/stagehand/pull/452) [`16837ec`](https://github.com/browserbase/stagehand/commit/16837ece839e192fbf7b68bec128dd02f22c2613) Thanks [@kamath](https://github.com/kamath)! - add o3-mini to availablemodel

- [#441](https://github.com/browserbase/stagehand/pull/441) [`1032d7d`](https://github.com/browserbase/stagehand/commit/1032d7d7d9c1ef8f30183c9019ea8324f1bdd5c6) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - allow act to accept observe output

### Patch Changes

- [#458](https://github.com/browserbase/stagehand/pull/458) [`da2e5d1`](https://github.com/browserbase/stagehand/commit/da2e5d1314b7504877fd50090e6a4b47f44fb9f6) Thanks [@miguelg719](https://github.com/miguelg719)! - Updated getAccessibilityTree() to make sure it doesn't skip useful nodes. Improved getXPathByResolvedObjectId() to account for text nodes and not skip generation

- [#448](https://github.com/browserbase/stagehand/pull/448) [`b216072`](https://github.com/browserbase/stagehand/commit/b2160723923ed78eba83e75c7270634ca7d217de) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - improve handling of radio button clicks

- [#445](https://github.com/browserbase/stagehand/pull/445) [`5bc514f`](https://github.com/browserbase/stagehand/commit/5bc514fc18e6634b1c81553bbc1e8b7d71b67d34) Thanks [@miguelg719](https://github.com/miguelg719)! - Adding back useAccessibilityTree param to observe with a deprecation warning/error indicating to use onlyVisible instead

## 1.11.0

### Minor Changes

- [#428](https://github.com/browserbase/stagehand/pull/428) [`5efeb5a`](https://github.com/browserbase/stagehand/commit/5efeb5ad44852efe7b260862729a5ac74eaa0228) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - temporarily remove vision

## 1.10.1

### Patch Changes

- [#422](https://github.com/browserbase/stagehand/pull/422) [`a2878d0`](https://github.com/browserbase/stagehand/commit/a2878d0acaf393b37763fb0c07b1a24043f7eb8d) Thanks [@miguelg719](https://github.com/miguelg719)! - Fixing a build type error for async functions being called inside evaluate for observeHandler.

## 1.10.0

### Minor Changes

- [#412](https://github.com/browserbase/stagehand/pull/412) [`4aa4813`](https://github.com/browserbase/stagehand/commit/4aa4813ad62cefc333a04ea6b1004f5888dec70f) Thanks [@miguelg719](https://github.com/miguelg719)! - Includes a new format to get website context using accessibility (a11y) trees. The new context is provided optionally with the flag useAccessibilityTree for observe tasks.

- [#417](https://github.com/browserbase/stagehand/pull/417) [`1f2b2c5`](https://github.com/browserbase/stagehand/commit/1f2b2c57d93e3b276c61224e1e26c65c2cb50e12) Thanks [@sameelarif](https://github.com/sameelarif)! - Simplify Stagehand method calls by allowing a simple string input instead of an options object.

- [#405](https://github.com/browserbase/stagehand/pull/405) [`0df1e23`](https://github.com/browserbase/stagehand/commit/0df1e233d4ad4ba39da457b6ed85916d8d20e12e) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - in ProcessAllOfDom, scroll on large scrollable elements instead of just the root DOM

- [#373](https://github.com/browserbase/stagehand/pull/373) [`ff00965`](https://github.com/browserbase/stagehand/commit/ff00965160d568ae0bc3ca437c01f95b5c6e9039) Thanks [@sameelarif](https://github.com/sameelarif)! - Allow the input of custom instructions into the constructor so that users can guide, or provide guardrails to, the LLM in making decisions.

### Patch Changes

- [#386](https://github.com/browserbase/stagehand/pull/386) [`2cee0a4`](https://github.com/browserbase/stagehand/commit/2cee0a45ae2b48d1de6543b196e338e7021e59fe) Thanks [@kamath](https://github.com/kamath)! - add demo gif

- [#362](https://github.com/browserbase/stagehand/pull/362) [`9c20de3`](https://github.com/browserbase/stagehand/commit/9c20de3e66f0ac20374d5e5e02eb107c620a2263) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - reduce collisions and improve accuracy of textExtract

- [#413](https://github.com/browserbase/stagehand/pull/413) [`737b4b2`](https://github.com/browserbase/stagehand/commit/737b4b208c9214e8bb22535ab7a8daccf37610d9) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - remove topMostElement check when verifying visibility of text nodes

- [#388](https://github.com/browserbase/stagehand/pull/388) [`e93561d`](https://github.com/browserbase/stagehand/commit/e93561d7875210ce7bd7fe841fb52decf6011fb3) Thanks [@kamath](https://github.com/kamath)! - Export LLMClient type

## 1.9.0

### Minor Changes

- [#374](https://github.com/browserbase/stagehand/pull/374) [`207244e`](https://github.com/browserbase/stagehand/commit/207244e3a46c4474d4d28db039eab131164790ca) Thanks [@sameelarif](https://github.com/sameelarif)! - Pass in a Stagehand Page object into the `on("popup")` listener to allow for multi-page handling.

- [#367](https://github.com/browserbase/stagehand/pull/367) [`75c0e20`](https://github.com/browserbase/stagehand/commit/75c0e20cde54951399753e0fa841df463e1271b8) Thanks [@kamath](https://github.com/kamath)! - Logger in LLMClient is inherited by default from Stagehand. Named rather than positional arguments are used in implemented LLMClients.

- [#381](https://github.com/browserbase/stagehand/pull/381) [`db2ef59`](https://github.com/browserbase/stagehand/commit/db2ef5997664e81b1dfb5ca992392362f2d3bab1) Thanks [@kamath](https://github.com/kamath)! - make logs only sync

- [#385](https://github.com/browserbase/stagehand/pull/385) [`5899ec2`](https://github.com/browserbase/stagehand/commit/5899ec2c4b73c636bfd8120ec3aac225af7dd949) Thanks [@sameelarif](https://github.com/sameelarif)! - Moved the LLMClient logger parameter to the createChatCompletion method options.

- [#364](https://github.com/browserbase/stagehand/pull/364) [`08907eb`](https://github.com/browserbase/stagehand/commit/08907ebbc2cb47cfc3151946764656a7f4ce99c6) Thanks [@kamath](https://github.com/kamath)! - exposed llmClient in stagehand constructor

### Patch Changes

- [#383](https://github.com/browserbase/stagehand/pull/383) [`a77efcc`](https://github.com/browserbase/stagehand/commit/a77efccfde3a3948013eda3a52935e8a21d45b3e) Thanks [@sameelarif](https://github.com/sameelarif)! - Unified LLM input/output types for reduced dependence on OpenAI types

- [`b7b3701`](https://github.com/browserbase/stagehand/commit/b7b370160bf35b09f5dc132f6e86f6e34fb70a85) Thanks [@kamath](https://github.com/kamath)! - Fix $1-types exposed to the user

- [#353](https://github.com/browserbase/stagehand/pull/353) [`5c6f14b`](https://github.com/browserbase/stagehand/commit/5c6f14bade201e08cb86d2e14e246cb65707f7ee) Thanks [@kamath](https://github.com/kamath)! - Throw custom error if context is referenced without initialization, remove act/extract handler from index

- [#360](https://github.com/browserbase/stagehand/pull/360) [`89841fc`](https://github.com/browserbase/stagehand/commit/89841fc42ae82559baddfe2a9593bc3260c082a2) Thanks [@kamath](https://github.com/kamath)! - Remove stagehand nav entirely

- [#379](https://github.com/browserbase/stagehand/pull/379) [`b1c6579`](https://github.com/browserbase/stagehand/commit/b1c657976847de86d82324030f90c2f6a1f3f976) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - don't require LLM Client to use non-ai stagehand functions

- [#371](https://github.com/browserbase/stagehand/pull/371) [`30e7d09`](https://github.com/browserbase/stagehand/commit/30e7d091445004c71aec1748d3a7d75fb86d1f11) Thanks [@kamath](https://github.com/kamath)! - pretty readme :)

- [#382](https://github.com/browserbase/stagehand/pull/382) [`a41271b`](https://github.com/browserbase/stagehand/commit/a41271baf351e20f4c79b4b654d8a947b615a121) Thanks [@sameelarif](https://github.com/sameelarif)! - Added example implementation of the Vercel AI SDK as an LLMClient

- [#344](https://github.com/browserbase/stagehand/pull/344) [`c1cf345`](https://github.com/browserbase/stagehand/commit/c1cf34535ed30262989b1dbe262fb0414cdf8230) Thanks [@kamath](https://github.com/kamath)! - Remove duplicate logging and expose Page/BrowserContext types

## 1.8.0

### Minor Changes

- [#324](https://github.com/browserbase/stagehand/pull/324) [`cd23fa3`](https://github.com/browserbase/stagehand/commit/cd23fa33450107f29cb1ddb6edadfc769d336aa5) Thanks [@kamath](https://github.com/kamath)! - Move stagehand.act() -> stagehand.page.act() and deprecate stagehand.act()

- [#319](https://github.com/browserbase/stagehand/pull/319) [`bacbe60`](https://github.com/browserbase/stagehand/commit/bacbe608058304bfa1f0ab049da4d8aa90e8d6f7) Thanks [@kamath](https://github.com/kamath)! - We now wrap playwright page/context within StagehandPage and StagehandContext objects. This helps us augment the Stagehand experience by being able to augment the underlying Playwright

- [#324](https://github.com/browserbase/stagehand/pull/324) [`cd23fa3`](https://github.com/browserbase/stagehand/commit/cd23fa33450107f29cb1ddb6edadfc769d336aa5) Thanks [@kamath](https://github.com/kamath)! - moves extract and act -> page and deprecates stagehand.extract and stagehand.observe

### Patch Changes

- [#320](https://github.com/browserbase/stagehand/pull/320) [`c0cdd0e`](https://github.com/browserbase/stagehand/commit/c0cdd0e985d66f0464d2e70b7d0cb343b0efbd3f) Thanks [@kamath](https://github.com/kamath)! - bug fix: set this.env to LOCAL if BROWSERBASE_API_KEY is not defined

- [#325](https://github.com/browserbase/stagehand/pull/325) [`cc46f34`](https://github.com/browserbase/stagehand/commit/cc46f345c0a1dc0af4abae7e207833df17da50e7) Thanks [@pkiv](https://github.com/pkiv)! - only start domdebug if enabled

## 1.7.0

### Minor Changes

- [#316](https://github.com/browserbase/stagehand/pull/316) [`902e633`](https://github.com/browserbase/stagehand/commit/902e633e126a58b80b757ea0ecada01a7675a473) Thanks [@kamath](https://github.com/kamath)! - rename browserbaseResumeSessionID -> browserbaseSessionID

- [#296](https://github.com/browserbase/stagehand/pull/296) [`f11da27`](https://github.com/browserbase/stagehand/commit/f11da27a20409c240ceeea2003d520f676def61a) Thanks [@kamath](https://github.com/kamath)! - - Deprecate fields in `init` in favor of constructor options

  - Deprecate `initFromPage` in favor of `browserbaseResumeSessionID` in constructor
  - Rename `browserBaseSessionCreateParams` -> `browserbaseSessionCreateParams`

- [#304](https://github.com/browserbase/stagehand/pull/304) [`0b72f75`](https://github.com/browserbase/stagehand/commit/0b72f75f6a62aaeb28b0c488ae96db098d6a2846) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - add textExtract: an optional, text based approach to the existing extract method. textExtract often performs better on long form extraction tasks. By default `extract` uses the existing approach `domExtract`.

- [#298](https://github.com/browserbase/stagehand/pull/298) [`55f0cd2`](https://github.com/browserbase/stagehand/commit/55f0cd2fe7976e800833ec6e41e9af62d88d09d5) Thanks [@kamath](https://github.com/kamath)! - Add sessionId to public params

### Patch Changes

- [#283](https://github.com/browserbase/stagehand/pull/283) [`b902192`](https://github.com/browserbase/stagehand/commit/b902192bc7ff8eb02c85150c1fe6f89c2a95b211) Thanks [@sameelarif](https://github.com/sameelarif)! - allowed customization of eval config via .env

- [#299](https://github.com/browserbase/stagehand/pull/299) [`fbe2300`](https://github.com/browserbase/stagehand/commit/fbe23007176488043c2415519f25021612fff989) Thanks [@sameelarif](https://github.com/sameelarif)! - log playwright actions for better debugging

## 1.6.0

### Minor Changes

- [#286](https://github.com/browserbase/stagehand/pull/286) [`9605836`](https://github.com/browserbase/stagehand/commit/9605836ee6b8207ed7dc9146e12ced1c78630d59) Thanks [@kamath](https://github.com/kamath)! - minor improvement in action + new eval case

- [#279](https://github.com/browserbase/stagehand/pull/279) [`d6d7057`](https://github.com/browserbase/stagehand/commit/d6d70570623a718354797ef83aa8489eacc085d1) Thanks [@kamath](https://github.com/kamath)! - Add support for o1-mini and o1-preview in OpenAIClient

- [#282](https://github.com/browserbase/stagehand/pull/282) [`5291797`](https://github.com/browserbase/stagehand/commit/529179724a53bf2fd578a4012fd6bc6b7348d1ae) Thanks [@kamath](https://github.com/kamath)! - Added eslint for stricter type checking. Streamlined most of the internal types throughout the cache, llm, and handlers. This should make it easier to add new LLMs down the line, maintain and update the existing code, and make it easier to add new features in the future. Types can be checked by running `npx eslint .` from the project directory.

### Patch Changes

- [#270](https://github.com/browserbase/stagehand/pull/270) [`6b10b3b`](https://github.com/browserbase/stagehand/commit/6b10b3b1160649b19f50d66588395ceb679b3d68) Thanks [@sameelarif](https://github.com/sameelarif)! - add close link to readme

- [#288](https://github.com/browserbase/stagehand/pull/288) [`5afa0b9`](https://github.com/browserbase/stagehand/commit/5afa0b940a9f379a3719a5bbae249dd2a9ef8380) Thanks [@kamath](https://github.com/kamath)! - add multi-region support for browserbase

- [#284](https://github.com/browserbase/stagehand/pull/284) [`474217c`](https://github.com/browserbase/stagehand/commit/474217cfaff8e68614212b66baa62d35493fd2ce) Thanks [@kamath](https://github.com/kamath)! - Build wasn't working, this addresses tsc failure.

- [#236](https://github.com/browserbase/stagehand/pull/236) [`85483fe`](https://github.com/browserbase/stagehand/commit/85483fe091544fc079015c62b6923b03f8b9caa7) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - reduce chunk size

## 1.5.0

### Minor Changes

- [#266](https://github.com/browserbase/stagehand/pull/266) [`0e8f34f`](https://github.com/browserbase/stagehand/commit/0e8f34fc15aee91c548d09534deaccc8adca7c4d) Thanks [@kamath](https://github.com/kamath)! - Install wasn't working from NPM due to misconfigured build step. This attempts to fix that.

## 1.4.0

### Minor Changes

- [#253](https://github.com/browserbase/stagehand/pull/253) [`598cae2`](https://github.com/browserbase/stagehand/commit/598cae230c7b8d4e31ae22fd63047a91b63e51b8) Thanks [@sameelarif](https://github.com/sameelarif)! - clean up contexts after use

### Patch Changes

- [#225](https://github.com/browserbase/stagehand/pull/225) [`a2366fe`](https://github.com/browserbase/stagehand/commit/a2366feb023180fbb2ccc7a8379692f9f8347fe5) Thanks [@sameelarif](https://github.com/sameelarif)! - Ensuring cross-platform compatibility with tmp directories

- [#249](https://github.com/browserbase/stagehand/pull/249) [`7d06d43`](https://github.com/browserbase/stagehand/commit/7d06d43f2b9a477fed35793d7479de9b183e8d53) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - fix broken evals

- [#227](https://github.com/browserbase/stagehand/pull/227) [`647eefd`](https://github.com/browserbase/stagehand/commit/647eefd651852eec495faa1b8f4dbe6b1da17999) Thanks [@kamath](https://github.com/kamath)! - Fix debugDom still showing chunks when set to false

- [#250](https://github.com/browserbase/stagehand/pull/250) [`5886620`](https://github.com/browserbase/stagehand/commit/5886620dd1b0a57c68bf810cf130df2ca0a50a69) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - add ci specific evals

- [#222](https://github.com/browserbase/stagehand/pull/222) [`8dff026`](https://github.com/browserbase/stagehand/commit/8dff02674df7a6448f2262c7e212b58c03be57bc) Thanks [@sameelarif](https://github.com/sameelarif)! - Streamline type definitions and fix existing typescript errors

- [#232](https://github.com/browserbase/stagehand/pull/232) [`b9f9949`](https://github.com/browserbase/stagehand/commit/b9f99494021e6a9e2487b77bb64ed0a491751400) Thanks [@kamath](https://github.com/kamath)! - Minor changes to package.json and tsconfig, mainly around the build process. Also add more type defs and remove unused dependencies.

## 1.3.0

### Minor Changes

- [#195](https://github.com/browserbase/stagehand/pull/195) [`87a6305`](https://github.com/browserbase/stagehand/commit/87a6305d9a2faf1ab5915965913bc14d5cc15772) Thanks [@kamath](https://github.com/kamath)! - - Adds structured and more standardized JSON logging
  - Doesn't init cache if `enableCaching` is false, preventing `tmp/.cache` from being created
  - Updates bundling for browser-side code to support NextJS and serverless

## 1.2.0

### Minor Changes

- [#179](https://github.com/browserbase/stagehand/pull/179) [`0031871`](https://github.com/browserbase/stagehand/commit/0031871d5a6d6180f272a68b88a8634e5a991785) Thanks [@navidkpr](https://github.com/navidkpr)! - Fixes:

  The last big change we pushed out introduced a small regression. As a result, the gray outline showing the elements Stagehand is looking at is missing. This commit fixes that. We now process selectorMap properly (using the updated type `Record<number, string[]>`).

  Improved the action prompt:

  Improved the structure
  Made it more straightforward
  Improved wording for completed arg and prioritized precision over recall

## 1.1.0

### Minor Changes

- [`9206ec6`](https://github.com/browserbase/stagehand/commit/9206ec640b2d0af9170f0a31788ab1eac448357b) Thanks [@kamath](https://github.com/kamath)! - Connect to a minor session


================================================
FILE: LICENSE
================================================
MIT License

Copyright (c) 2024 Browserbase Inc.

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the "Software"), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.


================================================
FILE: README.md
================================================
<div id="toc" align="center" style="margin-bottom: 0;">
  <ul style="list-style: none; margin: 0; padding: 0;">
    <a href="https://stagehand.dev">
      <picture>
        <source media="(prefers-color-scheme: dark)" srcset="media/dark_logo.png" />
        <img alt="Stagehand" src="media/light_logo.png" width="200" style="margin-right: 30px;" />
      </picture>
    </a>
  </ul>
</div>
<p align="center">
  <strong>The AI Browser Automation Framework</strong><br>
  <a href="https://docs.stagehand.dev">Read the Docs</a>
</p>

<p align="center">
  <a href="https://github.com/browserbase/stagehand/tree/main?tab=MIT-1-ov-file#MIT-1-ov-file">
    <picture>
      <source media="(prefers-color-scheme: dark)" srcset="media/dark_license.svg" />
      <img alt="MIT License" src="media/light_license.svg" />
    </picture>
  </a>
  <a href="https://stagehand.dev/discord">
    <picture>
      <source media="(prefers-color-scheme: dark)" srcset="media/dark_discord.svg" />
      <img alt="Discord Community" src="media/light_discord.svg" />
    </picture>
  </a>
</p>

<p align="center">
	<a href="https://trendshift.io/repositories/12122" target="_blank"><img src="https://trendshift.io/api/badge/repositories/12122" alt="browserbase%2Fstagehand | Trendshift" style="width: 250px; height: 55px;" width="250" height="55"/></a>
</p>

<p align="center">
  <a href="https://deepwiki.com/browserbase/stagehand">
    <img alt="Ask DeepWiki" src="https://deepwiki.com/badge.svg" />
  </a>
</p>

<p align="center">
If you're looking for the Python implementation, you can find it 
<a href="https://github.com/browserbase/stagehand-python"> here</a>
</p>

<div align="center" style="display: flex; align-items: center; justify-content: center; gap: 4px; margin-bottom: 0;">
  <b>Vibe code</b>
  <span style="font-size: 1.05em;"> Stagehand with </span>
  <a href="https://director.ai" style="display: flex; align-items: center;">
    <span>Director</span>
  </a>
  <span> </span>
  <picture>
    <img alt="Director" src="media/director_icon.svg" width="25" />
  </picture>
</div>

## What is Stagehand?

Stagehand is a browser automation framework used to control web browsers with natural language and code. By combining the power of AI with the precision of code, Stagehand makes web automation flexible, maintainable, and actually reliable.

## Why Stagehand?

Most existing browser automation tools either require you to write low-level code in a framework like Selenium, Playwright, or Puppeteer, or use high-level agents that can be unpredictable in production. By letting developers choose what to write in code vs. natural language (and bridging the gap between the two), Stagehand is the natural choice for browser automations in production.

1. **Choose when to write code vs. natural language**: use AI when you want to navigate unfamiliar pages, and use code when you know exactly what you want to do.

2. **Go from AI-driven to repeatable workflows**: Stagehand lets you preview AI actions before running them, and also helps you easily cache repeatable actions to save time and tokens.

3. **Write once, run forever**: Stagehand's auto-caching combined with self-healing remembers previous actions, runs without LLM inference, and knows when to involve AI whenever the website changes and your automation breaks. 

## Getting Started

Start with Stagehand with one line of code, or check out our [Quickstart Guide](https://docs.stagehand.dev/v3/first-steps/quickstart) for more information:

```bash
npx create-browser-app
```

## Example

Here's how to build a sample browser automation with Stagehand:

```typescript
// Stagehand's CDP engine provides an optimized, low level interface to the browser built for automation
const page = stagehand.context.pages()[0];
await page.goto("https://github.com/browserbase");

// Use act() to execute individual actions
await stagehand.act("click on the stagehand repo");

// Use agent() for multi-step tasks
const agent = stagehand.agent();
await agent.execute("Get to the latest PR");

// Use extract() to get structured data from the page
const { author, title } = await stagehand.extract(
  "extract the author and title of the PR",
  z.object({
    author: z.string().describe("The username of the PR author"),
    title: z.string().describe("The title of the PR"),
  }),
);
```

## Documentation

Visit [docs.stagehand.dev](https://docs.stagehand.dev) to view the full documentation.


### Build and Run from Source

```bash
git clone https://github.com/browserbase/stagehand.git
cd stagehand
pnpm install
pnpm run build
pnpm run example # run the blank script at ./packages/core/examples/example.ts
```

Stagehand works best when you have an API key for an LLM provider and Browserbase credentials. To add these to your project, run:

```bash
cp .env.example .env
nano .env # Edit the .env file to add API keys
```

### Installing from a branch

You can install and build Stagehand directly from a GitHub branch using [gitpkg](https://github.com/EqualMa/gitpkg).

In your project's `package.json` set:
```json
"@browserbasehq/stagehand": "https://gitpkg.now.sh/browserbase/stagehand/packages/core?<branchName>",
```


## Contributing

> [!NOTE]
> We highly value contributions to Stagehand! For questions or support, please join our [Discord community](https://stagehand.dev/discord).

At a high level, we're focused on improving reliability, extensibility, speed, and cost in that order of priority. If you're interested in contributing, **bug fixes and small improvements are the best way to get started**. For more involved features, we strongly recommend reaching out to [Miguel Gonzalez](https://x.com/miguel_gonzf) or [Paul Klein](https://x.com/pk_iv) in our [Discord community](https://stagehand.dev/discord) before starting to ensure that your contribution aligns with our goals.

<!-- For more information, please see our [Contributing Guide](https://docs.stagehand.dev/examples/contributing). -->

## Acknowledgements

We'd like to thank the following people for their major contributions to Stagehand:
- [Paul Klein](https://github.com/pkiv)
- [Sean McGuire](https://github.com/seanmcguire12)
- [Miguel Gonzalez](https://github.com/miguelg719)
- [Sameel Arif](https://github.com/sameelarif)
- [Thomas Katwan](https://github.com/tkattkat)
- [Filip Michalsky](https://github.com/filip-michalsky)
- [Anirudh Kamath](https://github.com/kamath)
- [Jeremy Press](https://x.com/jeremypress)
- [Navid Pour](https://github.com/navidpour)

## License

Licensed under the MIT License.

Copyright 2025 Browserbase, Inc.


================================================
FILE: claude.md
================================================
# Stagehand Project

This is a project that uses Stagehand V3, a browser automation framework with AI-powered `act`, `extract`, `observe`, and `agent` methods.

The main class can be imported as `Stagehand` from `@browserbasehq/stagehand`.

**Key Classes:**

- `Stagehand`: Main orchestrator class providing `act`, `extract`, `observe`, and `agent` methods
- `context`: A `V3Context` object that manages browser contexts and pages
- `page`: Individual page objects accessed via `stagehand.context.pages()[i]` or created with `stagehand.context.newPage()`

## Initialize

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "LOCAL", // or "BROWSERBASE"
  verbose: 2, // 0, 1, or 2
  model: "openai/gpt-4.1-mini", // or any supported model
});

await stagehand.init();

// Access the browser context and pages
const page = stagehand.context.pages()[0];
const context = stagehand.context;

// Create new pages if needed
const page2 = await stagehand.context.newPage();
```

## Act

Actions are called on the `stagehand` instance (not the page). Use atomic, specific instructions:

```typescript
// Act on the current active page
await stagehand.act("click the sign in button");

// Act on a specific page (when you need to target a page that isn't currently active)
await stagehand.act("click the sign in button", { page: page2 });
```

**Important:** Act instructions should be atomic and specific:

- ✅ Good: "Click the sign in button" or "Type 'hello' into the search input"
- ❌ Bad: "Order me pizza" or "Type in the search bar and hit enter" (multi-step)

### Observe + Act Pattern (Recommended)

Cache the results of `observe` to avoid unexpected DOM changes:

```typescript
const instruction = "Click the sign in button";

// Get candidate actions
const actions = await stagehand.observe(instruction);

// Execute the first action
await stagehand.act(actions[0]);
```

To target a specific page:

```typescript
const actions = await stagehand.observe("select blue as the favorite color", {
  page: page2,
});
await stagehand.act(actions[0], { page: page2 });
```

## Extract

Extract data from pages using natural language instructions. The `extract` method is called on the `stagehand` instance.

### Basic Extraction (with schema)

```typescript
import { z } from "zod";

// Extract with explicit schema
const data = await stagehand.extract(
  "extract all apartment listings with prices and addresses",
  z.object({
    listings: z.array(
      z.object({
        price: z.string(),
        address: z.string(),
      }),
    ),
  }),
);

console.log(data.listings);
```

### Simple Extraction (without schema)

```typescript
// Extract returns a default object with 'extraction' field
const result = await stagehand.extract("extract the sign in button text");

console.log(result);
// Output: { extraction: "Sign in" }

// Or destructure directly
const { extraction } = await stagehand.extract(
  "extract the sign in button text",
);
console.log(extraction); // "Sign in"
```

### Targeted Extraction

Extract data from a specific element using a selector:

```typescript
const reason = await stagehand.extract(
  "extract the reason why script injection fails",
  z.string(),
  { selector: "/html/body/div[2]/div[3]/iframe/html/body/p[2]" },
);
```

### URL Extraction

When extracting links or URLs, use `z.string().url()`:

```typescript
const { links } = await stagehand.extract(
  "extract all navigation links",
  z.object({
    links: z.array(z.string().url()),
  }),
);
```

### Extracting from a Specific Page

```typescript
// Extract from a specific page (when you need to target a page that isn't currently active)
const data = await stagehand.extract(
  "extract the placeholder text on the name field",
  { page: page2 },
);
```

## Observe

Plan actions before executing them. Returns an array of candidate actions:

```typescript
// Get candidate actions on the current active page
const [action] = await stagehand.observe("Click the sign in button");

// Execute the action
await stagehand.act(action);
```

Observing on a specific page:

```typescript
// Target a specific page (when you need to target a page that isn't currently active)
const actions = await stagehand.observe("find the next page button", {
  page: page2,
});
await stagehand.act(actions[0], { page: page2 });
```

## Agent

Use the `agent` method to autonomously execute complex, multi-step tasks.

### Basic Agent Usage

```typescript
const page = stagehand.context.pages()[0];
await page.goto("https://www.google.com");

const agent = stagehand.agent({
  model: "google/gemini-2.0-flash",
  executionModel: "google/gemini-2.0-flash",
});

const result = await agent.execute({
  instruction: "Search for the stock price of NVDA",
  maxSteps: 20,
});

console.log(result.message);
```

### Computer Use Agent (CUA)

For more advanced scenarios using computer-use models:

```typescript
const agent = stagehand.agent({
  mode: "cua", // Enable Computer Use Agent mode
  model: "anthropic/claude-sonnet-4-20250514",
  // or "google/gemini-2.5-computer-use-preview-10-2025"
  systemPrompt: `You are a helpful assistant that can use a web browser.
    Do not ask follow up questions, the user will trust your judgement.`,
});

await agent.execute({
  instruction: "Apply for a library card at the San Francisco Public Library",
  maxSteps: 30,
});
```

### Agent with Custom Model Configuration

```typescript
const agent = stagehand.agent({
  model: {
    modelName: "google/gemini-2.5-computer-use-preview-10-2025",
    apiKey: process.env.GEMINI_API_KEY,
  },
  systemPrompt: `You are a helpful assistant.`,
});
```

### Agent with Integrations (MCP/External Tools)

```typescript
const agent = stagehand.agent({
  integrations: [`https://mcp.exa.ai/mcp?exaApiKey=${process.env.EXA_API_KEY}`],
  systemPrompt: `You have access to the Exa search tool.`,
});
```

### Agent Hybrid Mode

Hybrid mode uses both DOM-based and coordinate-based tools (act, click, type, dragAndDrop) for visual interactions. This requires `experimental: true` and models that support reliable coordinate-based actions.

**Recommended models for hybrid mode:**

- `google/gemini-3-flash-preview`
- `anthropic/claude-sonnet-4-20250514`, `anthropic/claude-sonnet-4-5-20250929`, `anthropic/claude-haiku-4-5-20251001`

```typescript
const stagehand = new Stagehand({
  env: "LOCAL",
  experimental: true, // Required for hybrid mode
});
await stagehand.init();

const agent = stagehand.agent({
  mode: "hybrid",
  model: "google/gemini-3-flash-preview",
});

await agent.execute({
  instruction: "Click the submit button and fill the form",
  maxSteps: 20,
  highlightCursor: true, // Enabled by default in hybrid mode
});
```

**Agent modes:**

- `"dom"` (default): Uses DOM-based tools (act, fillForm) - works with any model
- `"hybrid"`: Uses both DOM-based and coordinate-based tools (act, click, type, dragAndDrop) - requires grounding-capable models
- `"cua"`: Uses Computer Use Agent providers

## Advanced Features

### DeepLocator (XPath Targeting)

Target specific elements across shadow DOM and iframes:

```typescript
await page
  .deepLocator("/html/body/div[2]/div[3]/iframe/html/body/p")
  .highlight({
    durationMs: 5000,
    contentColor: { r: 255, g: 0, b: 0 },
  });
```

### Multi-Page Workflows

```typescript
const page1 = stagehand.context.pages()[0];
await page1.goto("https://example.com");

const page2 = await stagehand.context.newPage();
await page2.goto("https://example2.com");

// Act/extract/observe operate on the current active page by default
// Pass { page } option to target a specific page
await stagehand.act("click button", { page: page1 });
await stagehand.extract("get title", { page: page2 });
```


================================================
FILE: eslint.config.mjs
================================================
import globals from "globals";
import pluginJs from "@eslint/js";
import tseslint from "typescript-eslint";
import security from "eslint-plugin-security";

// ESLint flat config for the whole monorepo. Entries are applied in order,
// so later entries refine earlier ones for the files they match.
/** @type {import('eslint').Linter.Config[]} */
export default [
  // Lint JavaScript and TypeScript sources everywhere in the workspace.
  { files: ["**/*.{js,mjs,cjs,ts}"] },
  // Default to browser globals; Node-only areas are overridden below.
  { languageOptions: { globals: globals.browser } },
  // Build/maintenance scripts of the core package use Node globals.
  {
    files: ["packages/core/scripts/**/*.{js,cjs,mjs}"],
    languageOptions: { globals: globals.node },
  },
  // Same for the scripts of both server packages.
  {
    files: [
      "packages/server-v3/scripts/**/*.{js,cjs,mjs,ts}",
      "packages/server-v4/scripts/**/*.{js,cjs,mjs,ts}",
    ],
    languageOptions: { globals: globals.node },
  },
  // The CLI package is linted with Node globals.
  {
    files: ["packages/cli/**/*.{js,cjs,mjs,ts}"],
    languageOptions: { globals: globals.node },
  },
  // Paths excluded from linting: build output, dependencies, generated DOM
  // bundles, config files (the "**/*.config.mjs" pattern also matches this
  // file), local Browserbase state, JSON, and API spec files.
  {
    ignores: [
      "**/dist/**",
      "**/node_modules/**",
      "packages/core/lib/dom/build/**",
      "packages/core/lib/v3/dom/build/**",
      "packages/core/lib/v4/dom/build/**",
      "packages/core/scripts/prepare.js",
      "**/*.config.js",
      "**/*.config.mjs",
      ".browserbase/**",
      "**/.browserbase/**",
      "**/*.json",
      "stainless.yml",
      "packages/server-v3/openapi.v3.yaml",
      "packages/server-v4/openapi.v4.yaml",
    ],
  },
  // Baseline rule sets from ESLint core and typescript-eslint.
  pluginJs.configs.recommended,
  ...tseslint.configs.recommended,
  // Project-wide hardening: forbid eval-style dynamic code execution in all
  // its spellings, and enable the `preserve-caught-error` rule.
  {
    plugins: {
      security,
    },
    rules: {
      "no-eval": "error",
      "no-implied-eval": "error",
      "no-new-func": "error",
      "security/detect-eval-with-expression": "error",
      "preserve-caught-error": "error",
      // AST selectors that catch `Function(...)`, `new Function(...)`,
      // `window.Function(...)` and `globalThis.Function(...)`.
      "no-restricted-syntax": [
        "error",
        {
          selector: "CallExpression[callee.name='Function']",
          message: "Dynamic function construction is prohibited.",
        },
        {
          selector: "NewExpression[callee.name='Function']",
          message: "Dynamic function construction is prohibited.",
        },
        {
          selector:
            "CallExpression[callee.object.name='window'][callee.property.name='Function']",
          message:
            "Dynamic function construction via window.Function is prohibited.",
        },
        {
          selector:
            "CallExpression[callee.object.name='globalThis'][callee.property.name='Function']",
          message:
            "Dynamic function construction via globalThis.Function is prohibited.",
        },
      ],
    },
  },
  // CLI-only override: empty `catch {}` blocks are allowed there (the CLI
  // uses them for best-effort cleanup), other empty blocks remain errors.
  {
    files: ["packages/cli/**/*.{js,cjs,mjs,ts}"],
    rules: {
      "no-empty": ["error", { allowEmptyCatch: true }],
    },
  },
];


================================================
FILE: package.json
================================================
{
  "name": "stagehand-workspace",
  "version": "0.0.0",
  "private": true,
  "description": "Stagehand monorepo workspace",
  "type": "module",
  "scripts": {
    "build": "turbo run build",
    "build:full": "turbo run build",
    "build:cjs": "turbo run build:cjs",
    "build:cli": "turbo run build:cli",
    "build:esm": "turbo run build:esm",
    "build:sea": "turbo run build:sea:esm",
    "build:sea:esm": "turbo run build:sea:esm",
    "build:sea:cjs": "turbo run build:sea:cjs",
    "lint": "turbo run lint",
    "format": "prettier --write .",
    "prettier": "prettier --write .",
    "eslint": "eslint .",
    "test": "turbo run test:core test:e2e test:server test:evals test:cli",
    "test:core": "turbo run test:core --",
    "test:core:local": "STAGEHAND_BROWSER_TARGET=local pnpm run test:core --",
    "test:core:bb": "STAGEHAND_BROWSER_TARGET=browserbase pnpm run test:core --",
    "test:e2e": "turbo run test:e2e --",
    "test:e2e:local": "STAGEHAND_BROWSER_TARGET=local pnpm run test:e2e --",
    "test:e2e:bb": "STAGEHAND_BROWSER_TARGET=browserbase pnpm run test:e2e --",
    "test:server": "turbo run test:server --",
    "test:server:sea": "STAGEHAND_SERVER_TARGET=sea pnpm run test:server --",
    "test:server:local": "STAGEHAND_SERVER_TARGET=local pnpm run test:server --",
    "test:server:remote": "STAGEHAND_SERVER_TARGET=remote pnpm run test:server --",
    "test:evals": "turbo run test:evals --",
    "test:evals:local": "STAGEHAND_BROWSER_TARGET=local pnpm run test:evals --",
    "test:evals:bb": "STAGEHAND_BROWSER_TARGET=browserbase pnpm run test:evals --",
    "coverage:merge": "pnpm -w exec tsx packages/core/scripts/coverage.ts merge",
    "docs": "turbo run docs",
    "dev": "turbo run dev",
    "example": "pnpm --filter @browserbasehq/stagehand run example --",
    "cache:clear": "turbo run build --force",
    "prepare": "node packages/core/scripts/prepare.js",
    "release": "turbo run build && changeset publish",
    "release-canary": "turbo run build && changeset version --snapshot && changeset publish --tag alpha"
  },
  "devDependencies": {
    "@changesets/changelog-github": "^0.5.0",
    "@changesets/cli": "^2.27.9",
    "@eslint/js": "^10.0.1",
    "c8": "^10.1.3",
    "dotenv": "^17.3.1",
    "esbuild": "0.27.2",
    "eslint": "^10.0.2",
    "eslint-plugin-security": "^3.0.1",
    "globals": "^15.13.0",
    "junit-to-ctrf": "^0.0.14",
    "prettier": "^3.2.5",
    "source-map": "^0.7.4",
    "tsx": "^4.19.4",
    "turbo": "^2.8.10",
    "typescript": "5.8.3",
    "typescript-eslint": "^8.56.1"
  },
  "repository": {
    "type": "git",
    "url": "git+https://github.com/browserbase/stagehand.git"
  },
  "bugs": {
    "url": "https://github.com/browserbase/stagehand/issues"
  },
  "homepage": "https://stagehand.dev",
  "overrides": {
    "whatwg-url": "^14.0.0",
    "jwa": "^2.0.1",
    "zod": "4.2.1",
    "tsx": "4.19.4"
  },
  "engines": {
    "node": "^20.19.0 || >=22.12.0"
  },
  "packageManager": "pnpm@9.15.0+sha512.76e2379760a4328ec4415815bcd6628dee727af3779aaa4c914e3944156c4299921a89f976381ee107d41f12cfa4b66681ca9c718f0668fa0831ed4c6d8ba56c"
}


================================================
FILE: packages/README.md
================================================
# Stagehand Packages

This directory contains the Stagehand monorepo packages:

- **cli** - Browse CLI (`@browserbasehq/browse-cli`) for driving a browser from the command line
- **core** - The main Stagehand package
- **evals** - Evals CLI
- **docs** - [Docs](https://docs.stagehand.dev)
- **server** - Fastify server wrapping the core package for different language clients

================================================
FILE: packages/cli/CHANGELOG.md
================================================
# @browserbasehq/browse-cli

## 0.2.0

### Minor Changes

- [#1816](https://github.com/browserbase/stagehand/pull/1816) [`687d54a`](https://github.com/browserbase/stagehand/commit/687d54addad5625f28d51c6994170c7b629871f2) Thanks [@shrey150](https://github.com/shrey150)! - Add `--context-id` and `--persist` flags to `browse open` for loading and persisting Browserbase Contexts across sessions

- [#1793](https://github.com/browserbase/stagehand/pull/1793) [`e38c13b`](https://github.com/browserbase/stagehand/commit/e38c13b7526b140b693152ef1ffda88a74e9c425) Thanks [@shrey150](https://github.com/shrey150)! - Initial release of browse CLI - browser automation for AI agents

### Patch Changes

- [#1806](https://github.com/browserbase/stagehand/pull/1806) [`f8c7738`](https://github.com/browserbase/stagehand/commit/f8c773898f4d97e8854cc67a0b18eb7d1cdd7b75) Thanks [@shrey150](https://github.com/shrey150)! - Fix `browse env` showing stale mode after `browse env remote`

- Updated dependencies [[`505e8c6`](https://github.com/browserbase/stagehand/commit/505e8c6736f3706328dbc8df670c49a018058388), [`2f43ffa`](https://github.com/browserbase/stagehand/commit/2f43ffac11778152d17e4c44405770cc32c3ec8c), [`63ee247`](https://github.com/browserbase/stagehand/commit/63ee247ac6bf2992046d4f6b2759f46b15643e36), [`7dc35f5`](https://github.com/browserbase/stagehand/commit/7dc35f5e25689e6518d68b25ef71536d2781c8aa), [`335cf47`](https://github.com/browserbase/stagehand/commit/335cf4730e73bce33e92331d04bda4b0fd42685d), [`6ba0a1d`](https://github.com/browserbase/stagehand/commit/6ba0a1db7fc2d5d5a2f8927b1417d8f1d15eda10), [`4ff3bb8`](https://github.com/browserbase/stagehand/commit/4ff3bb831a6ef6e2d57148e7afb68ea8d23e395d), [`c27054b`](https://github.com/browserbase/stagehand/commit/c27054bbd0508431ade91d655f89efc87bbf5867), [`2abf5b9`](https://github.com/browserbase/stagehand/commit/2abf5b90f1e2bb1442509ef3a686b6128c9cdcf6), [`7817fcc`](https://github.com/browserbase/stagehand/commit/7817fcc315eee4455ce04567cf56c9ec801caf0b), [`7390508`](https://github.com/browserbase/stagehand/commit/73905088c5ed5923d276da9cce2efd0a0a3a46eb), [`611f43a`](https://github.com/browserbase/stagehand/commit/611f43ac8d4c580216d55d2b217c14a9a9c11013), [`521a10e`](https://github.com/browserbase/stagehand/commit/521a10e3698fc5631e219947bc90dad0f8bddaa8), [`2402a3c`](https://github.com/browserbase/stagehand/commit/2402a3c4d50270391b3e6440f4385cdcf5e1eb64)]:
  - @browserbasehq/stagehand@3.2.0


================================================
FILE: packages/cli/README.md
================================================
# Browse CLI

Browser automation CLI for AI agents. Built on [Stagehand](https://github.com/browserbase/stagehand), providing raw browser control without requiring LLM integration.

## Installation

```bash
npm install -g @browserbasehq/browse-cli
```

Requires Chrome/Chromium installed on the system.

## Quick Start

```bash
# Navigate to a URL (auto-starts browser daemon)
browse open https://example.com

# Take a snapshot to get element refs
browse snapshot -c

# Click an element by ref
browse click @0-5

# Type text
browse type "Hello, world!"

# Take a screenshot
browse screenshot ./page.png

# Stop the browser
browse stop
```

## How It Works

Browse uses a daemon architecture for fast, stateful interactions:

1. **First command** auto-starts a Chrome browser daemon
2. **Subsequent commands** reuse the same browser session
3. **State persists** between commands (cookies, refs, etc.)
4. **Multiple sessions** supported via `--session` or `BROWSE_SESSION` env var

### Self-Healing Sessions

The CLI automatically recovers from stale sessions. If the daemon or Chrome crashes, the CLI:

1. Detects the failure
2. Cleans up stale processes and files
3. Restarts the daemon
4. Retries the command

Agents don't need to handle recovery - commands "just work".

## Commands

### Navigation

```bash
browse open <url> [--wait load|domcontentloaded|networkidle] [-t|--timeout ms]
browse reload
browse back
browse forward
```

The `--timeout` flag (default: 30000ms) controls how long to wait for the page load state. Use longer timeouts for slow-loading pages:

```bash
browse open https://slow-site.com --timeout 60000
```

### Click Actions

```bash
browse click <ref> [-b left|right|middle] [-c count]  # Click by ref (e.g., @0-5)
browse click_xy <x> <y> [--button] [--xpath]          # Click at coordinates
```

### Coordinate Actions

```bash
browse hover <x> <y> [--xpath]
browse scroll <x> <y> <deltaX> <deltaY> [--xpath]
browse drag <fromX> <fromY> <toX> <toY> [--steps n] [--xpath]
```

### Keyboard

```bash
browse type <text> [-d delay] [--mistakes]
browse press <key>  # e.g., Enter, Tab, Cmd+A
```

### Forms

```bash
browse fill <selector> <value> [--no-press-enter]
browse select <selector> <values...>
browse highlight <selector> [-d duration]
```

### Page Info

```bash
browse get url
browse get title
browse get text <selector>
browse get html <selector>
browse get value <selector>
browse get box <selector>  # Returns center coordinates

browse snapshot [-c|--compact]  # Accessibility tree with refs
browse screenshot [path] [-f|--full-page] [-t png|jpeg]
```

### Waiting

```bash
browse wait load [state]
browse wait selector <selector> [-t timeout] [-s visible|hidden|attached|detached]
browse wait timeout <ms>
```

### Multi-Tab

```bash
browse pages          # List all tabs
browse newpage [url]  # Open new tab
browse tab_switch <n> # Switch to tab by index
browse tab_close [n]  # Close tab (default: last)
```

### Network Capture

Capture HTTP requests to the filesystem for inspection:

```bash
browse network on     # Start capturing requests
browse network off    # Stop capturing
browse network path   # Get capture directory path
browse network clear  # Clear captured requests
```

Captured requests are saved as directories:

```
/tmp/browse-default-network/
  001-GET-api.github.com-repos/
    request.json      # method, url, headers, body
    response.json     # status, headers, body, duration
```

### Daemon Control

```bash
browse start          # Explicitly start daemon
browse stop [--force] # Stop daemon
browse status         # Check daemon status
browse env [target]   # Show or switch environment: local | remote
```

### Environment Switching (Local vs Remote)

Use environment switching when an agent should keep the same command flow, but the
browser runtime needs to change:

- `local` runs Chrome on your machine (best for local debugging/dev loops)
- `remote` runs a Browserbase session (best for anti-bot hardening and cloud runs)

```bash
# Show active environment (if running) and desired environment for next start
browse env

# Switch current session to Browserbase (restarts daemon if needed)
browse env remote

# Switch back to local Chrome
browse env local
```

Behavior details:

- Environment is scoped per `--session`
- `browse env <target>` persists an override and restarts the daemon
- `browse stop` clears the override so next start falls back to env-var-based auto detection
- Auto detection defaults to:
  - `remote` when `BROWSERBASE_API_KEY` is set
  - `local` otherwise

## Global Options

| Option | Description |
|--------|-------------|
| `--session <name>` | Session name for multiple browsers (default: "default") |
| `--headless` | Run Chrome in headless mode |
| `--headed` | Run Chrome with visible window (default) |
| `--ws <url>` | Connect to existing Chrome via CDP WebSocket |
| `--json` | Output as JSON |

## Environment Variables

| Variable | Description |
|----------|-------------|
| `BROWSE_SESSION` | Default session name (alternative to `--session`) |
| `BROWSERBASE_API_KEY` | Browserbase API key (required for `browse env remote`) |
| `BROWSERBASE_PROJECT_ID` | Browserbase project ID (optional, passed through if set) |

## Element References

After running `browse snapshot`, you can reference elements by their ref ID:

```bash
# Get snapshot with refs
browse snapshot -c

# Output includes refs like [0-5], [1-2], etc.
# RootWebArea "Example" url="https://example.com"
#   [0-0] link "Home"
#   [0-1] link "About"
#   [0-2] button "Sign In"

# Click using ref (multiple formats supported)
browse click @0-2       # @ prefix
browse click 0-2        # Plain ref
browse click ref=0-2    # Explicit prefix
```

The full snapshot output includes mappings:
- **xpathMap**: Cross-frame XPath selectors
- **cssMap**: Fast CSS selectors when available
- **urlMap**: Extracted URLs from links

## Multiple Sessions

Run multiple browser instances simultaneously:

```bash
# Terminal 1
BROWSE_SESSION=session1 browse open https://google.com

# Terminal 2
BROWSE_SESSION=session2 browse open https://github.com

# Or use --session flag
browse --session work open https://slack.com
browse --session personal open https://twitter.com
```

## Direct CDP Connection

Connect to an existing Chrome instance:

```bash
# Start Chrome with remote debugging
google-chrome --remote-debugging-port=9222

# Connect via WebSocket
browse --ws ws://localhost:9222/devtools/browser/... open https://example.com
```

## Optimal AI Workflow

1. **Navigate** to target page (browser auto-starts)
2. **Snapshot** to get the accessibility tree with refs
3. **Click/Fill** using refs directly (e.g., `@0-5`)
4. **Re-snapshot** after actions to verify state changes
5. **Stop** when done

```bash
browse open https://example.com
browse snapshot -c
# [0-5] textbox: Search
# [0-8] button: Submit
browse fill @0-5 "my query"
browse click @0-8
browse snapshot -c  # Verify result
browse stop
```

## Troubleshooting

### Chrome not found

The CLI uses your system Chrome/Chromium. If not found:

```bash
# macOS - Install Chrome or set path
export CHROME_PATH=/Applications/Google\ Chrome.app/Contents/MacOS/Google\ Chrome

# Linux - Install chromium
sudo apt install chromium-browser
```

### Stale daemon

If the daemon becomes unresponsive:

```bash
browse stop --force
```

### Permission denied on socket

```bash
# Clean up stale socket files (they live in the OS temp directory: $TMPDIR if set, otherwise /tmp)
rm "${TMPDIR:-/tmp}"/browse-*.sock "${TMPDIR:-/tmp}"/browse-*.pid
```

## Platform Support

- macOS (Intel and Apple Silicon)
- Linux (x64 and arm64)

Windows is not supported natively: run the CLI under WSL. Native Windows support would require a TCP socket implementation.

## Development

```bash
# Clone and setup (in monorepo)
cd packages/cli
pnpm install         # Install dependencies first!
pnpm run build       # Build the CLI

# Run without building (for development)
pnpm run dev -- <command>

# Or with tsx directly
npx tsx src/index.ts <command>

# Run linting and formatting
pnpm run lint
pnpm run format
```

## License

MIT - see [LICENSE](./LICENSE)

## Related

- [Stagehand](https://github.com/browserbase/stagehand) - AI web browser automation framework
- [Browserbase](https://browserbase.com) - Cloud browser infrastructure


================================================
FILE: packages/cli/package.json
================================================
{
  "name": "@browserbasehq/browse-cli",
  "version": "0.2.0",
  "description": "Browser automation CLI for AI agents, built on Stagehand",
  "type": "commonjs",
  "license": "MIT",
  "author": "Browserbase <support@browserbase.com>",
  "repository": {
    "type": "git",
    "url": "git+https://github.com/browserbase/stagehand.git",
    "directory": "packages/cli"
  },
  "bugs": {
    "url": "https://github.com/browserbase/stagehand/issues"
  },
  "homepage": "https://github.com/browserbase/stagehand/tree/main/packages/cli#readme",
  "keywords": [
    "browser",
    "automation",
    "cli",
    "ai",
    "agent",
    "chrome",
    "cdp",
    "web-scraping",
    "testing",
    "stagehand"
  ],
  "engines": {
    "node": "^20.19.0 || >=22.12.0"
  },
  "publishConfig": {
    "access": "public"
  },
  "main": "./dist/index.js",
  "bin": {
    "browse": "./dist/index.js"
  },
  "files": [
    "dist",
    "README.md",
    "LICENSE"
  ],
  "scripts": {
    "build": "tsup",
    "dev": "tsx src/index.ts",
    "browse": "tsx src/index.ts",
    "typecheck": "tsc --noEmit",
    "eslint": "eslint .",
    "lint": "cd ../.. && prettier --check packages/cli && cd packages/cli && pnpm run eslint && pnpm run typecheck",
    "test": "vitest run",
    "test:cli": "vitest run",
    "test:watch": "vitest",
    "prepublishOnly": "pnpm run build"
  },
  "dependencies": {
    "@browserbasehq/stagehand": "workspace:*",
    "commander": "^12.0.0",
    "dotenv": "^16.4.5",
    "pino": "^9.6.0",
    "pino-pretty": "^13.0.0",
    "ws": "^8.18.0"
  },
  "devDependencies": {
    "@types/node": "^20.11.30",
    "devtools-protocol": "^0.0.1464554",
    "eslint": "^10.0.2",
    "tsup": "^8.2.1",
    "tsx": "^4.10.5",
    "typescript": "5.8.3",
    "vitest": "^4.0.8"
  }
}


================================================
FILE: packages/cli/src/index.ts
================================================
/**
 * Browse CLI - Browser automation for AI agents
 *
 * Usage:
 *   browse [options] <command> [args...]
 *
 * The CLI runs a daemon process that maintains browser state between commands.
 * Multiple sessions can run simultaneously using --session <name> or BROWSE_SESSION env var.
 */

import { Command } from "commander";
import { Stagehand, type Page as BrowsePage } from "@browserbasehq/stagehand";
import { promises as fs } from "fs";
import * as path from "path";
import * as os from "os";
import * as net from "net";
import { spawn } from "child_process";
import * as readline from "readline";
import type { Protocol } from "devtools-protocol";
import { version as VERSION } from "../package.json";

// Commander command object for the `browse` CLI.
// NOTE(review): sub-commands and options are presumably registered on it
// further down in this file — not visible from here.
const program = new Command();

// Type aliases
// Type of the `context` property of a Stagehand instance.
type BrowseContext = Stagehand["context"];

// ==================== DAEMON INFRASTRUCTURE ====================

// Directory (the OS temp dir) in which every per-session file produced by the
// path helpers below (socket, lock, pid, ...) is placed.
const SOCKET_DIR = os.tmpdir();

/**
 * Build the path of the socket file belonging to a session.
 *
 * @param session - Session name embedded in the file name.
 * @returns Path of `browse-<session>.sock` inside `SOCKET_DIR`.
 */
function getSocketPath(session: string): string {
  const fileName = `browse-${session}.sock`;
  return path.join(SOCKET_DIR, fileName);
}

/**
 * Build the path of the lock file used by `acquireLock` / `releaseLock`.
 *
 * @param session - Session name embedded in the file name.
 * @returns Path of `browse-<session>.lock` inside `SOCKET_DIR`.
 */
function getLockPath(session: string): string {
  const fileName = `browse-${session}.lock`;
  return path.join(SOCKET_DIR, fileName);
}

/**
 * Acquire an exclusive, per-session lock for daemon operations.
 *
 * The lock is a file created with the "wx" flag (O_EXCL), so creation is
 * atomic and fails with EEXIST while another process holds it. The holder
 * writes its PID into the file so that waiters can detect a crashed holder
 * and reclaim the lock.
 *
 * A lock is considered stale, and is removed, when:
 *  - its PID refers to a process that no longer exists, or
 *  - it contains no valid PID and has existed longer than a short grace
 *    period (the holder died between creating the file and writing its PID).
 *
 * NOTE: reclaiming a stale lock is best-effort; two waiters that detect the
 * same stale lock at the same instant can still race on the unlink.
 *
 * @param session - Session name; selects the lock file via `getLockPath`.
 * @param timeoutMs - Maximum time to keep retrying, in milliseconds.
 * @returns `true` once this process holds the lock, `false` if the timeout
 *   elapsed first.
 * @throws Any error from creating or writing the lock file other than EEXIST.
 */
async function acquireLock(
  session: string,
  timeoutMs: number = 10000,
): Promise<boolean> {
  const lockPath = getLockPath(session);
  const startTime = Date.now();
  const retryDelayMs = 100;
  // How long a lock file may exist without a readable PID before it is
  // treated as abandoned.
  const unwrittenLockGraceMs = 2000;

  const errorCode = (err: unknown): string | undefined =>
    (err as NodeJS.ErrnoException | null)?.code;

  const pause = (): Promise<void> =>
    new Promise((resolve) => setTimeout(resolve, retryDelayMs));

  const isProcessAlive = (pid: number): boolean => {
    try {
      process.kill(pid, 0); // Signal 0 only tests for existence
      return true;
    } catch (err: unknown) {
      // EPERM: the process exists but belongs to someone else - still alive.
      return errorCode(err) === "EPERM";
    }
  };

  while (Date.now() - startTime < timeoutMs) {
    try {
      // O_EXCL ensures atomic creation - fails if file exists
      const handle = await fs.open(lockPath, "wx");
      try {
        await handle.write(String(process.pid));
      } finally {
        // Never leak the descriptor, even when the write fails.
        await handle.close();
      }
      return true;
    } catch (err: unknown) {
      if (errorCode(err) !== "EEXIST") throw err;
    }

    // Lock exists - work out whether its holder is still alive.
    let holderAlive = true;
    try {
      const contents = await fs.readFile(lockPath, "utf-8");
      const holderPid = Number.parseInt(contents, 10);
      if (Number.isInteger(holderPid) && holderPid > 0) {
        holderAlive = isProcessAlive(holderPid);
      } else {
        // The holder may have created the file but not written its PID yet.
        // Only treat the lock as abandoned once it is clearly old.
        const { mtimeMs } = await fs.stat(lockPath);
        holderAlive = Date.now() - mtimeMs < unwrittenLockGraceMs;
      }
    } catch (err: unknown) {
      // The lock was released between our open() and read: retry right away.
      if (errorCode(err) === "ENOENT") continue;
      // Unreadable for another reason: stay conservative and assume held.
    }

    if (holderAlive) {
      await pause();
      continue;
    }

    // Lock holder is dead, remove stale lock
    try {
      await fs.unlink(lockPath);
    } catch (err: unknown) {
      // Someone else already removed it: retry immediately. Any other
      // failure: back off instead of spinning on a lock we cannot delete.
      if (errorCode(err) !== "ENOENT") await pause();
    }
  }
  return false;
}

/**
 * Release the daemon lock for `session` by deleting its lock file.
 * Best effort: a missing file or any other unlink failure is ignored.
 */
async function releaseLock(session: string): Promise<void> {
  const lockPath = getLockPath(session);
  await fs.unlink(lockPath).catch(() => undefined);
}

/**
 * Probe whether something is accepting connections on `socketPath`.
 * A socket file that merely exists on disk does not count.
 *
 * @param socketPath Path of the socket to probe.
 * @param timeoutMs  How long to wait for the connection before giving up.
 * @returns `true` if a connection was established, `false` on error or timeout.
 */
async function isSocketConnectable(
  socketPath: string,
  timeoutMs: number,
): Promise<boolean> {
  return new Promise<boolean>((resolve) => {
    const probe = net.createConnection(socketPath);

    // Give up (and tear the probe down) if nothing answers in time.
    const timer = setTimeout(() => {
      probe.destroy();
      resolve(false);
    }, timeoutMs);

    probe.on("error", () => {
      clearTimeout(timer);
      resolve(false);
    });

    probe.on("connect", () => {
      clearTimeout(timer);
      probe.destroy();
      resolve(true);
    });
  });
}

/**
 * Poll `socketPath` until it accepts a connection.
 *
 * The pause between probes starts at 50ms and grows by 1.5x after every
 * failed probe, capped at 500ms. Each probe itself waits at most 500ms.
 *
 * @throws Error if the socket is still not connectable after `timeoutMs`.
 */
async function waitForSocketReady(
  socketPath: string,
  timeoutMs: number,
): Promise<void> {
  const deadline = Date.now() + timeoutMs;

  for (
    let pause = 50;
    Date.now() < deadline;
    pause = Math.min(pause * 1.5, 500)
  ) {
    const ready = await isSocketConnectable(socketPath, 500);
    if (ready) {
      return;
    }
    await new Promise((wake) => setTimeout(wake, pause));
  }

  throw new Error(`Socket not ready after ${timeoutMs}ms`);
}

/** Path of the file in which the daemon for `session` records its PID. */
function getPidPath(session: string): string {
  return path.join(SOCKET_DIR, "browse-" + session + ".pid");
}

/** Path of the file in which the daemon stores the browser's connect URL. */
function getWsPath(session: string): string {
  return path.join(SOCKET_DIR, "browse-" + session + ".ws");
}

/**
 * Path of the `.chrome.pid` state file for `session`.
 * NOTE(review): presumably holds the Chrome process PID; confirm against its writer.
 */
function getChromePidPath(session: string): string {
  return path.join(SOCKET_DIR, "browse-" + session + ".chrome.pid");
}

/** Directory that receives captured network requests for `session`. */
function getNetworkDir(session: string): string {
  const dirName = `browse-${session}-network`;
  return path.join(SOCKET_DIR, dirName);
}

/** Path of the file recording the mode the daemon for `session` runs in. */
function getModePath(session: string): string {
  const fileName = `browse-${session}.mode`;
  return path.join(SOCKET_DIR, fileName);
}

/** Path of the file holding an explicit mode override for `session`. */
function getModeOverridePath(session: string): string {
  const fileName = `browse-${session}.mode-override`;
  return path.join(SOCKET_DIR, fileName);
}

/** Path of the context configuration file for `session`. */
function getContextPath(session: string): string {
  const fileName = `browse-${session}.context`;
  return path.join(SOCKET_DIR, fileName);
}

/** Where the browser runs: a remote Browserbase session or a local browser. */
type BrowseMode = "browserbase" | "local";

/** True when the BROWSERBASE_API_KEY environment variable is set and non-empty. */
function hasBrowserbaseCredentials(): boolean {
  const apiKey = process.env.BROWSERBASE_API_KEY;
  return typeof apiKey === "string" && apiKey.length > 0;
}

/**
 * Ensure `mode` can actually be used in the current environment.
 *
 * @throws Error when "browserbase" mode is requested without Browserbase credentials.
 */
function assertModeSupported(mode: BrowseMode): void {
  if (mode !== "browserbase") {
    return;
  }
  if (hasBrowserbaseCredentials()) {
    return;
  }
  throw new Error(
    "Remote mode requires BROWSERBASE_API_KEY. Set the env var or run `browse env local`.",
  );
}

/** Translate the internal mode name into its "local"/"remote" counterpart. */
function toModeTarget(mode: BrowseMode): "local" | "remote" {
  if (mode === "browserbase") {
    return "remote";
  }
  return "local";
}

/**
 * Read the mode recorded in the session's mode file.
 *
 * @returns The recorded mode, or `null` if the file cannot be read or holds
 *          anything other than a known mode.
 */
async function readCurrentMode(session: string): Promise<BrowseMode | null> {
  let recorded: string;
  try {
    const contents = await fs.readFile(getModePath(session), "utf-8");
    recorded = contents.trim();
  } catch {
    // File may not exist yet.
    return null;
  }
  return recorded === "browserbase" || recorded === "local" ? recorded : null;
}

/**
 * Decide which mode the session should run in.
 * A valid explicit override file wins; otherwise the mode follows from whether
 * Browserbase credentials are present in the environment.
 */
async function getDesiredMode(session: string): Promise<BrowseMode> {
  let override: string | null = null;
  try {
    const contents = await fs.readFile(getModeOverridePath(session), "utf-8");
    override = contents.trim();
  } catch {
    // No readable override file - fall through to env detection.
  }

  if (override === "browserbase" || override === "local") {
    return override;
  }
  if (hasBrowserbaseCredentials()) {
    return "browserbase";
  }
  return "local";
}

/**
 * Report whether a usable daemon exists for `session`.
 *
 * All of the following must hold: the PID file is readable, signal 0 can be
 * sent to that PID, the socket file exists, and the socket accepts a
 * connection within 500ms. Any failure along the way yields `false`.
 */
async function isDaemonRunning(session: string): Promise<boolean> {
  try {
    const recordedPid = await fs.readFile(getPidPath(session), "utf-8");
    // Signal 0 delivers nothing; it throws if the process cannot be signalled.
    process.kill(parseInt(recordedPid), 0);

    const socketPath = getSocketPath(session);
    await fs.access(socketPath);

    // The file existing is not enough - something must be listening on it.
    const connectable = await isSocketConnectable(socketPath, 500);
    return connectable;
  } catch {
    return false;
  }
}

/**
 * Paths of the daemon-owned state files for a session: socket, pid, ws,
 * chrome pid, lock and mode. These are removed both on startup (stale
 * leftovers) and on shutdown.
 */
const DAEMON_STATE_FILES = (session: string): string[] => {
  const pathBuilders = [
    getSocketPath,
    getPidPath,
    getWsPath,
    getChromePidPath,
    getLockPath,
    getModePath,
  ];
  return pathBuilders.map((buildPath) => buildPath(session));
};

/**
 * Remove every file belonging to `session`: the daemon state files plus the
 * client-written context config. Files are deleted one at a time and
 * individual failures (such as a file that does not exist) are ignored.
 */
async function cleanupStaleFiles(session: string): Promise<void> {
  // Context is client-written config, only cleaned on full shutdown
  const targets = DAEMON_STATE_FILES(session).concat(getContextPath(session));

  for (const target of targets) {
    await fs.unlink(target).catch(() => undefined);
  }
}

/**
 * Remove only the daemon-owned state files for `session`, leaving the
 * client-written context config in place. Individual delete failures are
 * ignored.
 */
async function cleanupDaemonStateFiles(session: string): Promise<void> {
  const targets = DAEMON_STATE_FILES(session);
  for (const target of targets) {
    await fs.unlink(target).catch(() => undefined);
  }
}

/**
 * Find processes whose command line contains `browse-<session>` and send
 * them SIGTERM. Only implemented on macOS and Linux; other platforms return
 * `false` without doing anything.
 *
 * `pgrep` is executed directly rather than through a shell, so the session
 * name is never interpreted by a shell and no intermediate shell process
 * (whose own command line would contain the pattern) can be matched.
 *
 * @param session Session name; matched literally.
 * @returns `true` if at least one process was successfully signalled.
 *          Never throws: any failure results in `false`.
 */
async function killChromeProcesses(session: string): Promise<boolean> {
  if (process.platform !== "darwin" && process.platform !== "linux") {
    return false;
  }

  try {
    const { execFile } = await import("child_process");
    const { promisify } = await import("util");
    const execFileAsync = promisify(execFile);

    // pgrep -f treats its argument as an extended regular expression; escape
    // metacharacters so the session name only matches itself.
    const escapedSession = session.replace(/[.*+?^${}()|[\]\\]/g, "\\$&");
    const pattern = `browse-${escapedSession}`;

    let stdout: string;
    try {
      ({ stdout } = await execFileAsync("pgrep", ["-f", pattern]));
    } catch {
      // pgrep exits non-zero when nothing matches (or it is not installed).
      return false;
    }

    let signalled = 0;
    for (const line of stdout.split("\n")) {
      const pid = Number.parseInt(line.trim(), 10);
      // Skip blank/garbled lines and never signal ourselves.
      if (!Number.isInteger(pid) || pid <= 0 || pid === process.pid) {
        continue;
      }
      try {
        process.kill(pid, "SIGTERM");
        signalled++;
      } catch {
        // Process already gone or not ours to signal.
      }
    }
    return signalled > 0;
  } catch {
    return false;
  }
}

/** One request sent from the client to the daemon, serialized as a single JSON line. */
interface DaemonRequest {
  /** Name of the command to execute (for example "open" or "click"). */
  command: string;
  /** Positional arguments for the command; their shape depends on `command`. */
  args: unknown[];
}

/** The daemon's reply to a DaemonRequest, serialized as a single JSON line. */
interface DaemonResponse {
  /** Whether the command completed without throwing. */
  success: boolean;
  /** Value returned by the command; set when `success` is true. */
  result?: unknown;
  /** Error message; set when `success` is false. */
  error?: string;
}

// ==================== DAEMON SERVER ====================

// Default viewport matching Stagehand core.
// Passed as the viewport when the daemon launches a local browser.
const DEFAULT_VIEWPORT = { width: 1288, height: 711 };

/**
 * Run the daemon for `session` in the current process.
 *
 * Startup removes stale daemon state files, records this process's PID and
 * the desired mode, starts a socket server and prints a JSON "started" line
 * on stdout. The browser itself is created lazily when the first command
 * arrives, so startup does not wait for it.
 *
 * Each connection carries newline-delimited JSON: every request line is
 * executed via `executeCommand` and answered with one JSON response line.
 *
 * The returned promise resolves once the server has been set up; the process
 * then stays alive until a termination signal or an uncaught error triggers
 * shutdown, which closes the browser, removes the session files and exits.
 *
 * @param session  Session name; selects all per-session files.
 * @param headless Whether a locally launched browser runs headless. Not used
 *                 in browserbase mode.
 */
async function runDaemon(session: string, headless: boolean): Promise<void> {
  // Only clean daemon state files (socket, pid, etc.), not client-written config (context)
  await cleanupDaemonStateFiles(session);

  // Write daemon PID file and initial mode so status is immediately available
  await fs.writeFile(getPidPath(session), String(process.pid));
  await fs.writeFile(getModePath(session), await getDesiredMode(session));

  // Browser state (initialized lazily on first command)
  let stagehand: Stagehand | null = null;
  let context: BrowseContext | null = null;
  // In-flight initialization, shared by every command that arrives meanwhile.
  let initPromise: Promise<{
    stagehand: Stagehand;
    context: BrowseContext;
  }> | null = null;

  /** Create and initialize the browser for this session. */
  async function initializeBrowser(): Promise<{
    stagehand: Stagehand;
    context: BrowseContext;
  }> {
    const desiredMode = await getDesiredMode(session);
    assertModeSupported(desiredMode);
    const useBrowserbase = desiredMode === "browserbase";

    // Read context config if present (written by `browse open --context-id`)
    let contextConfig: { id: string; persist?: boolean } | null = null;
    try {
      const raw = await fs.readFile(getContextPath(session), "utf-8");
      contextConfig = JSON.parse(raw);
    } catch {}

    const instance = new Stagehand({
      env: useBrowserbase ? "BROWSERBASE" : "LOCAL",
      verbose: 0,
      disablePino: true,
      ...(useBrowserbase
        ? {
            disableAPI: true,
            ...(contextConfig
              ? {
                  browserbaseSessionCreateParams: {
                    browserSettings: {
                      context: contextConfig,
                    },
                  },
                }
              : {}),
          }
        : {
            localBrowserLaunchOptions: {
              headless,
              viewport: DEFAULT_VIEWPORT,
            },
          }),
    });

    // Publish before init() so a shutdown during startup can still close it.
    stagehand = instance;

    try {
      // Persist mode so status command can report it
      await fs.writeFile(getModePath(session), desiredMode);

      await instance.init();
    } catch (err) {
      // Do not keep a half-initialized instance around: the next command
      // creates a fresh one, so release this one (best effort) first.
      if (stagehand === instance) {
        stagehand = null;
      }
      try {
        await instance.close();
      } catch {}
      throw err;
    }

    context = instance.context;

    // Try to save Chrome info for reference (best effort)
    try {
      const wsUrl = instance.connectURL();
      await fs.writeFile(getWsPath(session), wsUrl);
    } catch {}

    // Store session name for network capture
    networkSession = session;

    return { stagehand: instance, context: instance.context };
  }

  /**
   * Lazy browser initialization - called on first command (like agent-browser)
   * This allows daemon to signal "started" immediately without waiting for browser.
   * Concurrent callers share one initialization attempt and all receive its
   * outcome; after a failure the next call starts a new attempt.
   */
  async function ensureBrowserInitialized(): Promise<{
    stagehand: Stagehand;
    context: BrowseContext;
  }> {
    if (stagehand && context) {
      return { stagehand, context };
    }

    if (!initPromise) {
      initPromise = initializeBrowser().finally(() => {
        initPromise = null;
      });
    }
    return initPromise;
  }

  // Create Unix socket server
  const socketPath = getSocketPath(session);
  const server = net.createServer((conn) => {
    const rl = readline.createInterface({ input: conn });

    // A client that goes away abruptly surfaces as an "error" event. Without a
    // listener it would be thrown as an uncaught exception, and the handler
    // below would shut the whole daemon down.
    conn.on("error", () => {});
    rl.on("error", () => {});

    rl.on("line", async (line) => {
      let response: DaemonResponse;
      try {
        const request: DaemonRequest = JSON.parse(line);

        // Lazy browser initialization on first command (like agent-browser)
        const { stagehand: sh, context: ctx } =
          await ensureBrowserInitialized();

        const result = await executeCommand(
          ctx,
          request.command,
          request.args,
          sh,
        );
        response = { success: true, result };
      } catch (e) {
        response = {
          success: false,
          error: e instanceof Error ? e.message : String(e),
        };
      }
      // The client may have disconnected while the command was running.
      if (!conn.destroyed) {
        conn.write(JSON.stringify(response) + "\n");
      }
    });

    rl.on("close", () => {
      conn.destroy();
    });
  });

  server.listen(socketPath);

  // Signal daemon started immediately (before browser initialization)
  console.log(JSON.stringify({ daemon: "started", session, pid: process.pid }));

  // Graceful shutdown handler
  let shuttingDown = false;
  const shutdown = async () => {
    if (shuttingDown) return;
    shuttingDown = true;

    server.close();

    try {
      if (stagehand) {
        await stagehand.close();
      }
    } catch {}

    await cleanupStaleFiles(session);
    process.exit(0);
  };

  // Handle all termination signals
  process.on("SIGTERM", () => shutdown());
  process.on("SIGINT", () => shutdown());
  process.on("SIGHUP", () => shutdown());
  process.on("uncaughtException", (err) => {
    console.error("Uncaught exception:", err);
    shutdown();
  });
  process.on("unhandledRejection", (reason) => {
    console.error("Unhandled rejection:", reason);
    shutdown();
  });

  // Keep daemon running (signal already sent above)
}

// ==================== REF MAP (cached from last snapshot) ====================

/**
 * Cached ref maps from the last snapshot - allows @ref syntax in commands.
 * Replaced wholesale by the "snapshot" command; `xpathMap` is what
 * `resolveSelector` consults to turn a ref into an XPath.
 */
let refMap: {
  /** Ref id -> XPath of the element. */
  xpathMap: Record<string, string>;
  /** Ref id -> URL, as reported by the snapshot. */
  urlMap: Record<string, string>;
} = {
  xpathMap: {},
  urlMap: {},
};

// ==================== NETWORK CAPTURE STATE ====================

/** A captured network request, as recorded when the browser is about to send it. */
interface PendingRequest {
  /** CDP request id. */
  id: string;
  /** ISO-8601 time at which the daemon observed the request. */
  timestamp: string;
  /** HTTP method. */
  method: string;
  /** Request URL. */
  url: string;
  /** Request headers. */
  headers: Record<string, string>;
  /** Request post data, or null when there is none. */
  body: string | null;
  /** CDP resource type, "Other" when not reported. */
  resourceType: string;
}

// Whether network capture is currently switched on.
let networkEnabled = false;
// Directory receiving captured requests; null until capture is first enabled.
let networkDir: string | null = null;
// Sequence number used to prefix the next request's directory name.
let networkCounter = 0;
// Session name used to derive the capture directory; set once the browser is initialized.
let networkSession: string | null = null;
// Requests seen but not yet finished or failed, keyed by CDP request id.
const pendingRequests = new Map<string, PendingRequest>();

/**
 * Sanitize a string for use in a filename.
 *
 * Every character other than ASCII letters, digits, "." and "-" becomes "-",
 * runs of "-" collapse to one, and the result is truncated to `maxLen`
 * characters. The result never starts or ends with "-", including after
 * truncation.
 *
 * @param str    Text to sanitize.
 * @param maxLen Maximum length of the result.
 * @returns The sanitized text; may be empty.
 */
function sanitizeForFilename(str: string, maxLen: number = 30): string {
  return (
    str
      .replace(/[^a-zA-Z0-9.-]/g, "-")
      .replace(/-+/g, "-")
      .replace(/^-|-$/g, "")
      .slice(0, maxLen)
      // Truncation can cut right after a separator; drop that dangling dash.
      .replace(/-$/, "")
  );
}

/**
 * Build the directory name for a captured request:
 * `<counter padded to 3 digits>-<method>-<host>-<first path segment>`.
 * "root" stands in for an empty path, and a URL that cannot be parsed
 * yields `<counter>-<method>-unknown`.
 */
function getRequestDirName(
  counter: number,
  method: string,
  url: string,
): string {
  const prefix = `${String(counter).padStart(3, "0")}-${method}`;

  try {
    const { hostname, pathname } = new URL(url);
    const firstSegment =
      pathname.split("/").find((segment) => segment.length > 0) ?? "root";
    const hostSlug = sanitizeForFilename(hostname, 30);
    const pathSlug = sanitizeForFilename(firstSegment, 20);
    return `${prefix}-${hostSlug}-${pathSlug}`;
  } catch {
    return `${prefix}-unknown`;
  }
}

/**
 * Persist a captured request as `request.json` inside a new directory under
 * the network capture directory.
 *
 * The request counter advances on every call that gets past the capture
 * directory check, whether or not the write succeeds.
 *
 * @returns The directory created for the request, or `null` when no capture
 *          directory is set or writing failed (the failure is logged).
 */
async function writeRequestToFs(
  request: PendingRequest,
): Promise<string | null> {
  if (!networkDir) return null;

  const sequence = networkCounter++;
  const requestDir = path.join(
    networkDir,
    getRequestDirName(sequence, request.method, request.url),
  );

  try {
    await fs.mkdir(requestDir, { recursive: true });

    const { id, timestamp, method, url, headers, body, resourceType } = request;
    const serialized = JSON.stringify(
      { id, timestamp, method, url, headers, body, resourceType },
      null,
      2,
    );
    await fs.writeFile(path.join(requestDir, "request.json"), serialized);

    return requestDir;
  } catch (err) {
    console.error("Failed to write request:", err);
    return null;
  }
}

/**
 * Persist response data as pretty-printed `response.json` inside `requestDir`.
 * Failures are logged and otherwise ignored; this function does not throw.
 */
async function writeResponseToFs(
  requestDir: string,
  response: {
    id: string;
    status: number;
    statusText: string;
    headers: Record<string, string>;
    mimeType: string;
    body: string | null;
    duration: number;
    error?: string;
  },
): Promise<void> {
  try {
    const target = path.join(requestDir, "response.json");
    const serialized = JSON.stringify(response, null, 2);
    await fs.writeFile(target, serialized);
  } catch (err) {
    console.error("Failed to write response:", err);
  }
}

/**
 * Extract a snapshot ref from a selector argument.
 *
 * Recognized forms: `@0-3`, `@[0-3]`, `[0-3]`, `0-3` and `ref=0-3`.
 * Anything after `@` or `ref=` is taken as-is; the bare and bracketed forms
 * must be exactly digits-dash-digits.
 *
 * @returns The ref, or `null` when the selector is not a ref.
 */
function parseRef(selector: string): string | null {
  if (selector[0] === "@") {
    const body = selector.substring(1);
    const bracketed = body.startsWith("[") && body.endsWith("]");
    return bracketed ? body.substring(1, body.length - 1) : body;
  }

  if (selector.startsWith("ref=")) {
    return selector.substring(4);
  }

  // Bare "0-3" or bracketed "[0-3]".
  const bracketMatch = /^\[(\d+-\d+)]$/.exec(selector);
  if (bracketMatch) {
    return bracketMatch[1];
  }
  return /^\d+-\d+$/.test(selector) ? selector : null;
}

/**
 * Turn a selector argument into something a locator can use.
 *
 * If the argument is a ref, it is looked up in the XPath map cached from the
 * last snapshot. XPath is always used for refs, since CSS selectors cannot
 * cross shadow DOM boundaries and can cause issues with dynamically
 * generated class names. Any other selector is returned unchanged.
 *
 * @throws Error when the ref is not present in the cached map.
 */
function resolveSelector(selector: string): string {
  const ref = parseRef(selector);
  if (!ref) {
    return selector;
  }

  const xpath = refMap.xpathMap[ref];
  if (xpath) {
    return xpath;
  }

  throw new Error(
    `Unknown ref "${ref}" - run snapshot first to populate refs (have ${Object.keys(refMap.xpathMap).length} refs)`,
  );
}

// ==================== COMMAND EXECUTION ====================

/**
 * CDP sessions that already have the network-capture listeners attached.
 * Listeners are attached at most once per session so that disabling and
 * re-enabling capture does not record every request several times.
 */
const networkCaptureSessions = new WeakSet<object>();

/**
 * Execute one daemon command against the browser.
 *
 * @param context   Browser context the command operates on.
 * @param command   Command name; see the `switch` below for the full list.
 * @param args      Positional arguments; their shape depends on `command`.
 * @param stagehand Stagehand instance; required by "click", "fill" and "select".
 * @returns A small command-specific result object.
 * @throws Error for an unknown command or sub-type, a missing active page,
 *         a missing required selector, an unknown ref, or any failure raised
 *         by the underlying page operation.
 */
async function executeCommand(
  context: BrowseContext,
  command: string,
  args: unknown[],
  stagehand?: Stagehand,
): Promise<unknown> {
  // "pages" and "newpage" must work even when there is no active page yet.
  const needsActivePage = command !== "pages" && command !== "newpage";

  // Use awaitActivePage() like stagehand.act() does - handles popups and waits for page to be ready
  const page = needsActivePage
    ? await context.awaitActivePage()
    : context.activePage();
  if (!page && needsActivePage) {
    throw new Error("No active page");
  }

  switch (command) {
    // Navigation
    case "open": {
      const [url, waitUntil, timeout] = args as [string, string?, number?];
      await page!.goto(url, {
        waitUntil: waitUntil as "load" | "domcontentloaded" | "networkidle",
        timeoutMs: timeout ?? 30000,
      });
      return { url: page!.url() };
    }
    case "reload": {
      await page!.reload();
      return { url: page!.url() };
    }
    case "back": {
      await page!.goBack();
      return { url: page!.url() };
    }
    case "forward": {
      await page!.goForward();
      return { url: page!.url() };
    }

    // Click by ref - uses stagehand.act with Action type (skips LLM, uses deterministic path)
    case "click": {
      const [selector] = args as [string];
      if (!stagehand) {
        throw new Error("Stagehand instance not available");
      }
      const resolved = resolveSelector(selector);

      // Construct an Action object (like observe() returns) to use the deterministic path
      const action = {
        selector: resolved,
        description: "click element",
        method: "click",
        arguments: [],
      };

      await stagehand.act(action);
      return { clicked: true };
    }

    // Click by coordinates
    case "click_xy": {
      const [x, y, opts] = args as [
        number,
        number,
        { button?: string; clickCount?: number; returnXPath?: boolean },
      ];
      const result = await page!.click(x, y, {
        button: (opts?.button as "left" | "right" | "middle") ?? "left",
        clickCount: opts?.clickCount ?? 1,
      });
      if (opts?.returnXPath) {
        return { clicked: true, xpath: result };
      }
      return { clicked: true };
    }
    case "hover": {
      const [x, y, opts] = args as [number, number, { returnXPath?: boolean }];
      const result = await page!.hover(x, y);
      if (opts?.returnXPath) {
        return { hovered: true, xpath: result };
      }
      return { hovered: true };
    }
    case "scroll": {
      const [x, y, deltaX, deltaY, opts] = args as [
        number,
        number,
        number,
        number,
        { returnXPath?: boolean },
      ];
      const result = await page!.scroll(x, y, deltaX, deltaY);
      if (opts?.returnXPath) {
        return { scrolled: true, xpath: result };
      }
      return { scrolled: true };
    }
    case "drag": {
      const [fromX, fromY, toX, toY, opts] = args as [
        number,
        number,
        number,
        number,
        {
          steps?: number;
          delay?: number;
          button?: string;
          returnXPath?: boolean;
        },
      ];

      const [fromXpath, toXpath] = await page!.dragAndDrop(
        fromX,
        fromY,
        toX,
        toY,
        {
          button: (opts?.button as "left" | "right" | "middle") ?? "left",
          steps: opts?.steps ?? 10,
          delay: opts?.delay ?? 0,
          returnXpath: opts?.returnXPath,
        },
      );

      if (opts?.returnXPath) {
        return {
          dragged: true,
          xpath: fromXpath,
          fromXpath,
          toXpath,
        };
      }
      return { dragged: true };
    }
    // Keyboard
    case "type": {
      const [text, opts] = args as [
        string,
        { delay?: number; mistakes?: boolean },
      ];
      await page!.type(text, {
        delay: opts?.delay,
        withMistakes: opts?.mistakes,
      });
      return { typed: true };
    }
    case "press": {
      const [key] = args as [string];
      await page!.keyPress(key);
      return { pressed: key };
    }

    // Element actions - use stagehand.act with Action type for reliable interaction
    case "fill": {
      const [selector, value, opts] = args as [
        string,
        string,
        { pressEnter?: boolean }?,
      ];
      if (!stagehand) {
        throw new Error("Stagehand instance not available");
      }
      const resolved = resolveSelector(selector);
      const action = {
        selector: resolved,
        description: "fill element",
        method: "fill",
        arguments: [value],
      };
      await stagehand.act(action);
      if (opts?.pressEnter) {
        await page!.keyPress("Enter");
      }
      return { filled: true, pressedEnter: opts?.pressEnter ?? false };
    }
    case "select": {
      const [selector, values] = args as [string, string[]];
      if (!stagehand) {
        throw new Error("Stagehand instance not available");
      }
      const resolved = resolveSelector(selector);
      // selectOption takes the first value as argument
      const action = {
        selector: resolved,
        description: "select option",
        method: "selectOption",
        arguments: [values[0] || ""],
      };
      await stagehand.act(action);
      return { selected: values };
    }
    case "highlight": {
      const [selector, duration] = args as [string, number?];
      await page!
        .deepLocator(resolveSelector(selector))
        .highlight({ durationMs: duration ?? 2000 });
      return { highlighted: true };
    }
    // Page info
    case "get": {
      const [what, selector] = args as [string, string?];

      // Element-scoped queries need a selector; fail with a clear message
      // instead of an opaque TypeError when it is missing.
      const locate = () => {
        if (selector == null) {
          throw new Error(`get ${what} requires a selector`);
        }
        return page!.deepLocator(resolveSelector(selector));
      };

      switch (what) {
        case "url":
          return { url: page!.url() };
        case "title":
          return { title: await page!.title() };
        case "text":
          return { text: await locate().textContent() };
        case "html":
          return { html: await locate().innerHtml() };
        case "value":
          return { value: await locate().inputValue() };
        case "box": {
          const { x, y } = await locate().centroid();
          return { x: Math.round(x), y: Math.round(y) };
        }
        case "visible":
          return { visible: await locate().isVisible() };
        case "checked":
          return { checked: await locate().isChecked() };
        default:
          throw new Error(`Unknown get type: ${what}`);
      }
    }

    // Screenshot
    case "screenshot": {
      const [opts] = args as [
        {
          path?: string;
          fullPage?: boolean;
          type?: string;
          quality?: number;
          clip?: object;
          animations?: string;
          caret?: string;
        },
      ];
      const buffer = await page!.screenshot({
        fullPage: opts?.fullPage,
        type: opts?.type as "png" | "jpeg" | undefined,
        quality: opts?.quality,
        clip: opts?.clip as
          | { x: number; y: number; width: number; height: number }
          | undefined,
        animations: opts?.animations as "disabled" | "allow" | undefined,
        caret: opts?.caret as "hide" | "initial" | undefined,
        timeout: 10000,
      });
      if (opts?.path) {
        await fs.writeFile(opts.path, buffer);
        return { saved: opts.path };
      }
      return { base64: buffer.toString("base64") };
    }

    // Snapshot
    case "snapshot": {
      const [compact] = args as [boolean?];
      const snapshot = await page!.snapshot();

      // Cache the maps so later commands can use @ref selectors.
      refMap = {
        xpathMap: snapshot.xpathMap ?? {},
        urlMap: snapshot.urlMap ?? {},
      };

      if (compact) {
        return { tree: snapshot.formattedTree };
      }
      return {
        tree: snapshot.formattedTree,
        xpathMap: snapshot.xpathMap,
        urlMap: snapshot.urlMap,
      };
    }

    // Viewport
    case "viewport": {
      const [width, height, scale] = args as [number, number, number?];
      await page!.setViewportSize(width, height, {
        deviceScaleFactor: scale ?? 1,
      });
      return { viewport: { width, height } };
    }

    // Eval
    case "eval": {
      const [expr] = args as [string];
      const result = await page!.evaluate(expr);
      return { result };
    }
    // Element state
    case "is": {
      const [check, selector] = args as [string, string];
      const locator = page!.deepLocator(resolveSelector(selector));
      switch (check) {
        case "visible":
          return { visible: await locator.isVisible() };
        case "checked":
          return { checked: await locator.isChecked() };
        default:
          throw new Error(`Unknown check: ${check}`);
      }
    }
    // Wait
    case "wait": {
      const [type, arg, opts] = args as [
        string,
        string?,
        { timeout?: number; state?: string }?,
      ];
      switch (type) {
        case "load":
          await page!.waitForLoadState(
            (arg as "load" | "domcontentloaded" | "networkidle") ?? "load",
            opts?.timeout ?? 30000,
          );
          break;
        case "selector":
          await page!.waitForSelector(resolveSelector(arg!), {
            state:
              (opts?.state as "attached" | "detached" | "visible" | "hidden") ??
              "visible",
            timeout: opts?.timeout ?? 30000,
          });
          break;
        case "timeout":
          await page!.waitForTimeout(parseInt(arg!));
          break;
        default:
          throw new Error(`Unknown wait type: ${type}`);
      }
      return { waited: true };
    }

    // Cursor
    case "cursor": {
      await page!.enableCursorOverlay();
      return { cursor: "enabled" };
    }

    // Multi-page
    case "pages": {
      const pages = context.pages();
      return {
        pages: pages.map((p: BrowsePage, i: number) => ({
          index: i,
          url: p.url(),
          targetId: p.targetId(),
        })),
      };
    }
    case "newpage": {
      const [url] = args as [string?];
      const newPage = await context.newPage(url);
      return {
        created: true,
        url: newPage.url(),
        targetId: newPage.targetId(),
      };
    }
    case "tab_switch": {
      const [index] = args as [number];
      const pages = context.pages();
      if (index < 0 || index >= pages.length) {
        throw new Error(
          `Tab index ${index} out of range (0-${pages.length - 1})`,
        );
      }
      context.setActivePage(pages[index]);
      return { switched: true, index, url: pages[index].url() };
    }
    case "tab_close": {
      const [index] = args as [number?];
      const pages = context.pages();
      // Default to the last tab when no index is given.
      const targetIndex = index ?? pages.length - 1;
      if (targetIndex < 0 || targetIndex >= pages.length) {
        throw new Error(
          `Tab index ${targetIndex} out of range (0-${pages.length - 1})`,
        );
      }
      if (pages.length === 1) {
        throw new Error("Cannot close the last tab");
      }
      await pages[targetIndex].close();
      return { closed: true, index: targetIndex };
    }

    // Debug: show current ref map
    case "refs": {
      return {
        count: Object.keys(refMap.xpathMap).length,
        xpathMap: refMap.xpathMap,
        urlMap: refMap.urlMap,
      };
    }

    // Network capture commands
    case "network_enable": {
      if (networkEnabled && networkDir) {
        return { enabled: true, path: networkDir, alreadyEnabled: true };
      }

      const session = networkSession || "default";
      networkDir = getNetworkDir(session);
      await fs.mkdir(networkDir, { recursive: true });
      networkCounter = 0;
      pendingRequests.clear();

      const cdpSession = page!.mainFrame().session;
      await cdpSession.send("Network.enable", {
        maxTotalBufferSize: 10000000,
        maxResourceBufferSize: 5000000,
      });

      // Attach the listeners only once per CDP session. They stay registered
      // across network_disable (gated by `networkEnabled`), so attaching them
      // again on re-enable would capture every request more than once.
      if (!networkCaptureSessions.has(cdpSession)) {
        networkCaptureSessions.add(cdpSession);

        // Per-request bookkeeping, keyed by CDP request id.
        const requestStartTimes = new Map<string, number>();
        const requestDirs = new Map<string, string>();
        const responseMeta = new Map<
          string,
          {
            status: number;
            statusText: string;
            headers: Record<string, string>;
            mimeType: string;
          }
        >();

        const forgetRequest = (requestId: string): void => {
          pendingRequests.delete(requestId);
          requestStartTimes.delete(requestId);
          requestDirs.delete(requestId);
          responseMeta.delete(requestId);
        };

        cdpSession.on(
          "Network.requestWillBeSent",
          async (params: Protocol.Network.RequestWillBeSentEvent) => {
            if (!networkEnabled || !networkDir) return;

            const request: PendingRequest = {
              id: params.requestId,
              timestamp: new Date().toISOString(),
              method: params.request.method,
              url: params.request.url,
              headers: params.request.headers || {},
              body: params.request.postData || null,
              resourceType: params.type || "Other",
            };

            pendingRequests.set(params.requestId, request);
            requestStartTimes.set(params.requestId, Date.now());

            const requestDir = await writeRequestToFs(request);
            if (requestDir) {
              requestDirs.set(params.requestId, requestDir);
            }
          },
        );

        // Remember status line and headers so they can be written out once
        // the body has finished loading.
        cdpSession.on(
          "Network.responseReceived",
          (params: Protocol.Network.ResponseReceivedEvent) => {
            if (!networkEnabled) return;

            responseMeta.set(params.requestId, {
              status: params.response.status,
              statusText: params.response.statusText,
              headers: params.response.headers || {},
              mimeType: params.response.mimeType,
            });
          },
        );

        cdpSession.on(
          "Network.loadingFinished",
          async (params: Protocol.Network.LoadingFinishedEvent) => {
            if (!networkEnabled) return;

            const requestDir = requestDirs.get(params.requestId);
            const pending = pendingRequests.get(params.requestId);
            if (!requestDir || !pending) return;

            const startTime =
              requestStartTimes.get(params.requestId) || Date.now();
            const duration = Date.now() - startTime;

            let body: string | null = null;
            try {
              const result =
                await cdpSession.send<Protocol.Network.GetResponseBodyResponse>(
                  "Network.getResponseBody",
                  {
                    requestId: params.requestId,
                  },
                );
              body = result.body || null;
              if (result.base64Encoded && body) {
                // Binary bodies are not stored in full, only a short preview.
                body = `[base64] ${body.slice(0, 100)}...`;
              }
            } catch {
              // Body not available (e.g., for redirects)
            }

            const meta = responseMeta.get(params.requestId);
            const responseData = {
              id: params.requestId,
              status: meta?.status ?? 0,
              statusText: meta?.statusText ?? "",
              headers: meta?.headers ?? ({} as Record<string, string>),
              mimeType: meta?.mimeType ?? "",
              body,
              duration,
            };

            await writeResponseToFs(requestDir, responseData);

            forgetRequest(params.requestId);
          },
        );

        cdpSession.on(
          "Network.loadingFailed",
          async (params: Protocol.Network.LoadingFailedEvent) => {
            if (!networkEnabled) return;

            const requestDir = requestDirs.get(params.requestId);
            if (!requestDir) return;

            const startTime =
              requestStartTimes.get(params.requestId) || Date.now();
            const duration = Date.now() - startTime;

            const responseData = {
              id: params.requestId,
              status: 0,
              statusText: "Failed",
              headers: {},
              mimeType: "",
              body: null,
              duration,
              error: params.errorText || "Unknown error",
            };

            await writeResponseToFs(requestDir, responseData);

            forgetRequest(params.requestId);
          },
        );
      }

      networkEnabled = true;
      return { enabled: true, path: networkDir };
    }

    case "network_disable": {
      if (!networkEnabled) {
        return { enabled: false, alreadyDisabled: true };
      }

      try {
        await page!.mainFrame().session.send("Network.disable");
      } catch {}

      networkEnabled = false;
      return { enabled: false, path: networkDir };
    }

    case "network_path": {
      if (!networkDir) {
        const session = networkSession || "default";
        return { path: getNetworkDir(session), enabled: false };
      }
      return { path: networkDir, enabled: networkEnabled };
    }

    case "network_clear": {
      if (!networkDir) {
        return { cleared: false, error: "Network capture not enabled" };
      }

      try {
        const entries = await fs.readdir(networkDir, { withFileTypes: true });
        for (const entry of entries) {
          if (entry.isDirectory()) {
            await fs.rm(path.join(networkDir, entry.name), { recursive: true });
          }
        }
        networkCounter = 0;
        pendingRequests.clear();
        return { cleared: true, path: networkDir };
      } catch (err) {
        return {
          cleared: false,
          error: err instanceof Error ? err.message : String(err),
        };
      }
    }

    // Daemon control
    case "stop": {
      // Deferred so the response can be produced before shutdown begins.
      process.nextTick(() => {
        process.emit("SIGTERM");
      });
      return { stopping: true };
    }

    default:
      throw new Error(`Unknown command: ${command}`);
  }
}

// ==================== CLIENT ====================

/**
 * Send one request to the session daemon over its socket and settle with the
 * daemon's reply.
 *
 * The request is written as a single JSON line once the connection is open;
 * the first line received back is treated as the response.
 *
 * @param session Session name used to derive the socket path.
 * @param command Daemon command name.
 * @param args Positional arguments forwarded to the daemon.
 * @returns The `result` field of a successful response.
 * @throws Error with the daemon's error text when the response is unsuccessful,
 *   `"Connection failed: …"` on socket errors, `"Command timeout"` after 60s,
 *   or a descriptive error when the reply is not valid JSON or the connection
 *   closes before any reply arrives.
 */
async function sendCommandOnce(
  session: string,
  command: string,
  args: unknown[],
): Promise<unknown> {
  return new Promise((resolve, reject) => {
    const socketPath = getSocketPath(session);
    const client = net.createConnection(socketPath);
    const rl = readline.createInterface({ input: client });
    let done = false;

    // Idempotent teardown; `done` is flipped first so the "close" handler
    // below can tell a deliberate close from an unexpected one.
    const cleanup = () => {
      if (!done) {
        done = true;
        clearTimeout(timeout);
        rl.close();
        client.destroy();
      }
    };

    const timeout = setTimeout(() => {
      cleanup();
      reject(new Error("Command timeout"));
    }, 60000);

    rl.on("line", (line) => {
      let response: DaemonResponse;
      try {
        response = JSON.parse(line);
      } catch (err) {
        // A throw inside an event handler would surface as an uncaught
        // exception; turn it into a rejection the caller can handle.
        cleanup();
        reject(
          new Error(
            `Invalid response from daemon: ${err instanceof Error ? err.message : String(err)}`,
          ),
        );
        return;
      }
      cleanup();
      if (response.success) {
        resolve(response.result);
      } else {
        reject(new Error(response.error));
      }
    });

    rl.on("error", () => {});

    // Input ended without a response line: fail fast instead of waiting for
    // the 60s timeout. The message deliberately avoids the phrases the retry
    // logic treats as "daemon not reachable".
    rl.on("close", () => {
      if (done) return;
      cleanup();
      reject(new Error("Daemon closed connection before sending a response"));
    });

    client.on("connect", () => {
      const request: DaemonRequest = { command, args };
      client.write(JSON.stringify(request) + "\n");
    });

    client.on("error", (err) => {
      cleanup();
      reject(new Error(`Connection failed: ${err.message}`));
    });
  });
}

/**
 * Send a command to the session daemon, recovering from connection failures.
 *
 * Recovery escalates with each failed attempt:
 *   1. wait 200ms and retry,
 *   2. make sure a daemon is running (`ensureDaemon`) and retry,
 *   3. kill Chrome processes, remove stale files, restart the daemon and retry
 *      one last time.
 *
 * Errors that are not connection failures, and any failure of the `stop`
 * command, are rethrown immediately without recovery.
 *
 * @param session Session name.
 * @param command Daemon command name.
 * @param args Positional arguments forwarded to the daemon.
 * @param headless Passed to `ensureDaemon` when the daemon must be (re)started.
 * @returns The daemon's result for the command.
 * @throws Error `"Max retries exceeded …"` when the daemon is still unreachable
 *   after the final restart.
 */
async function sendCommand(
  session: string,
  command: string,
  args: unknown[],
  headless: boolean = false,
): Promise<unknown> {
  const maxRetries = 3;

  const isConnectionError = (err: unknown): boolean => {
    const errMsg = err instanceof Error ? err.message : String(err);
    return (
      errMsg.includes("ENOENT") ||
      errMsg.includes("ECONNREFUSED") ||
      errMsg.includes("Connection failed")
    );
  };

  for (let attempt = 0; attempt < maxRetries; attempt++) {
    try {
      return await sendCommandOnce(session, command, args);
    } catch (err) {
      if (command === "stop" || !isConnectionError(err)) {
        throw err;
      }

      // Attempt 0: Brief wait and retry (socket might be temporarily unavailable)
      if (attempt === 0) {
        await new Promise((r) => setTimeout(r, 200));
        continue;
      }

      // Attempt 1: Try to restart daemon without cleanup
      if (attempt === 1) {
        await ensureDaemon(session, headless);
        continue;
      }

      // Last resort: Full cleanup and restart
      await killChromeProcesses(session);
      await cleanupStaleFiles(session);
      await ensureDaemon(session, headless);
    }
  }

  // The full cleanup above produced a fresh daemon; without this final send
  // that restart would be wasted and the command would fail regardless.
  try {
    return await sendCommandOnce(session, command, args);
  } catch (err) {
    if (!isConnectionError(err)) {
      throw err;
    }
    throw new Error(
      `Max retries exceeded for command ${command} on session ${session}`,
    );
  }
}

/**
 * Ask the session daemon to stop, pause briefly, then remove the session's
 * stale files. A failed stop request is ignored.
 */
async function stopDaemonAndCleanup(session: string): Promise<void> {
  await sendCommandOnce(session, "stop", []).catch(() => {
    // Daemon may already be down.
  });

  // Fixed 500ms pause between the stop request and the file cleanup.
  await new Promise<void>((resume) => {
    setTimeout(resume, 500);
  });

  await cleanupStaleFiles(session);
}

/**
 * Make sure a daemon for `session` is running in the desired mode, spawning
 * one if necessary.
 *
 * If a daemon is already running in the desired mode this returns without
 * spawning. If one is running in a different mode it is stopped first. The
 * spawn itself happens under the session lock, and the lock is always
 * released before returning or throwing.
 *
 * @param session Session name.
 * @param headless When true, `--headless` is appended to the daemon's arguments.
 * @throws Error when the lock cannot be acquired, when the child process
 *   errors or exits before the socket is ready, or when startup times out.
 *   Whatever `assertModeSupported` throws also propagates.
 */
async function ensureDaemon(session: string, headless: boolean): Promise<void> {
  const wantMode = await getDesiredMode(session);
  assertModeSupported(wantMode);

  // Fast path, checked without holding the lock.
  if (await isDaemonRunning(session)) {
    // Missing mode file means daemon predates mode support, which was local-only.
    const currentMode = (await readCurrentMode(session)) ?? "local";
    if (currentMode === wantMode) {
      return;
    }
    await stopDaemonAndCleanup(session);
  }

  // Acquire lock before spawning to prevent race conditions
  const locked = await acquireLock(session);
  if (!locked) {
    throw new Error(`Timeout acquiring lock for session ${session}`);
  }

  try {
    // Re-check after acquiring lock (another process may have started daemon)
    if (await isDaemonRunning(session)) {
      const currentMode = (await readCurrentMode(session)) ?? "local";
      if (currentMode === wantMode) {
        return;
      }
      await stopDaemonAndCleanup(session);
    }

    // Re-invoke this same executable and script with the internal `daemon`
    // subcommand.
    const args = ["--session", session, "daemon"];
    if (headless) args.push("--headless");

    const child = spawn(process.argv[0], [process.argv[1], ...args], {
      detached: true,
      // Avoid piping stdout for detached daemon startup. Deep-locator internals
      // can log via console fallback, and writing to a broken pipe crashes daemon.
      stdio: ["ignore", "ignore", "ignore"],
    });
    child.unref();

    // Settle on whichever happens first: socket ready, child error, child
    // exit, or the 30s timer.
    await new Promise<void>((resolve, reject) => {
      let settled = false;

      // Single settle point: clears the timer and detaches the child
      // listeners so later events are ignored.
      const finish = (err?: Error) => {
        if (settled) return;
        settled = true;
        clearTimeout(timeout);
        child.off("error", onError);
        child.off("exit", onExit);
        if (err) reject(err);
        else resolve();
      };

      const onError = (err: Error) => {
        finish(err);
      };

      const onExit = (code: number | null, signal: string | null) => {
        finish(
          new Error(
            `Daemon exited before ready (code=${code ?? "null"}, signal=${signal ?? "null"})`,
          ),
        );
      };

      const timeout = setTimeout(() => {
        finish(new Error("Timeout waiting for daemon to start"));
      }, 30000);

      child.once("error", onError);
      child.once("exit", onExit);

      // Readiness is determined by socket connectivity, not daemon stdout.
      // The socket wait (28s) is shorter than the outer timer (30s).
      waitForSocketReady(getSocketPath(session), 28000)
        .then(() => finish())
        .catch((err) =>
          finish(err instanceof Error ? err : new Error(String(err))),
        );
    });
  } finally {
    await releaseLock(session);
  }
}

// ==================== CLI INTERFACE ====================

/** Global CLI flags, as read via `program.opts<GlobalOpts>()`. */
interface GlobalOpts {
  /** CDP WebSocket URL; when set, `runCommand` connects directly instead of using the daemon. */
  ws?: string;
  /** Set by `--headless`. */
  headless?: boolean;
  /** Set by `--headed`; when true, `isHeadless` returns false regardless of `headless`. */
  headed?: boolean;
  /** Set by `--json`. */
  json?: boolean;
  /** Session name from `--session`; `getSession` falls back to `BROWSE_SESSION`, then "default". */
  session?: string;
}

/**
 * Resolve the session name: the explicit `--session` value wins, then the
 * `BROWSE_SESSION` environment variable, then "default".
 */
function getSession(opts: GlobalOpts): string {
  if (opts.session != null) {
    return opts.session;
  }
  const fromEnv = process.env.BROWSE_SESSION;
  return fromEnv != null ? fromEnv : "default";
}

/**
 * Headless only when `--headless` was given and `--headed` was not.
 */
function isHeadless(opts: GlobalOpts): boolean {
  if (opts.headed === true) {
    return false;
  }
  return opts.headless === true;
}

/**
 * Print a command result to stdout. Strings are printed verbatim unless
 * `json` is set; everything else is pretty-printed as JSON.
 */
function output(data: unknown, json: boolean): void {
  const printRaw = !json && typeof data === "string";
  const rendered = printRaw ? data : JSON.stringify(data, null, 2);
  console.log(rendered);
}

/**
 * Execute a command either through the session daemon (default) or, when
 * `--ws` is given, directly against the supplied CDP endpoint.
 *
 * @param command Command name understood by `executeCommand` / the daemon.
 * @param args Positional arguments for the command.
 * @returns Whatever the command produced.
 */
async function runCommand(command: string, args: unknown[]): Promise<unknown> {
  const globals = program.opts<GlobalOpts>();

  if (!globals.ws) {
    // Daemon path: make sure it is up, then send the request.
    const session = getSession(globals);
    const headless = isHeadless(globals);
    await ensureDaemon(session, headless);
    return sendCommand(session, command, args, headless);
  }

  // If --ws provided, bypass daemon and connect directly
  const direct = new Stagehand({
    env: "LOCAL",
    verbose: 0,
    disablePino: true,
    localBrowserLaunchOptions: {
      cdpUrl: globals.ws,
    },
  });
  await direct.init();
  try {
    return await executeCommand(direct.context, command, args);
  } finally {
    await direct.close();
  }
}

// Program identity and the global flags shared by every subcommand.
program.name("browse");
program.description("Browser automation CLI for AI agents");
program.version(VERSION);
program.option(
  "--ws <url>",
  "CDP WebSocket URL (bypasses daemon, direct connection)",
);
program.option("--headless", "Run Chrome in headless mode");
program.option("--headed", "Run Chrome with visible window (default)");
program.option("--json", "Output as JSON", false);
program.option(
  "--session <name>",
  "Session name for multiple browsers (or use BROWSE_SESSION env var)",
);

// ==================== DAEMON COMMANDS ====================

// `start`: launch the daemon for the session unless one is already running.
program
  .command("start")
  .description("Start browser daemon (auto-started by other commands)")
  .action(async () => {
    const globals = program.opts<GlobalOpts>();
    const session = getSession(globals);
    const alreadyUp = await isDaemonRunning(session);
    if (!alreadyUp) {
      await ensureDaemon(session, isHeadless(globals));
    }
    const status = alreadyUp ? "already running" : "started";
    console.log(JSON.stringify({ status, session }));
  });

// `stop`: ask the daemon to exit; with --force, fall back to killing Chrome
// and removing stale files when the daemon cannot be reached.
program
  .command("stop")
  .description("Stop browser daemon")
  .option("--force", "Force kill Chrome processes if daemon is unresponsive")
  .action(async (cmdOpts) => {
    const session = getSession(program.opts<GlobalOpts>());
    // Clear any explicit env override so next start uses env var detection
    try {
      await fs.unlink(getModeOverridePath(session));
    } catch {}
    try {
      await sendCommand(session, "stop", []);
      console.log(JSON.stringify({ status: "stopped", session }));
    } catch {
      if (!cmdOpts.force) {
        console.log(JSON.stringify({ status: "not running", session }));
        return;
      }
      await killChromeProcesses(session);
      await cleanupStaleFiles(session);
      console.log(JSON.stringify({ status: "force stopped", session }));
    }
  });

// `status`: report whether the daemon is running, plus its WebSocket URL and
// mode when it is.
program
  .command("status")
  .description("Check daemon status")
  .action(async () => {
    const session = getSession(program.opts<GlobalOpts>());
    const running = await isDaemonRunning(session);
    let wsUrl: string | null = null;
    let mode: BrowseMode | null = null;
    if (running) {
      const wsFile = getWsPath(session);
      try {
        wsUrl = await fs.readFile(wsFile, "utf-8");
      } catch {}
      mode = await readCurrentMode(session);
    }
    const report = { running, session, wsUrl, mode };
    console.log(JSON.stringify(report));
  });

// `env`: with no argument, print the running and desired browser mode; with
// `local` or `remote`, persist the choice and restart the daemon if its
// current mode differs.
program
  .command("env [target]")
  .description("Show or switch browser environment (local | remote)")
  .action(async (target?: string) => {
    const opts = program.opts<GlobalOpts>();
    const session = getSession(opts);

    if (!target) {
      let mode: string | null = null;
      const desiredMode = await getDesiredMode(session);
      if (await isDaemonRunning(session)) {
        mode = toModeTarget((await readCurrentMode(session)) ?? desiredMode);
      }
      console.log(
        JSON.stringify({
          mode: mode ?? "not running",
          desired: toModeTarget(desiredMode),
          session,
        }),
      );
      return;
    }

    // A Map is used instead of a plain object so that inherited property
    // names ("toString", "constructor", …) are not mistaken for valid targets.
    const modeMap = new Map<string, BrowseMode>([
      ["local", "local"],
      ["remote", "browserbase"],
    ]);
    const mapped = modeMap.get(target);
    if (!mapped) {
      console.error("Usage: browse env [local|remote]");
      process.exit(1);
    }

    try {
      assertModeSupported(mapped);
    } catch (err) {
      console.error(err instanceof Error ? err.message : String(err));
      process.exit(1);
    }

    // Persist the explicit choice before touching the daemon.
    await fs.writeFile(getModeOverridePath(session), mapped);

    if (await isDaemonRunning(session)) {
      // Missing mode file is treated as "local".
      const currentMode = (await readCurrentMode(session)) ?? "local";
      if (currentMode === mapped) {
        console.log(
          JSON.stringify({
            mode: toModeTarget(mapped),
            session,
            restarted: false,
          }),
        );
        return;
      }
      await stopDaemonAndCleanup(session);
    }

    await ensureDaemon(session, isHeadless(opts));

    console.log(
      JSON.stringify({
        mode: toModeTarget(mapped),
        session,
        restarted: true,
      }),
    );
  });

// `refs`: print the ref map cached by the last snapshot.
program
  .command("refs")
  .description("Show cached ref map from last snapshot")
  .action(async () => {
    const globals = program.opts<GlobalOpts>();
    try {
      const reply = await runCommand("refs", []);
      output(reply, globals.json ?? false);
    } catch (err) {
      const detail = err instanceof Error ? err.message : err;
      console.error("Error:", detail);
      process.exit(1);
    }
  });

// `daemon`: internal entry point used when this CLI re-spawns itself.
program
  .command("daemon")
  .description("Run as daemon (internal use)")
  .action(async () => {
    const globals = program.opts<GlobalOpts>();
    const session = getSession(globals);
    const headless = isHeadless(globals);
    await runDaemon(session, headless);
  });

// ==================== NAVIGATION ====================

// `open` / `goto`: navigate to a URL. With --context-id the context config is
// written to the session's context file (restarting a running daemon whose
// context differs); without it any existing context file is removed.
program
  .command("open <url>")
  .alias("goto")
  .description("Navigate to URL")
  .option(
    "--wait <state>",
    "Wait state: load, domcontentloaded, networkidle",
    "load",
  )
  .option("-t, --timeout <ms>", "Navigation timeout in milliseconds", "30000")
  .option(
    "--context-id <id>",
    "Browserbase context ID to load browser state (remote mode only)",
  )
  .option(
    "--persist",
    "Persist context changes back after session ends (requires --context-id)",
    false,
  )
  .action(async (url: string, cmdOpts) => {
    const opts = program.opts<GlobalOpts>();
    try {
      // Validate context flags
      if (cmdOpts.persist && !cmdOpts.contextId) {
        console.error("Error: --persist requires --context-id");
        process.exit(1);
      }

      // Validate the timeout up front. An unparseable value would otherwise
      // become NaN, which JSON-serializes to null in the daemon request.
      const rawTimeout = String(cmdOpts.timeout).trim();
      if (!/^\d+$/.test(rawTimeout)) {
        console.error(
          "Error: --timeout must be a non-negative integer (milliseconds)",
        );
        process.exit(1);
      }
      const timeoutMs = parseInt(rawTimeout, 10);

      const session = getSession(opts);

      if (cmdOpts.contextId) {
        // Contexts only work with Browserbase remote sessions
        const desiredMode = await getDesiredMode(session);
        if (desiredMode === "local") {
          console.error(
            "Error: --context-id is only supported in remote mode. Run `browse env remote` first.",
          );
          process.exit(1);
        }

        const newConfig = JSON.stringify({
          id: cmdOpts.contextId,
          persist: cmdOpts.persist ?? false,
        });

        // If daemon is already running with a different context, restart it
        // (context is baked into the Browserbase session at creation time)
        if (await isDaemonRunning(session)) {
          let currentConfig: string | null = null;
          try {
            currentConfig = await fs.readFile(getContextPath(session), "utf-8");
          } catch {}
          if (currentConfig !== newConfig) {
            await stopDaemonAndCleanup(session);
          }
        }

        await fs.writeFile(getContextPath(session), newConfig);
      } else {
        // No --context-id: clear any stale context file so the daemon starts clean
        try {
          await fs.unlink(getContextPath(session));
        } catch {}
      }

      const result = await runCommand("open", [url, cmdOpts.wait, timeoutMs]);
      output(result, opts.json ?? false);
    } catch (e) {
      console.error("Error:", e instanceof Error ? e.message : e);
      process.exit(1);
    }
  });

// `reload`: reload the current page.
program
  .command("reload")
  .description("Reload current page")
  .action(async () => {
    const globals = program.opts<GlobalOpts>();
    try {
      const reply = await runCommand("reload", []);
      output(reply, globals.json ?? false);
    } catch (err) {
      const detail = err instanceof Error ? err.message : err;
      console.error("Error:", detail);
      process.exit(1);
    }
  });

// `back`: step back in history.
program
  .command("back")
  .description("Go back in history")
  .action(async () => {
    const globals = program.opts<GlobalOpts>();
    try {
      const reply = await runCommand("back", []);
      output(reply, globals.json ?? false);
    } catch (err) {
      const detail = err instanceof Error ? err.message : err;
      console.error("Error:", detail);
      process.exit(1);
    }
  });

// `forward`: step forward in history.
program
  .command("forward")
  .description("Go forward in history")
  .action(async () => {
    const globals = program.opts<GlobalOpts>();
    try {
      const reply = await runCommand("forward", []);
      output(reply, globals.json ?? false);
    } catch (err) {
      const detail = err instanceof Error ? err.message : err;
      console.error("Error:", detail);
      process.exit(1);
    }
  });

// ==================== CLICK ACTIONS ====================

// `click`: click an element identified by ref or selector.
program
  .command("click <ref>")
  .description("Click element by ref (e.g., @0-5, 0-5, or CSS/XPath selector)")
  .option("-b, --button <btn>", "Mouse button: left, right, middle", "left")
  .option("-c, --count <n>", "Click count", "1")
  .option(
    "-f, --force",
    "Force click even if element has no layout (uses synthetic event)",
  )
  .action(async (ref: string, cmdOpts) => {
    const globals = program.opts<GlobalOpts>();
    try {
      const clickOptions = {
        button: cmdOpts.button,
        clickCount: parseInt(cmdOpts.count),
        force: cmdOpts.force,
      };
      const reply = await runCommand("click", [ref, clickOptions]);
      output(reply, globals.json ?? false);
    } catch (err) {
      const detail = err instanceof Error ? err.message : err;
      console.error("Error:", detail);
      process.exit(1);
    }
  });

// `click_xy`: click at page coordinates.
program
  .command("click_xy <x> <y>")
  .description("Click at exact coordinates")
  .option("-b, --button <btn>", "Mouse button: left, right, middle", "left")
  .option("-c, --count <n>", "Click count", "1")
  .option("--xpath", "Return XPath of clicked element")
  .action(async (x: string, y: string, cmdOpts) => {
    const globals = program.opts<GlobalOpts>();
    try {
      const px = parseFloat(x);
      const py = parseFloat(y);
      const clickOptions = {
        button: cmdOpts.button,
        clickCount: parseInt(cmdOpts.count),
        returnXPath: cmdOpts.xpath,
      };
      const reply = await runCommand("click_xy", [px, py, clickOptions]);
      output(reply, globals.json ?? false);
    } catch (err) {
      const detail = err instanceof Error ? err.message : err;
      console.error("Error:", detail);
      process.exit(1);
    }
  });

// ==================== COORDINATE ACTIONS ====================

// `hover`: move the pointer to page coordinates.
program
  .command("hover <x> <y>")
  .description("Hover at coordinates")
  .option("--xpath", "Return XPath of hovered element")
  .action(async (x: string, y: string, cmdOpts) => {
    const globals = program.opts<GlobalOpts>();
    try {
      const px = parseFloat(x);
      const py = parseFloat(y);
      const reply = await runCommand("hover", [
        px,
        py,
        { returnXPath: cmdOpts.xpath },
      ]);
      output(reply, globals.json ?? false);
    } catch (err) {
      const detail = err instanceof Error ? err.message : err;
      console.error("Error:", detail);
      process.exit(1);
    }
  });

// `scroll`: scroll by (deltaX, deltaY) at page coordinates.
program
  .command("scroll <x> <y> <deltaX> <deltaY>")
  .description("Scroll at coordinates")
  .option("--xpath", "Return XPath of scrolled element")
  .action(async (x: string, y: string, dx: string, dy: string, cmdOpts) => {
    const globals = program.opts<GlobalOpts>();
    try {
      const numbers = [x, y, dx, dy].map((raw) => parseFloat(raw));
      const reply = await runCommand("scroll", [
        ...numbers,
        { returnXPath: cmdOpts.xpath },
      ]);
      output(reply, globals.json ?? false);
    } catch (err) {
      const detail = err instanceof Error ? err.message : err;
      console.error("Error:", detail);
      process.exit(1);
    }
  });

// `drag`: press at the first point and release at the second.
program
  .command("drag <fromX> <fromY> <toX> <toY>")
  .description("Drag from one point to another")
  .option("-b, --button <btn>", "Mouse button: left, right, middle", "left")
  .option("--steps <n>", "Number of intermediate drag steps", "10")
  .option("--delay <ms>", "Delay between drag steps in milliseconds", "0")
  .option("--xpath", "Return XPath of source and target elements")
  .action(async (fx: string, fy: string, tx: string, ty: string, cmdOpts) => {
    const globals = program.opts<GlobalOpts>();
    try {
      const points = [fx, fy, tx, ty].map((raw) => parseFloat(raw));
      const dragOptions = {
        button: cmdOpts.button,
        steps: parseInt(cmdOpts.steps, 10),
        delay: parseInt(cmdOpts.delay, 10),
        returnXPath: cmdOpts.xpath,
      };
      const reply = await runCommand("drag", [...points, dragOptions]);
      output(reply, globals.json ?? false);
    } catch (err) {
      const detail = err instanceof Error ? err.message : err;
      console.error("Error:", detail);
      process.exit(1);
    }
  });

// ==================== KEYBOARD ====================

// `type`: type a string, optionally with a per-keystroke delay and
// human-like mistakes.
program
  .command("type <text>")
  .description("Type text")
  .option("-d, --delay <ms>", "Delay between keystrokes")
  .option("--mistakes", "Enable human-like typing with mistakes")
  .action(async (text: string, cmdOpts) => {
    const globals = program.opts<GlobalOpts>();
    try {
      // The delay is only parsed when the flag was supplied.
      const delay = cmdOpts.delay ? parseInt(cmdOpts.delay) : undefined;
      const reply = await runCommand("type", [
        text,
        { delay, mistakes: cmdOpts.mistakes },
      ]);
      output(reply, globals.json ?? false);
    } catch (err) {
      const detail = err instanceof Error ? err.message : err;
      console.error("Error:", detail);
      process.exit(1);
    }
  });

// `press` / `key`: press a single key or key combination.
program
  .command("press <key>")
  .alias("key")
  .description("Press key (e.g., Enter, Tab, Escape, Cmd+A)")
  .action(async (key: string) => {
    const globals = program.opts<GlobalOpts>();
    try {
      const reply = await runCommand("press", [key]);
      output(reply, globals.json ?? false);
    } catch (err) {
      const detail = err instanceof Error ? err.message : err;
      console.error("Error:", detail);
      process.exit(1);
    }
  });

// ==================== ELEMENT ACTIONS ====================

// `fill`: fill an input; Enter is pressed afterwards unless --no-press-enter.
program
  .command("fill <selector> <value>")
  .description("Fill input element (presses Enter by default)")
  .option("--no-press-enter", "Don't press Enter after filling")
  .action(async (selector: string, value: string, cmdOpts) => {
    const globals = program.opts<GlobalOpts>();
    try {
      const fillOptions = { pressEnter: cmdOpts.pressEnter !== false };
      const reply = await runCommand("fill", [selector, value, fillOptions]);
      output(reply, globals.json ?? false);
    } catch (err) {
      const detail = err instanceof Error ? err.message : err;
      console.error("Error:", detail);
      process.exit(1);
    }
  });

// `select`: choose one or more options of a select element.
program
  .command("select <selector> <values...>")
  .description("Select option(s)")
  .action(async (selector: string, values: string[]) => {
    const globals = program.opts<GlobalOpts>();
    try {
      const reply = await runCommand("select", [selector, values]);
      output(reply, globals.json ?? false);
    } catch (err) {
      const detail = err instanceof Error ? err.message : err;
      console.error("Error:", detail);
      process.exit(1);
    }
  });

// `highlight`: highlight an element for a duration in milliseconds.
program
  .command("highlight <selector>")
  .description("Highlight element")
  .option("-d, --duration <ms>", "Duration", "2000")
  .action(async (selector: string, cmdOpts) => {
    const globals = program.opts<GlobalOpts>();
    try {
      const durationMs = parseInt(cmdOpts.duration);
      const reply = await runCommand("highlight", [selector, durationMs]);
      output(reply, globals.json ?? false);
    } catch (err) {
      const detail = err instanceof Error ? err.message : err;
      console.error("Error:", detail);
      process.exit(1);
    }
  });

// ==================== PAGE INFO ====================

// `get`: read a page-level or element-level property.
program
  .command("get <what> [selector]")
  .description(
    "Get page info: url, title, text, html, value, box, visible, checked",
  )
  .action(async (what: string, selector?: string) => {
    const globals = program.opts<GlobalOpts>();
    try {
      const reply = await runCommand("get", [what, selector]);
      output(reply, globals.json ?? false);
    } catch (err) {
      const detail = err instanceof Error ? err.message : err;
      console.error("Error:", detail);
      process.exit(1);
    }
  });

// ==================== SCREENSHOT ====================

// `screenshot`: capture the page, optionally to a file path.
program
  .command("screenshot [path]")
  .description("Take screenshot")
  .option("-f, --full-page", "Full page screenshot")
  .option("-t, --type <type>", "Image type: png, jpeg", "png")
  .option("-q, --quality <n>", "JPEG quality (0-100)")
  .option("--clip <json>", "Clip region as JSON")
  .option("--no-animations", "Disable animations")
  .option("--hide-caret", "Hide text caret")
  .action(async (filePath: string | undefined, cmdOpts) => {
    const globals = program.opts<GlobalOpts>();
    try {
      // Built inside the try so a malformed --clip value is reported like
      // any other command error.
      const quality = cmdOpts.quality ? parseInt(cmdOpts.quality) : undefined;
      const clip = cmdOpts.clip ? JSON.parse(cmdOpts.clip) : undefined;
      const shotOptions = {
        path: filePath,
        fullPage: cmdOpts.fullPage,
        type: cmdOpts.type,
        quality,
        clip,
        animations: cmdOpts.animations === false ? "disabled" : "allow",
        caret: cmdOpts.hideCaret ? "hide" : "initial",
      };
      const reply = await runCommand("screenshot", [shotOptions]);
      output(reply, globals.json ?? false);
    } catch (err) {
      const detail = err instanceof Error ? err.message : err;
      console.error("Error:", detail);
      process.exit(1);
    }
  });

// ==================== SNAPSHOT ====================

// `snapshot`: print the accessibility tree; with --compact (and without
// --json) only the tree text is printed.
program
  .command("snapshot")
  .description("Get accessibility tree snapshot")
  .option("-c, --compact", "Output tree only (no xpath map)")
  .action(async (cmdOpts) => {
    const globals = program.opts<GlobalOpts>();
    try {
      const snapshot = (await runCommand("snapshot", [cmdOpts.compact])) as {
        tree: string;
        xpathMap?: Record<string, string>;
        urlMap?: Record<string, string>;
      };
      const treeOnly = cmdOpts.compact && !globals.json;
      if (treeOnly) {
        console.log(snapshot.tree);
        return;
      }
      output(snapshot, globals.json ?? false);
    } catch (err) {
      const detail = err instanceof Error ? err.message : err;
      console.error("Error:", detail);
      process.exit(1);
    }
  });

// ==================== VIEWPORT ====================

// `viewport`: set width, height and device scale factor.
program
  .command("viewport <width> <height>")
  .description("Set viewport size")
  .option("-s, --scale <n>", "Device scale factor", "1")
  .action(async (w: string, h: string, cmdOpts) => {
    const globals = program.opts<GlobalOpts>();
    try {
      const width = parseInt(w);
      const height = parseInt(h);
      const scale = parseFloat(cmdOpts.scale);
      const reply = await runCommand("viewport", [width, height, scale]);
      output(reply, globals.json ?? false);
    } catch (err) {
      const detail = err instanceof Error ? err.message : err;
      console.error("Error:", detail);
      process.exit(1);
    }
  });

// ==================== EVAL ====================

// `eval`: evaluate a JavaScript expression in the page.
program
  .command("eval <expression>")
  .description("Evaluate JavaScript in page")
  .action(async (expr: string) => {
    const globals = program.opts<GlobalOpts>();
    try {
      const reply = await runCommand("eval", [expr]);
      output(reply, globals.json ?? false);
    } catch (err) {
      const detail = err instanceof Error ? err.message : err;
      console.error("Error:", detail);
      process.exit(1);
    }
  });

// ==================== WAIT ====================

// `wait`: wait for a load state, a selector, or a fixed timeout.
program
  .command("wait <type> [arg]")
  .description("Wait for: load, selector, timeout")
  .option("-t, --timeout <ms>", "Timeout", "30000")
  .option(
    "-s, --state <state>",
    "Element state: visible, hidden, attached, detached",
    "visible",
  )
  .action(async (type: string, arg: string | undefined, cmdOpts) => {
    const globals = program.opts<GlobalOpts>();
    try {
      const waitOptions = {
        timeout: parseInt(cmdOpts.timeout),
        state: cmdOpts.state,
      };
      const reply = await runCommand("wait", [type, arg, waitOptions]);
      output(reply, globals.json ?? false);
    } catch (err) {
      const detail = err instanceof Error ? err.message : err;
      console.error("Error:", detail);
      process.exit(1);
    }
  });

// ==================== ELEMENT STATE CHECKS ====================

// `is`: test an element state.
program
  .command("is <check> <selector>")
  .description("Check element state: visible, checked")
  .action(async (check: string, selector: string) => {
    const globals = program.opts<GlobalOpts>();
    try {
      const reply = await runCommand("is", [check, selector]);
      output(reply, globals.json ?? false);
    } catch (err) {
      const detail = err instanceof Error ? err.message : err;
      console.error("Error:", detail);
      process.exit(1);
    }
  });

// ==================== CURSOR ====================

// `cursor`: turn on the visual cursor overlay.
program
  .command("cursor")
  .description("Enable visual cursor overlay")
  .action(async () => {
    const globals = program.opts<GlobalOpts>();
    try {
      const reply = await runCommand("cursor", []);
      output(reply, globals.json ?? false);
    } catch (err) {
      const detail = err instanceof Error ? err.message : err;
      console.error("Error:", detail);
      process.exit(1);
    }
  });

// ==================== MULTI-PAGE ====================

// `pages`: list open pages.
program
  .command("pages")
  .description("List all open pages")
  .action(async () => {
    const globals = program.opts<GlobalOpts>();
    try {
      const reply = await runCommand("pages", []);
      output(reply, globals.json ?? false);
    } catch (err) {
      const detail = err instanceof Error ? err.message : err;
      console.error("Error:", detail);
      process.exit(1);
    }
  });

// `newpage`: open a new tab, optionally at a URL.
program
  .command("newpage [url]")
  .description("Create a new page/tab")
  .action(async (url?: string) => {
    const globals = program.opts<GlobalOpts>();
    try {
      const reply = await runCommand("newpage", [url]);
      output(reply, globals.json ?? false);
    } catch (err) {
      const detail = err instanceof Error ? err.message : err;
      console.error("Error:", detail);
      process.exit(1);
    }
  });

// `tab_switch` / `switch`: activate a tab by index.
program
  .command("tab_switch <index>")
  .alias("switch")
  .description("Switch to tab by index")
  .action(async (index: string) => {
    const globals = program.opts<GlobalOpts>();
    try {
      const tabIndex = parseInt(index);
      const reply = await runCommand("tab_switch", [tabIndex]);
      output(reply, globals.json ?? false);
    } catch (err) {
      const detail = err instanceof Error ? err.message : err;
      console.error("Error:", detail);
      process.exit(1);
    }
  });

// `tab_close` / `close`: close a tab by index; the index is omitted from the
// request when not supplied.
program
  .command("tab_close [index]")
  .alias("close")
  .description("Close tab by index (defaults to last tab)")
  .action(async (index?: string) => {
    const globals = program.opts<GlobalOpts>();
    try {
      const tabIndex = index ? parseInt(index) : undefined;
      const reply = await runCommand("tab_close", [tabIndex]);
      output(reply, globals.json ?? false);
    } catch (err) {
      const detail = err instanceof Error ? err.message : err;
      console.error("Error:", detail);
      process.exit(1);
    }
  });

// ==================== NETWORK CAPTURE ====================

// Parent command grouping the `network on|off|path|clear` subcommands.
const networkCmd = program
  .command("network")
  .description(
    "Network capture commands (writes to filesystem for agent inspection)",
  );

// `network on`: start capturing requests.
networkCmd
  .command("on")
  .description("Enable network capture (creates temp directory for requests)")
  .action(async () => {
    const globals = program.opts<GlobalOpts>();
    try {
      const reply = await runCommand("network_enable", []);
      output(reply, globals.json ?? false);
    } catch (err) {
      const detail = err instanceof Error ? err.message : err;
      console.error("Error:", detail);
      process.exit(1);
    }
  });

// `network off`: stop capturing requests.
networkCmd
  .command("off")
  .description("Disable network capture")
  .action(async () => {
    const globals = program.opts<GlobalOpts>();
    try {
      const reply = await runCommand("network_disable", []);
      output(reply, globals.json ?? false);
    } catch (err) {
      const detail = err instanceof Error ? err.message : err;
      console.error("Error:", detail);
      process.exit(1);
    }
  });

// `network path`: print the capture directory.
networkCmd
  .command("path")
  .description("Get network capture directory path")
  .action(async () => {
    const globals = program.opts<GlobalOpts>();
    try {
      const reply = await runCommand("network_path", []);
      output(reply, globals.json ?? false);
    } catch (err) {
      const detail = err instanceof Error ? err.message : err;
      console.error("Error:", detail);
      process.exit(1);
    }
  });

// `network clear`: delete captured requests.
networkCmd
  .command("clear")
  .description("Clear all captured requests")
  .action(async () => {
    const globals = program.opts<GlobalOpts>();
    try {
      const reply = await runCommand("network_clear", []);
      output(reply, globals.json ?? false);
    } catch (err) {
      const detail = err instanceof Error ? err.message : err;
      console.error("Error:", detail);
      process.exit(1);
    }
  });

// ==================== RUN ====================

// Every action handler above is async, so use parseAsync: it awaits the
// selected handler, letting a rejection from a handler without its own
// try/catch be reported here instead of surfacing as an unhandled rejection.
program.parseAsync().catch((err: unknown) => {
  console.error("Error:", err instanceof Error ? err.message : err);
  process.exit(1);
});


================================================
FILE: packages/cli/tests/cli.test.ts
================================================
/**
 * Browse CLI Tests
 *
 * Comprehensive test suite covering:
 * - Daemon lifecycle
 * - Navigation commands
 * - Actions (click, type, fill)
 * - Information retrieval (snapshot, screenshot, get)
 * - Multi-tab operations
 * - Network capture
 * - Error handling
 */

import { describe, it, expect, beforeAll, afterAll, afterEach } from "vitest";
import { exec } from "child_process";
import * as fs from "fs/promises";
import * as path from "path";
import * as os from "os";

// CLI executable path - use the built dist for testing (daemon spawns via process.argv[0])
const CLI_PATH = path.join(__dirname, "../dist/index.js");

// Test session name to avoid conflicts
const TEST_SESSION = `test-${Date.now()}`;

/**
 * Run the built CLI in a shell with `--headless --session <session>` and
 * collect its output. Never rejects: failures are reported through
 * `exitCode`.
 *
 * @param args Raw argument string appended to the command line.
 * @param options.timeout Kill the child after this many ms (default 30000).
 * @param options.session Session name (default `TEST_SESSION`).
 * @returns Trimmed stdout/stderr and the exit code. A child that did not
 *   exit with a numeric code (killed by the timeout or a signal, or failed
 *   to spawn) is reported as exit code 1 rather than 0.
 */
async function browse(
  args: string,
  options: { timeout?: number; session?: string } = {},
): Promise<{ stdout: string; stderr: string; exitCode: number }> {
  const session = options.session ?? TEST_SESSION;
  const timeout = options.timeout ?? 30000;

  return new Promise((resolve) => {
    const fullArgs = `node ${CLI_PATH} --headless --session ${session} ${args}`;
    exec(fullArgs, { timeout }, (error, stdout, stderr) => {
      // `error.code` is null when the child was killed (e.g. by the timeout)
      // and may be a string for spawn-level failures; neither is success.
      let exitCode = 0;
      if (error) {
        exitCode = typeof error.code === "number" ? error.code : 1;
      }
      resolve({
        stdout: stdout.trim(),
        stderr: stderr.trim(),
        exitCode,
      });
    });
  });
}

/**
 * Parse CLI output as JSON.
 *
 * @throws Error `"Failed to parse JSON: <output>"` when the text is not valid
 *   JSON, so the failing output appears in the test report.
 */
function parseJson<T = Record<string, unknown>>(output: string): T {
  let parsed: unknown;
  try {
    parsed = JSON.parse(output);
  } catch {
    throw new Error(`Failed to parse JSON: ${output}`);
  }
  return parsed as T;
}

/**
 * Best-effort removal of the temp-dir artifacts belonging to a session:
 * the `browse-<session>.*` files and the `browse-<session>-network` directory.
 * Anything that cannot be removed (typically because it does not exist) is ignored.
 *
 * @param session - Session name whose artifacts should be deleted.
 */
async function cleanupSession(session: string): Promise<void> {
  const tmpDir = os.tmpdir();
  const artifactNames = [
    "sock",
    "pid",
    "ws",
    "chrome.pid",
    "mode",
    "mode-override",
  ].map((extension) => `browse-${session}.${extension}`);

  // Remove the files one at a time, in the listed order.
  for (const artifact of artifactNames) {
    await fs.unlink(path.join(tmpDir, artifact)).catch(() => undefined);
  }

  // Clean network dir
  await fs
    .rm(path.join(tmpDir, `browse-${session}-network`), { recursive: true })
    .catch(() => undefined);
}

describe("Browse CLI", () => {
  // Start from a clean slate: drop artifacts left behind by an earlier run.
  beforeAll(() => cleanupSession(TEST_SESSION));

  // Once the whole suite is done, stop the daemon (if any) and remove the
  // session's artifacts again.
  afterAll(async () => {
    await browse("stop --force");
    await cleanupSession(TEST_SESSION);
  });

  describe("Daemon Lifecycle", () => {
    // Every case ends with the daemon stopped so the next one starts from scratch.
    afterEach(async () => {
      await browse("stop --force");
    });

    it("should start daemon on first command", async () => {
      // Nothing has been started yet, so status must report "not running".
      const initialStatus = parseJson((await browse("status")).stdout);
      expect(initialStatus.running).toBe(false);

      // Explicit start
      const { stdout: startOutput } = await browse("start");
      expect(startOutput).toContain("started");

      // Status must now flip to running.
      const statusAfterStart = parseJson((await browse("status")).stdout);
      expect(statusAfterStart.running).toBe(true);
    });

    it("should stop daemon gracefully", async () => {
      await browse("start");

      const { stdout: stopOutput } = await browse("stop");
      expect(parseJson(stopOutput).status).toBe("stopped");

      // A follow-up status call confirms the daemon is really gone.
      const { stdout: statusOutput } = await browse("status");
      expect(parseJson(statusOutput).running).toBe(false);
    });

    it("should force stop unresponsive daemon", async () => {
      await browse("start");

      const { stdout } = await browse("stop --force");
      const acceptedStatuses = ["stopped", "force stopped", "not running"];
      expect(acceptedStatuses).toContain(parseJson(stdout).status);
    });

    it("should support multiple sessions", async () => {
      const sessions = [`${TEST_SESSION}-1`, `${TEST_SESSION}-2`];

      try {
        // Bring up both daemons first, then query them.
        for (const session of sessions) {
          await browse("start", { session });
        }

        const statuses: Record<string, unknown>[] = [];
        for (const session of sessions) {
          const { stdout } = await browse("status", { session });
          statuses.push(parseJson(stdout));
        }

        for (const status of statuses) {
          expect(status.running).toBe(true);
        }
      } finally {
        // Stop both daemons before removing either session's artifacts.
        for (const session of sessions) {
          await browse("stop --force", { session });
        }
        for (const session of sessions) {
          await cleanupSession(session);
        }
      }
    });
  });

  describe("Navigation", () => {
    // Page every navigation case loads.
    const targetUrl = "https://example.com";

    beforeAll(async () => {
      await browse("start");
    });

    afterAll(async () => {
      await browse("stop --force");
    });

    it("should navigate to URL", async () => {
      const { stdout } = await browse(`open ${targetUrl}`);
      expect(parseJson(stdout).url).toContain("example.com");
    });

    it("should get current URL", async () => {
      await browse(`open ${targetUrl}`);
      const { stdout } = await browse("get url");
      expect(parseJson(stdout).url).toContain("example.com");
    });

    it("should get page title", async () => {
      await browse(`open ${targetUrl}`);
      const { stdout } = await browse("get title");
      expect(parseJson(stdout).title).toBeTruthy();
    });

    it("should reload page", async () => {
      await browse(`open ${targetUrl}`);
      const { stdout } = await browse("reload");
      expect(parseJson(stdout).url).toContain("example.com");
    });
  });

  describe("Snapshot", () => {
    // All cases inspect the same page, which is loaded once for the group.
    beforeAll(async () => {
      await browse("start");
      await browse("open https://example.com");
    });

    afterAll(async () => {
      await browse("stop --force");
    });

    it("should take snapshot with refs", async () => {
      const { stdout } = await browse("snapshot");
      const { tree, xpathMap } = parseJson(stdout);

      expect(tree).toBeTruthy();
      expect(xpathMap).toBeTruthy();
      expect(typeof xpathMap).toBe("object");
    });

    it("should take compact snapshot", async () => {
      // Compact mode prints the tree itself rather than a JSON document
      // (when --json is not given), so match on the raw text.
      const { stdout } = await browse("snapshot -c");
      expect(stdout).toContain("RootWebArea");
    });

    it("should populate refs for subsequent commands", async () => {
      await browse("snapshot");
      const { stdout } = await browse("refs");
      const refs = parseJson(stdout);

      expect(refs.count).toBeGreaterThan(0);
      expect(refs.xpathMap).toBeTruthy();
    });
  });

  describe("Screenshot", () => {
    // Destination used by the save-to-file case; removed again in afterAll.
    const outputFile = path.join(os.tmpdir(), `browse-test-${Date.now()}.png`);

    beforeAll(async () => {
      await browse("start");
      await browse("open https://example.com");
    });

    afterAll(async () => {
      await browse("stop --force");
      // The file only exists if the save case ran; ignore a failed removal.
      await fs.unlink(outputFile).catch(() => undefined);
    });

    it("should take screenshot and return base64", async () => {
      const { stdout } = await browse("screenshot");
      const { base64 } = parseJson<{ base64: string }>(stdout);

      expect(base64).toBeTruthy();
      expect(base64.length).toBeGreaterThan(100);
    });

    it("should save screenshot to file", async () => {
      const { stdout } = await browse(`screenshot ${outputFile}`);
      expect(parseJson(stdout).saved).toBe(outputFile);

      // The reported path must point at a non-empty file on disk.
      const { size } = await fs.stat(outputFile);
      expect(size).toBeGreaterThan(0);
    });
  });

  // Input actions (click, type, press, hover, scroll, drag) driven through the CLI.
  // One daemon is shared by the whole group; each case opens its own page first.
  describe("Actions", () => {
    beforeAll(async () => {
      await browse("start");
    });

    afterAll(async () => {
      await browse("stop --force");
    });

    it("should click by coordinates", async () => {
      await browse("open https://example.com");
      const result = await browse("click_xy 100 100");
      const data = parseJson(result.stdout);
      expect(data.clicked).toBe(true);
    });

    it("should click by ref after snapshot", async () => {
      await browse("open https://example.com");
      await browse("snapshot");

      // Find a clickable ref
      const refsResult = await browse("refs");
      const refs = parseJson<{
        count: number;
        xpathMap: Record<string, string>;
      }>(refsResult.stdout);

      // Fail loudly when the snapshot produced no refs. Guarding the click
      // with `if (refs.count > 0)` would let the test pass without ever
      // exercising click-by-ref.
      expect(refs.count).toBeGreaterThan(0);

      const firstRef = Object.keys(refs.xpathMap)[0];
      const result = await browse(`click @${firstRef}`);
      const data = parseJson(result.stdout);
      expect(data.clicked).toBe(true);
    });

    it("should type text", async () => {
      await browse("open https://example.com");
      const result = await browse('type "Hello World"');
      const data = parseJson(result.stdout);
      expect(data.typed).toBe(true);
    });

    it("should press keys", async () => {
      await browse("open https://example.com");
      const result = await browse("press Tab");
      const data = parseJson(result.stdout);
      expect(data.pressed).toBe("Tab");
    });

    it("should hover at coordinates", async () => {
      await browse("open https://example.com");
      const result = await browse("hover 200 200");
      const data = parseJson(result.stdout);
      expect(data.hovered).toBe(true);
    });

    it("should scroll", async () => {
      await browse("open https://example.com");
      const result = await browse("scroll 400 400 0 100");
      const data = parseJson(result.stdout);
      expect(data.scrolled).toBe(true);
    });

    it("should drag and drop between coordinates", async () => {
      // Self-contained page: a draggable #source box, a #target drop zone and a
      // #status label whose text changes to "Dropped" when a drop lands on the target.
      const html = `<!doctype html><html><body style="margin:0"><div id="source" draggable="true" style="position:absolute;left:40px;top:40px;width:80px;height:80px;background:#e66;cursor:move"></div><div id="target" style="position:absolute;left:250px;top:40px;width:120px;height:120px;background:#ddd"></div><div id="status" style="position:absolute;left:40px;top:180px">Not dropped</div><script>const source=document.getElementById('source');const target=document.getElementById('target');const status=document.getElementById('status');source.addEventListener('dragstart',e=>{e.dataTransfer.setData('text/plain','dragged')});target.addEventListener('dragover',e=>{e.preventDefault()});target.addEventListener('drop',e=>{e.preventDefault();status.textContent='Dropped'})</script></body></html>`;
      const dataUrl = `data:text/html,${encodeURIComponent(html)}`;

      await browse(`open "${dataUrl}"`);
      // (80,80) lies inside #source and (310,100) inside #target.
      const dragResult = await browse("drag 80 80 310 100 --steps 8 --xpath");
      const dragData = parseJson(dragResult.stdout);
      expect(dragData.dragged).toBe(true);
      expect(typeof dragData.fromXpath).toBe("string");
      expect(typeof dragData.toXpath).toBe("string");

      // The page itself confirms that the drop handler fired.
      const statusResult = await browse(
        'eval "document.getElementById(\\"status\\").textContent"',
      );
      const statusData = parseJson(statusResult.stdout);
      expect(statusData.result).toBe("Dropped");
    });
  });

  describe("Multi-Tab", () => {
    // Asks the CLI for the page list and returns how many pages it reports.
    const countPages = async (): Promise<number> => {
      const { stdout } = await browse("pages");
      return parseJson<{ pages: unknown[] }>(stdout).pages.length;
    };

    beforeAll(async () => {
      await browse("start");
    });

    afterAll(async () => {
      await browse("stop --force");
    });

    it("should list pages", async () => {
      await browse("open https://example.com");
      const { stdout } = await browse("pages");
      const { pages } = parseJson<{ pages: { index: number; url: string }[] }>(
        stdout,
      );

      expect(pages).toBeInstanceOf(Array);
      expect(pages.length).toBeGreaterThan(0);
      expect(pages[0]).toHaveProperty("index");
      expect(pages[0]).toHaveProperty("url");
    });

    it("should create new page", async () => {
      const pagesBefore = await countPages();

      const { stdout } = await browse("newpage https://github.com");
      expect(parseJson(stdout).created).toBe(true);

      // Exactly one page must have been added.
      const pagesAfter = await countPages();
      expect(pagesAfter).toBe(pagesBefore + 1);
    });

    it("should switch tabs", async () => {
      await browse("open https://example.com");
      await browse("newpage https://github.com");

      const { stdout } = await browse("tab_switch 0");
      const switchReport = parseJson(stdout);
      expect(switchReport.switched).toBe(true);
      expect(switchReport.index).toBe(0);
    });

    it("should close tab", async () => {
      await browse("open https://example.com");
      await browse("newpage https://github.com");

      const pagesBefore = await countPages();

      const { stdout } = await browse("tab_close");
      expect(parseJson(stdout).closed).toBe(true);

      // Exactly one page must have disappeared.
      const pagesAfter = await countPages();
      expect(pagesAfter).toBe(pagesBefore - 1);
    });
  });

  describe("Waiting", () => {
    beforeAll(async () => {
      await browse("start");
    });

    afterAll(async () => {
      await browse("stop --force");
    });

    it("should wait for timeout", async () => {
      await browse("open https://example.com");

      // Time the whole CLI round trip around a 500 ms wait.
      const startedAt = Date.now();
      const { stdout } = await browse("wait timeout 500");
      const elapsedMs = Date.now() - startedAt;

      expect(parseJson(stdout).waited).toBe(true);
      // The lower bound sits slightly under the requested 500 ms.
      expect(elapsedMs).toBeGreaterThanOrEqual(450);
    });

    it("should wait for load state", async () => {
      await browse("open https://example.com");
      const { stdout } = await browse("wait load");
      expect(parseJson(stdout).waited).toBe(true);
    });
  });

  // Network capture commands: on / off / path / clear, plus a smoke check of
  // the on-disk capture directory. One daemon is shared by the whole group.
  describe("Network Capture", () => {
    beforeAll(async () => {
      await browse("start");
    });

    afterAll(async () => {
      await browse("stop --force");
    });

    it("should enable network capture", async () => {
      const result = await browse("network on");
      const data = parseJson(result.stdout);
      expect(data.enabled).toBe(true);
      expect(data.path).toBeTruthy();
    });

    it("should return network path", async () => {
      await browse("network on");
      const result = await browse("network path");
      const data = parseJson(result.stdout);
      expect(data.path).toBeTruthy();
      expect(data.enabled).toBe(true);
    });

    it("should capture requests to filesystem", async () => {
      await browse("network on");
      const pathResult = await browse("network path");
      const networkDir = parseJson<{ path: string }>(pathResult.stdout).path;

      // Navigate to trigger requests
      await browse("open https://example.com");

      // Wait for requests to be written
      await browse("wait timeout 1000");

      // Check if directory has content. Only a missing directory is tolerated
      // (no requests captured); any other filesystem error, and any assertion
      // failure, must surface instead of being swallowed by a blanket catch.
      let entries: string[] | undefined;
      try {
        entries = await fs.readdir(networkDir);
      } catch (err) {
        const code = (err as { code?: unknown } | null)?.code;
        if (code !== "ENOENT") {
          throw err;
        }
      }

      if (entries !== undefined) {
        // May or may not have captured requests depending on timing
        expect(Array.isArray(entries)).toBe(true);
      }
    });

    it("should disable network capture", async () => {
      await browse("network on");
      const result = await browse("network off");
      const data = parseJson(result.stdout);
      expect(data.enabled).toBe(false);
    });

    it("should clear network captures", async () => {
      await browse("network on");
      await browse("open https://example.com");
      await browse("wait timeout 500");

      const result = await browse("network clear");
      const data = parseJson(result.stdout);
      expect(data.cleared).toBe(true);
    });
  });

  describe("Viewport", () => {
    beforeAll(async () => {
      await browse("start");
      await browse("open https://example.com");
    });

    afterAll(async () => {
      await browse("stop --force");
    });

    it("should set viewport size", async () => {
      const { stdout } = await browse("viewport 1920 1080");
      const { viewport } = parseJson<{
        viewport: { width: number; height: number };
      }>(stdout);

      // The reply must echo the requested dimensions.
      expect(viewport.width).toBe(1920);
      expect(viewport.height).toBe(1080);
    });
  });

  describe("Eval", () => {
    beforeAll(async () => {
      await browse("start");
      await browse("open https://example.com");
    });

    afterAll(async () => {
      await browse("stop --force");
    });

    it("should evaluate JavaScript", async () => {
      // Any truthy title is enough; the exact text is not checked.
      const { stdout } = await browse('eval "document.title"');
      expect(parseJson(stdout).result).toBeTruthy();
    });

    it("should return computed values", async () => {
      // The result must come back as the number 2.
      const { stdout } = await browse('eval "1 + 1"');
      expect(parseJson(stdout).result).toBe(2);
    });
  });

  describe("Error Handling", () => {
    beforeAll(async () => {
      await browse("start");
    });

    afterAll(async () => {
      await browse("stop --force");
    });

    it("should error on invalid ref", async () => {
      await browse("open https://example.com");
      // No snapshot has been taken, so no refs are known and the lookup must fail.
      const { stderr } = await browse("click @99-99");
      expect(stderr).toContain("Error");
    });

    it("should error on unknown command", async () => {
      const { exitCode } = await browse("nonexistent");
      expect(exitCode).not.toBe(0);
    });
  });
});


================================================
FILE: packages/cli/tests/mode.test.ts
================================================
import { describe, it, expect, afterEach } from "vitest";
import { exec } from "child_process";
import { promises as fs } from "fs";
import * as path from "path";
import * as os from "os";

// Path to the CLI entry point under dist/, resolved relative to this tests directory.
const CLI_PATH = path.join(__dirname, "../dist/index.js");
// Session name used by every command in this file; the millisecond timestamp
// keeps it distinct between runs.
const TEST_SESSION = `env-test-${Date.now()}`;

/**
 * Runs the browse CLI through a shell and collects its output.
 *
 * Every invocation is prefixed with `--headless --session <TEST_SESSION>`. The
 * returned promise never rejects; failures are reported through `exitCode`.
 *
 * @param args - Raw argument string appended to the CLI invocation.
 * @param options - `timeout` in milliseconds (default 30000) and optional
 *   `env` entries layered on top of the current process environment.
 * @returns Trimmed stdout and stderr plus the exit code. The code is 0 only
 *   when the command succeeded. A failure without a numeric exit code (for
 *   example a child killed after the timeout) is reported as 1.
 */
async function browse(
  args: string,
  options: { timeout?: number; env?: NodeJS.ProcessEnv } = {},
): Promise<{ stdout: string; stderr: string; exitCode: number }> {
  const timeout = options.timeout ?? 30000;
  const env = { ...process.env, ...options.env };

  return new Promise((resolve) => {
    const fullArgs = `node ${CLI_PATH} --headless --session ${TEST_SESSION} ${args}`;
    exec(fullArgs, { timeout, env }, (error, stdout, stderr) => {
      // When the child is terminated by a signal (e.g. the timeout fired),
      // exec passes an error whose `code` is not a number. Falling back to 0
      // in that case would make a hung command look like a success.
      let exitCode = 0;
      if (error) {
        exitCode = typeof error.code === "number" ? error.code : 1;
      }

      resolve({
        stdout: stdout.trim(),
        stderr: stderr.trim(),
        exitCode,
      });
    });
  });
}

/**
 * Parses CLI output as JSON.
 *
 * @param output - Text expected to contain a single JSON document.
 * @returns The parsed value, typed as `T` without runtime validation.
 * @throws Error whose message embeds the offending text when parsing fails.
 */
function parseJson<T = Record<string, unknown>>(output: string): T {
  let parsed: unknown;
  try {
    parsed = JSON.parse(output);
  } catch {
    throw new Error(`Failed to parse JSON: ${output}`);
  }
  return parsed as T;
}

/**
 * Best-effort removal of the temp-dir artifacts belonging to a session:
 * the `browse-<session>.*` files and the `browse-<session>-network` directory.
 * Anything that cannot be removed (typically because it does not exist) is ignored.
 *
 * @param session - Session name whose artifacts should be deleted.
 */
async function cleanupSession(session: string): Promise<void> {
  const tmpDir = os.tmpdir();
  const artifactNames = [
    "sock",
    "pid",
    "ws",
    "chrome.pid",
    "mode",
    "mode-override",
  ].map((extension) => `browse-${session}.${extension}`);

  // Remove the files one at a time, in the listed order; ignore missing files.
  for (const artifact of artifactNames) {
    await fs.unlink(path.join(tmpDir, artifact)).catch(() => undefined);
  }

  // Then drop the capture directory; ignore a missing directory.
  await fs
    .rm(path.join(tmpDir, `browse-${session}-network`), { recursive: true })
    .catch(() => undefined);
}

describe("Browse CLI env command", () => {
  // After every case, stop the daemon and wipe the session's artifacts.
  afterEach(async () => {
    await browse("stop --force");
    await cleanupSession(TEST_SESSION);
  });

  it("shows desired env even when daemon is not running", async () => {
    const { exitCode, stdout } = await browse("env");
    expect(exitCode).toBe(0);

    const report = parseJson(stdout);
    expect(report.mode).toBe("not running");
    expect(["local", "remote"]).toContain(report.desired);
  });

  it("rejects unsupported env target", async () => {
    const { exitCode, stderr } = await browse("env invalid-target");
    expect(exitCode).not.toBe(0);
    expect(stderr).toContain("Usage: browse env [local|remote]");
  });

  it("rejects remote env without Browserbase credentials", async () => {
    // browse() already layers `env` on top of process.env, so passing just
    // the blanked-out key yields the same child environment.
    const { exitCode, stderr } = await browse("env remote", {
      env: { BROWSERBASE_API_KEY: "" },
    });
    expect(exitCode).not.toBe(0);
    expect(stderr).toContain("Remote mode requires BROWSERBASE_API_KEY");
  });
});


================================================
FILE: packages/cli/tsconfig.json
================================================
{
  "extends": "../../tsconfig.base.json",
  "compilerOptions": {
    "moduleResolution": "bundler",
    "strict": true,
    "outDir": "./dist",
    "rootDir": ".",
    "types": ["node"]
  },
  "include": ["src/**/*", "tests/**/*"],
  "exclude": ["node_modules", "dist"]
}


================================================
FILE: packages/cli/tsup.config.ts
================================================
import { defineConfig } from "tsup";

// Packages listed under `external` rather than bundled.
const externalPackages = [
  // Browser automation - user must install playwright to use the CLI
  "playwright",
  "playwright-core",
  // CJS packages with dynamic requires that break in ESM bundles
  "pino",
  "pino-pretty",
  "ws",
  "dotenv",
];

// tsup build: a single CommonJS bundle of src/index.ts targeting Node 20,
// emitted with a shebang banner.
export default defineConfig({
  entry: ["src/index.ts"],
  format: ["cjs"],
  target: "node20",
  clean: true,
  shims: true,
  banner: { js: "#!/usr/bin/env node" },
  // Bundle everything possible, only externalize what truly can't be bundled
  noExternal: [/@browserbasehq\/stagehand/],
  external: externalPackages,
});


================================================
FILE: packages/cli/vitest.config.ts
================================================
import { defineConfig } from "vitest/config";

// Shared time budget (in milliseconds) for both individual tests and hooks.
const TIMEOUT_MS = 60 * 1000;

// Vitest configuration for the CLI test suite.
export default defineConfig({
  test: {
    globals: true,
    include: ["tests/**/*.test.ts"],
    testTimeout: TIMEOUT_MS,
    hookTimeout: TIMEOUT_MS,
    // Run tests sequentially since they share browser state
    pool: "forks",
    poolOptions: { forks: { singleFork: true } },
  },
});


================================================
FILE: packages/core/CHANGELOG.md
================================================
# @browserbasehq/stagehand

## 3.2.0

### Minor Changes

- [#1779](https://github.com/browserbase/stagehand/pull/1779) [`2f43ffa`](https://github.com/browserbase/stagehand/commit/2f43ffac11778152d17e4c44405770cc32c3ec8c) Thanks [@shrey150](https://github.com/shrey150)! - feat: add `cdpHeaders` option to `localBrowserLaunchOptions` for passing custom HTTP headers when connecting to an existing browser via CDP URL

- [#1834](https://github.com/browserbase/stagehand/pull/1834) [`63ee247`](https://github.com/browserbase/stagehand/commit/63ee247ac6bf2992046d4f6b2759f46b15643e36) Thanks [@tkattkat](https://github.com/tkattkat)! - Update stagehand agents search tool

- [#1774](https://github.com/browserbase/stagehand/pull/1774) [`521a10e`](https://github.com/browserbase/stagehand/commit/521a10e3698fc5631e219947bc90dad0f8bddaa8) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - add new page.setExtraHTTPHeaders() method

### Patch Changes

- [#1759](https://github.com/browserbase/stagehand/pull/1759) [`505e8c6`](https://github.com/browserbase/stagehand/commit/505e8c6736f3706328dbc8df670c49a018058388) Thanks [@shrey150](https://github.com/shrey150)! - Add bedrock to the provider enum in model configuration schemas and regenerate OpenAPI spec.

- [#1814](https://github.com/browserbase/stagehand/pull/1814) [`7dc35f5`](https://github.com/browserbase/stagehand/commit/7dc35f5e25689e6518d68b25ef71536d2781c8aa) Thanks [@tkattkat](https://github.com/tkattkat)! - Change usage of openai provider in agent to default to store:false

- [#1846](https://github.com/browserbase/stagehand/pull/1846) [`335cf47`](https://github.com/browserbase/stagehand/commit/335cf4730e73bce33e92331d04bda4b0fd42685d) Thanks [@aq17](https://github.com/aq17)! - Fix streaming finished event being silently dropped. The final SSE event containing the result payload (success status, message, actions, usage, and messages) was previously discarded instead of being yielded to the caller.

- [#1764](https://github.com/browserbase/stagehand/pull/1764) [`6ba0a1d`](https://github.com/browserbase/stagehand/commit/6ba0a1db7fc2d5d5a2f8927b1417d8f1d15eda10) Thanks [@shrey150](https://github.com/shrey150)! - Expose `headers` in `GoogleVertexProviderSettings` so model configs can pass custom provider headers (for example `X-Goog-Priority`) without TypeScript errors.

- [#1847](https://github.com/browserbase/stagehand/pull/1847) [`4ff3bb8`](https://github.com/browserbase/stagehand/commit/4ff3bb831a6ef6e2d57148e7afb68ea8d23e395d) Thanks [@miguelg719](https://github.com/miguelg719)! - Enable FlowLogger on BROWSERBASE_FLOW_LOGS=1

- [#1752](https://github.com/browserbase/stagehand/pull/1752) [`c27054b`](https://github.com/browserbase/stagehand/commit/c27054bbd0508431ade91d655f89efc87bbf5867) Thanks [@derekmeegan](https://github.com/derekmeegan)! - fix: pause Browserbase agents while captcha solving is active and improve CUA recovery after the solve completes

- [#1800](https://github.com/browserbase/stagehand/pull/1800) [`2abf5b9`](https://github.com/browserbase/stagehand/commit/2abf5b90f1e2bb1442509ef3a686b6128c9cdcf6) Thanks [@shrey150](https://github.com/shrey150)! - Make projectId optional for Browserbase sessions — only BROWSERBASE_API_KEY is required

- [#1766](https://github.com/browserbase/stagehand/pull/1766) [`7817fcc`](https://github.com/browserbase/stagehand/commit/7817fcc315eee4455ce04567cf56c9ec801caf0b) Thanks [@tkattkat](https://github.com/tkattkat)! - Add configurable timeout to tools in agent

- [#1749](https://github.com/browserbase/stagehand/pull/1749) [`7390508`](https://github.com/browserbase/stagehand/commit/73905088c5ed5923d276da9cce2efd0a0a3a46eb) Thanks [@pirate](https://github.com/pirate)! - When connecting to a browser session that has zero open tabs, Stagehand now automatically creates an initial `about:blank` tab so the connection can continue.

- [#1761](https://github.com/browserbase/stagehand/pull/1761) [`611f43a`](https://github.com/browserbase/stagehand/commit/611f43ac8d4c580216d55d2b217c14a9a9c11013) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - fix issue where handlePossibleNavigation was producing unnecessary error logs on clicks that trigger page close

- [#1817](https://github.com/browserbase/stagehand/pull/1817) [`2402a3c`](https://github.com/browserbase/stagehand/commit/2402a3c4d50270391b3e6440f4385cdcf5e1eb64) Thanks [@tkattkat](https://github.com/tkattkat)! - Add support for passing custom headers in clientOptions

## 3.1.0

### Minor Changes

- [#1681](https://github.com/browserbase/stagehand/pull/1681) [`e3db9aa`](https://github.com/browserbase/stagehand/commit/e3db9aa863f44270792215801fe6e3a02a1321aa) Thanks [@tkattkat](https://github.com/tkattkat)! - Add cookie management APIs: `context.addCookies()`, `context.clearCookies()`, & `context.cookies()`

- [#1672](https://github.com/browserbase/stagehand/pull/1672) [`b65756e`](https://github.com/browserbase/stagehand/commit/b65756e9e85643055446aa4a51956f7d6627c89f) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - add boolean keepAlive parameter to allow for configuring whether the browser should be closed when stagehand.close() is called.

- [#1708](https://github.com/browserbase/stagehand/pull/1708) [`176d420`](https://github.com/browserbase/stagehand/commit/176d42002cc0a2c7d13b4c0ffbbd56b70fdc49e8) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - add context.setExtraHTTPHeaders()

- [#1611](https://github.com/browserbase/stagehand/pull/1611) [`8a3c066`](https://github.com/browserbase/stagehand/commit/8a3c06600a9ba98485db7e9ed5c3cc43ea180334) Thanks [@monadoid](https://github.com/monadoid)! - Using `mode` enum instead of old `cua` boolean in openapi spec

### Patch Changes

- [#1683](https://github.com/browserbase/stagehand/pull/1683) [`7584f3e`](https://github.com/browserbase/stagehand/commit/7584f3e92e60a557d2b3e0e0d2a2af04c3527523) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - fix: include shadow DOM in .count() & .nth() & support xpath predicates

- [#1644](https://github.com/browserbase/stagehand/pull/1644) [`1e1c9c1`](https://github.com/browserbase/stagehand/commit/1e1c9c15773e49d5c3cd36021dbc1d23495c1bce) Thanks [@monadoid](https://github.com/monadoid)! - Fix unhandled CDP detaches by returning the original sendCDP promise

- [#1729](https://github.com/browserbase/stagehand/pull/1729) [`6bef890`](https://github.com/browserbase/stagehand/commit/6bef89090ebd231e77d8092b2c32a0f06303d5a9) Thanks [@shrey150](https://github.com/shrey150)! - fix: support Claude 4.6 (Opus and Sonnet) in CUA mode by using the correct `computer_20251124` tool version and `computer-use-2025-11-24` beta header

- [#1647](https://github.com/browserbase/stagehand/pull/1647) [`ffd4b33`](https://github.com/browserbase/stagehand/commit/ffd4b335a873d0f4dcd76ea22d44f47919bf8e49) Thanks [@tkattkat](https://github.com/tkattkat)! - Fix [Agent] - Address bug causing issues with continuing a conversation from past messages in dom mode

- [#1614](https://github.com/browserbase/stagehand/pull/1614) [`677bff5`](https://github.com/browserbase/stagehand/commit/677bff5834c879a2d95f7dbff918b8e1510516b3) Thanks [@miguelg719](https://github.com/miguelg719)! - Enforce `<number>-<number>` regex validation on act/observe for elementId

- [#1580](https://github.com/browserbase/stagehand/pull/1580) [`65ff464`](https://github.com/browserbase/stagehand/commit/65ff464bc13388eb109eba0a2cf533c1cc202854) Thanks [@tkattkat](https://github.com/tkattkat)! - Add unified variables support across act and agent with a single VariableValue type

- [#1666](https://github.com/browserbase/stagehand/pull/1666) [`101bcf2`](https://github.com/browserbase/stagehand/commit/101bcf2da8b527fd6ace6aa291ada5d0f2d90344) Thanks [@Kylejeong2](https://github.com/Kylejeong2)! - add support for codex models

- [#1728](https://github.com/browserbase/stagehand/pull/1728) [`0a94301`](https://github.com/browserbase/stagehand/commit/0a94301caa991d1aa4cdade6e28a065b1aefb3e2) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - handle potential race condition on `.close()` when using the Stagehand API

- [#1664](https://github.com/browserbase/stagehand/pull/1664) [`b27c04d`](https://github.com/browserbase/stagehand/commit/b27c04d278c290364347acd0c354a878ea9b7c2d) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - fixes issue with context.addInitScript() where scripts were not being applied to out of process iframes (OOPIFs), and popup pages with same process iframes (SPIFs)

- [#1632](https://github.com/browserbase/stagehand/pull/1632) [`afbd08b`](https://github.com/browserbase/stagehand/commit/afbd08bb6367a9c9f65f67e453667987e4659918) Thanks [@pirate](https://github.com/pirate)! - Remove automatic `.env` loading via `dotenv`.

  If your app relies on `.env` files, install `dotenv` and load it explicitly in your code:

  ```ts
  import dotenv from "dotenv";
  dotenv.config({ path: ".env" });
  ```

- [#1624](https://github.com/browserbase/stagehand/pull/1624) [`0e8d569`](https://github.com/browserbase/stagehand/commit/0e8d5695f662040f7384e64f46301152802e3c62) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - fix issue where screenshot masks were not being applied to dialog elements

- [#1596](https://github.com/browserbase/stagehand/pull/1596) [`ff0f979`](https://github.com/browserbase/stagehand/commit/ff0f9795f3b2c1cf4f2610a80ebcb3341a24f987) Thanks [@tkattkat](https://github.com/tkattkat)! - Update usage/metrics handling in agent

- [#1631](https://github.com/browserbase/stagehand/pull/1631) [`2d89d2b`](https://github.com/browserbase/stagehand/commit/2d89d2b35ce812431956b28e0c8b52d32ddc7a27) Thanks [@miguelg719](https://github.com/miguelg719)! - Add right and middle click support to act and observe

- [#1697](https://github.com/browserbase/stagehand/pull/1697) [`aac9a19`](https://github.com/browserbase/stagehand/commit/aac9a19bdfbe62e4508631337ab0bfbcf8ae62b2) Thanks [@shrey150](https://github.com/shrey150)! - fix: support `<frame>` elements in XPath frame boundary detection so `act()` works on legacy `<frameset>` pages

- [#1692](https://github.com/browserbase/stagehand/pull/1692) [`06de50f`](https://github.com/browserbase/stagehand/commit/06de50ff377fd31f1b0fcf79adb996d04562d2c0) Thanks [@shrey150](https://github.com/shrey150)! - fix: skip piercer injection for chrome-extension:// and other non-HTML targets

- [#1613](https://github.com/browserbase/stagehand/pull/1613) [`aa4d981`](https://github.com/browserbase/stagehand/commit/aa4d981e440bdd0e3d3f42ccc310d5958aa25cc6) Thanks [@miguelg719](https://github.com/miguelg719)! - SupportedUnderstudyAction Enum validation for 'method' on act/observe inference

- [#1652](https://github.com/browserbase/stagehand/pull/1652) [`18b1e3b`](https://github.com/browserbase/stagehand/commit/18b1e3bd2b16b721845d52fcf1a45c6158e2403f) Thanks [@miguelg719](https://github.com/miguelg719)! - Add support for gemini 3 flash and pro in hybrid/cua agent

- [#1706](https://github.com/browserbase/stagehand/pull/1706) [`957d82b`](https://github.com/browserbase/stagehand/commit/957d82b9845b4413b123539e81a2e4a490e74a8a) Thanks [@chrisreadsf](https://github.com/chrisreadsf)! - Add GLM to prompt-based JSON fallback for models without native structured output support

- [#1633](https://github.com/browserbase/stagehand/pull/1633) [`22e371a`](https://github.com/browserbase/stagehand/commit/22e371ae4c25deb6350328fe02832bf2b2197b94) Thanks [@tkattkat](https://github.com/tkattkat)! - Add warning when incorrect models are used with agents hybrid mode

- [#1673](https://github.com/browserbase/stagehand/pull/1673) [`d29b91f`](https://github.com/browserbase/stagehand/commit/d29b91fa506636ca36f724fcf106320de54ec3f3) Thanks [@miguelg719](https://github.com/miguelg719)! - Add multi-region support for Stagehand API with region-specific endpoints

- [#1695](https://github.com/browserbase/stagehand/pull/1695) [`7b4f817`](https://github.com/browserbase/stagehand/commit/7b4f817cafb9829ac81c4b5890c318c7f9521fe4) Thanks [@tkattkat](https://github.com/tkattkat)! - Fix: zod bug when pinning zod to v3 and using structured output in agent

- [#1609](https://github.com/browserbase/stagehand/pull/1609) [`3f9ca4d`](https://github.com/browserbase/stagehand/commit/3f9ca4d9acc109101357378d29cf969168991608) Thanks [@miguelg719](https://github.com/miguelg719)! - Add SupportedUnderstudyActions to observe system prompt

- [#1581](https://github.com/browserbase/stagehand/pull/1581) [`49ead1e`](https://github.com/browserbase/stagehand/commit/49ead1e1e8678a8da0f87ad2042491dacc6b01d7) Thanks [@sameelarif](https://github.com/sameelarif)! - **Server-side caching is now available.**

  When running `env: "BROWSERBASE"`, Stagehand automatically caches `act()`, `extract()`, and `observe()` results server-side — repeated calls with the same inputs return instantly without consuming LLM tokens.

  Caching is enabled by default and can be disabled via `serverCache: false` on the Stagehand instance or per individual call. Check out the [browserbase blog](https://www.browserbase.com/blog/stagehand-caching) for more details.

- [#1642](https://github.com/browserbase/stagehand/pull/1642) [`3673369`](https://github.com/browserbase/stagehand/commit/36733691f90c15386cf2a7b47d04ef429b7195ae) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - fix issue where scripts added via context.addInitScript() were not being injected into new pages that were opened via popups (e.g., clicking a link that opens a new page) and/or by calling context.newPage(url)

- [#1735](https://github.com/browserbase/stagehand/pull/1735) [`c465e87`](https://github.com/browserbase/stagehand/commit/c465e87ab41942435132c76338518fb3fa8e7896) Thanks [@monadoid](https://github.com/monadoid)! - Supports request header authentication with connectToMCPServer

- [#1705](https://github.com/browserbase/stagehand/pull/1705) [`ae533e4`](https://github.com/browserbase/stagehand/commit/ae533e40195181b53833f8055b1259fb360a927b) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - include error cause in UnderstudyCommandException

- [#1636](https://github.com/browserbase/stagehand/pull/1636) [`ea33052`](https://github.com/browserbase/stagehand/commit/ea330520a325583b71b87d85beb740df4bdb9b2d) Thanks [@miguelg719](https://github.com/miguelg719)! - Include executionModel on the AgentConfigSchema

- [#1679](https://github.com/browserbase/stagehand/pull/1679) [`5764ede`](https://github.com/browserbase/stagehand/commit/5764edee7aab00ef1aafafb68fc56eb26c0a70b2) Thanks [@shrey150](https://github.com/shrey150)! - fix issue where locator.count() was not working with xpaths that have attribute predicates

- [#1646](https://github.com/browserbase/stagehand/pull/1646) [`f09b184`](https://github.com/browserbase/stagehand/commit/f09b184cc5e774736280ae8c94ba3f4f13adda80) Thanks [@miguelg719](https://github.com/miguelg719)! - Add user-agent to CDP connections

- [#1637](https://github.com/browserbase/stagehand/pull/1637) [`a7d29de`](https://github.com/browserbase/stagehand/commit/a7d29decee0f7d12e2437267b9eef1795d3b4e3a) Thanks [@miguelg719](https://github.com/miguelg719)! - Improve error and warning message for legacy model format

- [#1685](https://github.com/browserbase/stagehand/pull/1685) [`d334399`](https://github.com/browserbase/stagehand/commit/d3343990041bf9cd5613569840afb0c17131e33c) Thanks [@tkattkat](https://github.com/tkattkat)! - Bump ai sdk & google provider version

- [#1662](https://github.com/browserbase/stagehand/pull/1662) [`44416da`](https://github.com/browserbase/stagehand/commit/44416da7ff33301bb32d3811e6c3be8782a7d168) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - fix issue where locator.fill() was not working on elements that require direct value setting

- [#1612](https://github.com/browserbase/stagehand/pull/1612) [`bdd8b4e`](https://github.com/browserbase/stagehand/commit/bdd8b4ee3c697a02728375510ab7fae764990576) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - fix issue where screenshot mask was only being applied to the first element that the locator resolved to. masks now apply to all matching elements.

## 3.0.8

### Patch Changes

- [#1514](https://github.com/browserbase/stagehand/pull/1514) [`40ce5cc`](https://github.com/browserbase/stagehand/commit/40ce5cc83ec758f4e8c37132a7f4ac8eeea7ca34) Thanks [@tkattkat](https://github.com/tkattkat)! - Rename the close tool in agent to "done"

- [#1574](https://github.com/browserbase/stagehand/pull/1574) [`5506f41`](https://github.com/browserbase/stagehand/commit/5506f416d2609d112b553263984e21d7a30e32b1) Thanks [@tkattkat](https://github.com/tkattkat)! - fix(server): pass cdpUrl to localBrowserLaunchOptions when launchOptions absent

- [#1521](https://github.com/browserbase/stagehand/pull/1521) [`84c05ca`](https://github.com/browserbase/stagehand/commit/84c05ca8de4587181faf128e5c7464fd960caacc) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - fix: get agent cache working in API mode

- [#1486](https://github.com/browserbase/stagehand/pull/1486) [`692ffa0`](https://github.com/browserbase/stagehand/commit/692ffa0346ad3d121686aba503c0a22844293efa) Thanks [@tkattkat](https://github.com/tkattkat)! - improve logging in agent

- [#1551](https://github.com/browserbase/stagehand/pull/1551) [`1ef8901`](https://github.com/browserbase/stagehand/commit/1ef8901e1314e90f43b36be20192e652d3b5598f) Thanks [@miguelg719](https://github.com/miguelg719)! - move extract handler response log to after URL injection

- [#1495](https://github.com/browserbase/stagehand/pull/1495) [`72ac775`](https://github.com/browserbase/stagehand/commit/72ac775a831d6f0f376ceda4426525f93cc21452) Thanks [@tkattkat](https://github.com/tkattkat)! - export tool function & type to simplify defining custom tools

- [#1481](https://github.com/browserbase/stagehand/pull/1481) [`3d5af07`](https://github.com/browserbase/stagehand/commit/3d5af07f66d6d26d1f5ac4bd9be7183c3381dd92) Thanks [@tkattkat](https://github.com/tkattkat)! - add waitForTimeout to page

- [#1423](https://github.com/browserbase/stagehand/pull/1423) [`40e1d80`](https://github.com/browserbase/stagehand/commit/40e1d80776b9216422a25a81070ccb3105e56ec2) Thanks [@miguelg719](https://github.com/miguelg719)! - Improve benchmark handling and add metadata

- [#1588](https://github.com/browserbase/stagehand/pull/1588) [`56c0d24`](https://github.com/browserbase/stagehand/commit/56c0d244f9b2431218bfa832ddfc0587930ae038) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - add SnapshotOptions to page.snapshot()

- [#1483](https://github.com/browserbase/stagehand/pull/1483) [`16d72fb`](https://github.com/browserbase/stagehand/commit/16d72fb4c4081dd33bf45605d75c27644ea4c00e) Thanks [@tkattkat](https://github.com/tkattkat)! - Optimize screenshot handling in agent hybrid mode

- [#1498](https://github.com/browserbase/stagehand/pull/1498) [`088c4cc`](https://github.com/browserbase/stagehand/commit/088c4cc31dc924bb232a9d5a09ab42cd961c2d36) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - fix: replaying cached actions (for agent & act) now uses the originally defined model (instead of the default model) when an action fails and inference needs to be rerun

- [#1575](https://github.com/browserbase/stagehand/pull/1575) [`4276f4a`](https://github.com/browserbase/stagehand/commit/4276f4abc8bbde215faac6c0321bf243484c376b) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - expose port param in localBrowserLaunchOptions

- [#1544](https://github.com/browserbase/stagehand/pull/1544) [`6005786`](https://github.com/browserbase/stagehand/commit/600578637e65f6fd18b0cdb322b9e0b857708b2f) Thanks [@tkattkat](https://github.com/tkattkat)! - Recommend hybrid mode over DOM mode in agent, which is now considered legacy

- [#1505](https://github.com/browserbase/stagehand/pull/1505) [`6fbf5fc`](https://github.com/browserbase/stagehand/commit/6fbf5fc811e5e5d9d22f10c5309fbd336892263a) Thanks [@tkattkat](https://github.com/tkattkat)! - Add structured output to agent result + ensure close tool is always called

- [#1511](https://github.com/browserbase/stagehand/pull/1511) [`704cf18`](https://github.com/browserbase/stagehand/commit/704cf18cb2bdd187ba06c35f05ccb47317a7668c) Thanks [@shrey150](https://github.com/shrey150)! - Fix ControlOrMeta keypress event

- [#1480](https://github.com/browserbase/stagehand/pull/1480) [`091296e`](https://github.com/browserbase/stagehand/commit/091296e438bb2374c8bb10ef6c08283978145ebf) Thanks [@tkattkat](https://github.com/tkattkat)! - Update agent to only calculate xpath when caching is enabled

- [#1509](https://github.com/browserbase/stagehand/pull/1509) [`e56c6eb`](https://github.com/browserbase/stagehand/commit/e56c6eb139bf3aad37e98b16626fff13a6c671d0) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - add support for page.waitForSelector()

- [#1478](https://github.com/browserbase/stagehand/pull/1478) [`2cb78d0`](https://github.com/browserbase/stagehand/commit/2cb78d0f5ddef9f7337a9a2fe3137f1421df700a) Thanks [@tkattkat](https://github.com/tkattkat)! - update agent message handling

- [#1518](https://github.com/browserbase/stagehand/pull/1518) [`5dad639`](https://github.com/browserbase/stagehand/commit/5dad63938f08d968d434bb1ee2804f1e54fb836a) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - add page.snapshot() for capturing a stringified DOM snapshot of the page, including an xpath map & url map

- [#1576](https://github.com/browserbase/stagehand/pull/1576) [`b7c2571`](https://github.com/browserbase/stagehand/commit/b7c2571ad4ac563f3ca0518e1f29a40da93e33bc) Thanks [@tkattkat](https://github.com/tkattkat)! - utilize waitForSelector when running agent cache

- [#1560](https://github.com/browserbase/stagehand/pull/1560) [`4c69117`](https://github.com/browserbase/stagehand/commit/4c6911748953199dc9aad3eabe98bcf325f871e4) Thanks [@tkattkat](https://github.com/tkattkat)! - Update coordinate handling in cua and hybrid

## 3.0.7

### Patch Changes

- [#1461](https://github.com/browserbase/stagehand/pull/1461) [`0f3991e`](https://github.com/browserbase/stagehand/commit/0f3991eedc0aaff72ef718dda3ddb0839cf4a464) Thanks [@tkattkat](https://github.com/tkattkat)! - Move hybrid mode out of experimental

- [#1433](https://github.com/browserbase/stagehand/pull/1433) [`e0e22e0`](https://github.com/browserbase/stagehand/commit/e0e22e06bc752a8ffde30f3dbfa58d91e24e6c09) Thanks [@tkattkat](https://github.com/tkattkat)! - Put hybrid mode behind experimental

- [#1456](https://github.com/browserbase/stagehand/pull/1456) [`f261051`](https://github.com/browserbase/stagehand/commit/f2610517d74774374de9ee93191e663439ef55e5) Thanks [@shrey150](https://github.com/shrey150)! - Invoke page.hover for agent move action

- [#1473](https://github.com/browserbase/stagehand/pull/1473) [`e021674`](https://github.com/browserbase/stagehand/commit/e021674f9641c1c5f9d0c1817c3fdf599eea124d) Thanks [@shrey150](https://github.com/shrey150)! - Add safety confirmation support for OpenAI + Google CUA

- [#1399](https://github.com/browserbase/stagehand/pull/1399) [`6a5496f`](https://github.com/browserbase/stagehand/commit/6a5496f17dbb716be1ee1aaa4e5ba9d8c723b30b) Thanks [@tkattkat](https://github.com/tkattkat)! - Ensure cua agent is killed when stagehand.close is called

- [#1436](https://github.com/browserbase/stagehand/pull/1436) [`fea1700`](https://github.com/browserbase/stagehand/commit/fea1700552af3319052f463685752501c8e71de3) Thanks [@miguelg719](https://github.com/miguelg719)! - Fix auto-load key for act/extract/observe parametrized models on api

- [#1439](https://github.com/browserbase/stagehand/pull/1439) [`5b288d9`](https://github.com/browserbase/stagehand/commit/5b288d9ac37406ff22460ac8050bea26b87a378e) Thanks [@tkattkat](https://github.com/tkattkat)! - Remove base64 from agent actions array (still present in messages object)

- [#1408](https://github.com/browserbase/stagehand/pull/1408) [`e822f5a`](https://github.com/browserbase/stagehand/commit/e822f5a8898df9eb48ca32c321025f0c74b638f0) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - allow for act() cache hit when variable values change

- [#1472](https://github.com/browserbase/stagehand/pull/1472) [`638efc7`](https://github.com/browserbase/stagehand/commit/638efc7fea401bc43dd05dceedf4c13a3495a728) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - fix: agent cache not refreshed on action failure

- [#1424](https://github.com/browserbase/stagehand/pull/1424) [`a890f16`](https://github.com/browserbase/stagehand/commit/a890f16fa3a752f308f858e5ab9c9a0faf6b3b34) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - fix: "Error: -32000 Failed to convert response to JSON: CBOR: stack limit exceeded"

- [#1418](https://github.com/browserbase/stagehand/pull/1418) [`934f492`](https://github.com/browserbase/stagehand/commit/934f492ec587bef81f0ce75b45a35b44ab545712) Thanks [@miguelg719](https://github.com/miguelg719)! - Cleanup handlers and bus listeners on close

- [#1430](https://github.com/browserbase/stagehand/pull/1430) [`bd2db92`](https://github.com/browserbase/stagehand/commit/bd2db925f66a826d61d58be1611d55646cbdb560) Thanks [@shrey150](https://github.com/shrey150)! - Fix CUA model coordinate translation

- [#1465](https://github.com/browserbase/stagehand/pull/1465) [`51e0170`](https://github.com/browserbase/stagehand/commit/51e01709ce1c947c1947b4e2cb0b1f4f97b77182) Thanks [@miguelg719](https://github.com/miguelg719)! - Add media resolution high provider option to gemini 3 hybrid agent

- [#1431](https://github.com/browserbase/stagehand/pull/1431) [`05f5580`](https://github.com/browserbase/stagehand/commit/05f5580937c3c157550e3c25ae6671f44f562211) Thanks [@tkattkat](https://github.com/tkattkat)! - Update the cache handling for agent

- [#1432](https://github.com/browserbase/stagehand/pull/1432) [`f56a9c2`](https://github.com/browserbase/stagehand/commit/f56a9c296d4ddce25a405358c66837f8ce4d679f) Thanks [@tkattkat](https://github.com/tkattkat)! - Deprecate cua: true in favor of mode: "cua"

- [#1406](https://github.com/browserbase/stagehand/pull/1406) [`b40ae11`](https://github.com/browserbase/stagehand/commit/b40ae11391af49c3581fce27faa1b7483fc4a169) Thanks [@tkattkat](https://github.com/tkattkat)! - Add support for hovering with coordinates (page.hover)

- [#1407](https://github.com/browserbase/stagehand/pull/1407) [`0d2b398`](https://github.com/browserbase/stagehand/commit/0d2b398cd40b32a9ecaf28ede70853036b7c91bd) Thanks [@tkattkat](https://github.com/tkattkat)! - Clean up page methods

- [#1412](https://github.com/browserbase/stagehand/pull/1412) [`cd01f29`](https://github.com/browserbase/stagehand/commit/cd01f290578eac703521f801ba3712f5332918f3) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - fix: load GOOGLE_API_KEY from .env

- [#1462](https://github.com/browserbase/stagehand/pull/1462) [`a734fca`](https://github.com/browserbase/stagehand/commit/a734fca0b4573753767d3ebc48ec414baf4f23e1) Thanks [@shrey150](https://github.com/shrey150)! - fix: correctly pass userDataDir to chrome launcher

- [#1466](https://github.com/browserbase/stagehand/pull/1466) [`b342acf`](https://github.com/browserbase/stagehand/commit/b342acfaae058127fb57664644c5fd965db02bf2) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - move playwright to optional dependencies

- [#1440](https://github.com/browserbase/stagehand/pull/1440) [`2987cd1`](https://github.com/browserbase/stagehand/commit/2987cd1e5ffabefa9411936609635d4a638faed5) Thanks [@tkattkat](https://github.com/tkattkat)! - [Feature] support excluding tools from agent

- [#1455](https://github.com/browserbase/stagehand/pull/1455) [`dfab1d5`](https://github.com/browserbase/stagehand/commit/dfab1d566299c8c5a63f20565a6da07dc8f61ccd) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - update aisdk client to better enforce structured output with deepseek models

- [#1428](https://github.com/browserbase/stagehand/pull/1428) [`4d71162`](https://github.com/browserbase/stagehand/commit/4d71162beb119635b69b17637564a2bbd0e373e7) Thanks [@tkattkat](https://github.com/tkattkat)! - Add "hybrid" mode to stagehand agent

## 3.0.6

### Patch Changes

- [#1388](https://github.com/browserbase/stagehand/pull/1388) [`605ed6b`](https://github.com/browserbase/stagehand/commit/605ed6b81a3ff8f25d4022f1e5fce6b42aecfc19) Thanks [@miguelg719](https://github.com/miguelg719)! - Fix multiple click event dispatches on CDP and Anthropic CUA handling (double clicks)

- [#1400](https://github.com/browserbase/stagehand/pull/1400) [`34e7e5b`](https://github.com/browserbase/stagehand/commit/34e7e5b292f5e6af6efc0da60118663310c5f718) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - don't write base64 encoded screenshots to disk when caching agent actions

- [#1345](https://github.com/browserbase/stagehand/pull/1345) [`943d2d7`](https://github.com/browserbase/stagehand/commit/943d2d79d0f289ac41c9164578f2f1dd876058f2) Thanks [@tkattkat](https://github.com/tkattkat)! - Add support for aborting / stopping an agent run & continuing an agent run using messages from prior runs

- [#1334](https://github.com/browserbase/stagehand/pull/1334) [`0e95cd2`](https://github.com/browserbase/stagehand/commit/0e95cd2f67672f64f0017024fd47d8b3aef59a95) Thanks [@tkattkat](https://github.com/tkattkat)! - Add support for google vertex provider

- [#1410](https://github.com/browserbase/stagehand/pull/1410) [`d4237e4`](https://github.com/browserbase/stagehand/commit/d4237e40951ecd10abfdbe766672d498f8806484) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - fix: include extract in stagehand.history()

- [#1315](https://github.com/browserbase/stagehand/pull/1315) [`86975e7`](https://github.com/browserbase/stagehand/commit/86975e795db7505804949a267b20509bd16b5256) Thanks [@tkattkat](https://github.com/tkattkat)! - Add streaming support to agent through stream:true in the agent config

- [#1304](https://github.com/browserbase/stagehand/pull/1304) [`d5e119b`](https://github.com/browserbase/stagehand/commit/d5e119be5eec84915a79f8d611b6ba0546f48c99) Thanks [@miguelg719](https://github.com/miguelg719)! - Add support for Microsoft's Fara-7B

- [#1346](https://github.com/browserbase/stagehand/pull/1346) [`4e051b2`](https://github.com/browserbase/stagehand/commit/4e051b23add7ae276b0dbead38b4587838cfc1c1) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - fix: don't attach to targets twice

- [#1327](https://github.com/browserbase/stagehand/pull/1327) [`6b5a3c9`](https://github.com/browserbase/stagehand/commit/6b5a3c9035654caaed2da375085b465edda97de4) Thanks [@miguelg719](https://github.com/miguelg719)! - Informed error parsing from api

- [#1335](https://github.com/browserbase/stagehand/pull/1335) [`bb85ad9`](https://github.com/browserbase/stagehand/commit/bb85ad912738623a7a866f0cb6e8d5807c6c2738) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - add support for page.addInitScript()

- [#1331](https://github.com/browserbase/stagehand/pull/1331) [`88d28cc`](https://github.com/browserbase/stagehand/commit/88d28cc6f31058d1cf6ec6dc948a4ae77a926b3c) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - fix: page.evaluate() now works with scripts injected via context.addInitScript()

- [#1316](https://github.com/browserbase/stagehand/pull/1316) [`45bcef0`](https://github.com/browserbase/stagehand/commit/45bcef0e5788b083f9e38dfd7c3bc63afcd4b6dd) Thanks [@tkattkat](https://github.com/tkattkat)! - Add support for callbacks in stagehand agent

- [#1374](https://github.com/browserbase/stagehand/pull/1374) [`6aa9d45`](https://github.com/browserbase/stagehand/commit/6aa9d455aa5836ec2ee8ab2e8b9df3fb218e5381) Thanks [@miguelg719](https://github.com/miguelg719)! - Fix key action mapping in Anthropic CUA

- [#1330](https://github.com/browserbase/stagehand/pull/1330) [`d382084`](https://github.com/browserbase/stagehand/commit/d382084745fff98c3e71413371466394a2625429) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - fix: make act, extract, and observe respect user defined timeout param

- [#1336](https://github.com/browserbase/stagehand/pull/1336) [`1df08cc`](https://github.com/browserbase/stagehand/commit/1df08ccb0a2cf73b5c37a91c129721114ff6371c) Thanks [@tkattkat](https://github.com/tkattkat)! - Patch agent on api

- [#1358](https://github.com/browserbase/stagehand/pull/1358) [`2b56600`](https://github.com/browserbase/stagehand/commit/2b566009606fcbba987260f21b075b318690ce99) Thanks [@tkattkat](https://github.com/tkattkat)! - Add support for 4.5 opus in cua agent

## 3.0.4

### Patch Changes

- [#1281](https://github.com/browserbase/stagehand/pull/1281) [`fa18cfd`](https://github.com/browserbase/stagehand/commit/fa18cfdc45f28e35e6566587b54612396e6ece45) Thanks [@monadoid](https://github.com/monadoid)! - Add Browserbase session URL and debug URL accessors

- [#1264](https://github.com/browserbase/stagehand/pull/1264) [`767d168`](https://github.com/browserbase/stagehand/commit/767d1686285cf9c57675595f553f8a891f13c63b) Thanks [@Kylejeong2](https://github.com/Kylejeong2)! - feat: adding gpt 5.1 to stagehand

- [#1282](https://github.com/browserbase/stagehand/pull/1282) [`f27a99c`](https://github.com/browserbase/stagehand/commit/f27a99c11b020b33736fe67af8f7f0e663c6f45f) Thanks [@tkattkat](https://github.com/tkattkat)! - Add support for zod 4, while maintaining backwards compatibility for zod 3

- [#1295](https://github.com/browserbase/stagehand/pull/1295) [`91a1ca0`](https://github.com/browserbase/stagehand/commit/91a1ca07d9178c46269bfb951abb20a215eb7c29) Thanks [@tkattkat](https://github.com/tkattkat)! - Patch zod handling of non objects in extract

- [#1298](https://github.com/browserbase/stagehand/pull/1298) [`1dd7d43`](https://github.com/browserbase/stagehand/commit/1dd7d4330de9022dc6cd45a8b5c86cb9e1b575ec) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - log Browserbase session status when websocket is closed due to session timeout

- [#1284](https://github.com/browserbase/stagehand/pull/1284) [`c0f3b98`](https://github.com/browserbase/stagehand/commit/c0f3b98277c15c77b2b4c3f55503e61ef3d27cf3) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - fix: waitForDomNetworkQuiet() causing `act()` to hang indefinitely

- [#1246](https://github.com/browserbase/stagehand/pull/1246) [`44bb4f5`](https://github.com/browserbase/stagehand/commit/44bb4f51dcccbdca8df07e4d7f8d28a7e6e793ec) Thanks [@filip-michalsky](https://github.com/filip-michalsky)! - make ci faster

- [#1300](https://github.com/browserbase/stagehand/pull/1300) [`2b70347`](https://github.com/browserbase/stagehand/commit/2b7034771bc6d6b1fabb13deaa56c299881b3728) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - add support for context.addInitScript()

## 3.0.3

### Patch Changes

- [#1273](https://github.com/browserbase/stagehand/pull/1273) [`ab51232`](https://github.com/browserbase/stagehand/commit/ab51232db428be048957c0f5d67f2176eb7a5194) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - fix: trigger shadow root rerender in OOPIFs by cloning & replacing instead of reloading

- [#1268](https://github.com/browserbase/stagehand/pull/1268) [`c76ade0`](https://github.com/browserbase/stagehand/commit/c76ade009ef81208accae6475ec4707d3906e566) Thanks [@tkattkat](https://github.com/tkattkat)! - Expose reasoning, and cached input tokens in stagehand metrics

- [#1267](https://github.com/browserbase/stagehand/pull/1267) [`ffb5e5d`](https://github.com/browserbase/stagehand/commit/ffb5e5d2ab49adcb2efdfc9e5c76e8c96268b5b3) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - fix: file uploads failing on Browserbase

- [#1269](https://github.com/browserbase/stagehand/pull/1269) [`772e735`](https://github.com/browserbase/stagehand/commit/772e73543e45106d7fa0fafd95ade46ae11023bc) Thanks [@tkattkat](https://github.com/tkattkat)! - Add example using playwright screen recording

## 3.0.2

### Patch Changes

- [#1245](https://github.com/browserbase/stagehand/pull/1245) [`a224b33`](https://github.com/browserbase/stagehand/commit/a224b3371b6c1470baf342742fb745c7192b52c6) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - allow act() to call hover()

- [#1234](https://github.com/browserbase/stagehand/pull/1234) [`6fc9de2`](https://github.com/browserbase/stagehand/commit/6fc9de2a1079e4f2fb0b1633d8df0bb7a9f7f89f) Thanks [@miguelg719](https://github.com/miguelg719)! - Add a page.sendCDP method

- [#1233](https://github.com/browserbase/stagehand/pull/1233) [`4935be7`](https://github.com/browserbase/stagehand/commit/4935be788b3431527f3d110864c0fd7060cfaf7c) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - extend page.screenshot() options to mirror playwright

- [#1232](https://github.com/browserbase/stagehand/pull/1232) [`bdd76fc`](https://github.com/browserbase/stagehand/commit/bdd76fcd1e48079fc5ab8cf040ebb5997dfc6c99) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - export Page type

- [#1229](https://github.com/browserbase/stagehand/pull/1229) [`7ea18a4`](https://github.com/browserbase/stagehand/commit/7ea18a420fc033d1b72556db83a1f41735e5a022) Thanks [@tkattkat](https://github.com/tkattkat)! - Adjust extract tool + expose extract response in agent result

- [#1239](https://github.com/browserbase/stagehand/pull/1239) [`d4de014`](https://github.com/browserbase/stagehand/commit/d4de014235a18f9e1089240bc72e28cbfe77ca1c) Thanks [@miguelg719](https://github.com/miguelg719)! - Fix stagehand.metrics on api mode

- [#1241](https://github.com/browserbase/stagehand/pull/1241) [`2d1b573`](https://github.com/browserbase/stagehand/commit/2d1b5732dc441a3331f5743cdfed3e1037d8b3b5) Thanks [@miguelg719](https://github.com/miguelg719)! - Return response on page.goto api mode

- [#1253](https://github.com/browserbase/stagehand/pull/1253) [`5556041`](https://github.com/browserbase/stagehand/commit/5556041e2deaed5012363303fd7a8ac00e3242cd) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - fix missing page issue when connecting to existing browser

- [#1235](https://github.com/browserbase/stagehand/pull/1235) [`7e4b43e`](https://github.com/browserbase/stagehand/commit/7e4b43ed46fbdd2074827e87d9a245e2dc96456b) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - make page.goto() return a Response object

- [#1254](https://github.com/browserbase/stagehand/pull/1254) [`7e72adf`](https://github.com/browserbase/stagehand/commit/7e72adfd7e4af5ec49ac2f552e7f1f57c1acc554) Thanks [@sameelarif](https://github.com/sameelarif)! - Added custom error types to allow for a smoother debugging experience.

- [#1227](https://github.com/browserbase/stagehand/pull/1227) [`9bf09d0`](https://github.com/browserbase/stagehand/commit/9bf09d041111870d71cb9ffcb3ac5fa2c4b1399d) Thanks [@miguelg719](https://github.com/miguelg719)! - Fix readme's media links and add instructions for installing from a branch

- [#1257](https://github.com/browserbase/stagehand/pull/1257) [`92d32ea`](https://github.com/browserbase/stagehand/commit/92d32eafe91a4241615cc65501b8461c6074a02b) Thanks [@tkattkat](https://github.com/tkattkat)! - Add support for a custom baseUrl with google cua client

- [#1230](https://github.com/browserbase/stagehand/pull/1230) [`ebcf3a1`](https://github.com/browserbase/stagehand/commit/ebcf3a1ffa859374d71de4931c6a9b982a565e46) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - add stagehand.browserbaseSessionID getter

- [#1262](https://github.com/browserbase/stagehand/pull/1262) [`c29a4f2`](https://github.com/browserbase/stagehand/commit/c29a4f2eca91ae2902ed9d48b2385b4436f7b664) Thanks [@miguelg719](https://github.com/miguelg719)! - Remove error throwing when api and experimental are both set

- [#1223](https://github.com/browserbase/stagehand/pull/1223) [`6d21efa`](https://github.com/browserbase/stagehand/commit/6d21efa8b30317aa3ce3e37ac6c2222af3b967b5) Thanks [@miguelg719](https://github.com/miguelg719)! - Disable api mode when using custom LLM clients

- [#1228](https://github.com/browserbase/stagehand/pull/1228) [`525ef0c`](https://github.com/browserbase/stagehand/commit/525ef0c1243aaf3452ee7e4ea81b4208f4c2efd1) Thanks [@Kylejeong2](https://github.com/Kylejeong2)! - update slack link in docs

- [#1226](https://github.com/browserbase/stagehand/pull/1226) [`9ddb872`](https://github.com/browserbase/stagehand/commit/9ddb872e350358214e12a91cf6a614fd2ec1f74c) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - add support for page.on('console') events

## 3.0.1

### Patch Changes

- [#1207](https://github.com/browserbase/stagehand/pull/1207) [`55da8c6`](https://github.com/browserbase/stagehand/commit/55da8c6e9575cbad3246c55b17650cf6b293ddbe) Thanks [@miguelg719](https://github.com/miguelg719)! - Fix broken links to quickstart docs

- [#1200](https://github.com/browserbase/stagehand/pull/1200) [`0a5ee63`](https://github.com/browserbase/stagehand/commit/0a5ee638bde051d109eb2266e665934a12f3dc31) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - log info when scope narrowing selector fails

- [#1205](https://github.com/browserbase/stagehand/pull/1205) [`ee76881`](https://github.com/browserbase/stagehand/commit/ee7688156cb67a9f0f90dfe0dbab77423693a332) Thanks [@miguelg719](https://github.com/miguelg719)! - Update README.md, add Changelog for v3

- [#1209](https://github.com/browserbase/stagehand/pull/1209) [`9e95add`](https://github.com/browserbase/stagehand/commit/9e95add37eb30db4f85e73df7760c7e63fb4131e) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - fix circular import in exported aisdk example client

- [#1211](https://github.com/browserbase/stagehand/pull/1211) [`98e212b`](https://github.com/browserbase/stagehand/commit/98e212b27887241879608c6c1b6c2524477a40d7) Thanks [@miguelg719](https://github.com/miguelg719)! - Add an example for passing custom tools to agent

- [#1206](https://github.com/browserbase/stagehand/pull/1206) [`d5ecbfc`](https://github.com/browserbase/stagehand/commit/d5ecbfc8e419a59b91c2115fd7f984378381d3d0) Thanks [@miguelg719](https://github.com/miguelg719)! - Export example AISdkClient properly from the stagehand package


================================================
FILE: packages/core/README.md
================================================
<div id="toc" align="center" style="margin-bottom: 0;">
  <ul style="list-style: none; margin: 0; padding: 0;">
    <a href="https://stagehand.dev">
      <picture>
        <source media="(prefers-color-scheme: dark)" srcset="../../media/dark_logo.png" />
        <img alt="Stagehand" src="../../media/light_logo.png" width="200" style="margin-right: 30px;" />
      </picture>
    </a>
  </ul>
</div>
<p align="center">
  <strong>The AI Browser Automation Framework</strong><br>
  <a href="https://docs.stagehand.dev">Read the Docs</a>
</p>

<p align="center">
  <a href="https://github.com/browserbase/stagehand/tree/main?tab=MIT-1-ov-file#MIT-1-ov-file">
    <picture>
      <source media="(prefers-color-scheme: dark)" srcset="../../media/dark_license.svg" />
      <img alt="MIT License" src="../../media/light_license.svg" />
    </picture>
  </a>
  <a href="https://stagehand.dev/discord">
    <picture>
      <source media="(prefers-color-scheme: dark)" srcset="../../media/dark_discord.svg" />
      <img alt="Discord Community" src="../../media/light_discord.svg" />
    </picture>
  </a>
</p>

<p align="center">
	<a href="https://trendshift.io/repositories/12122" target="_blank"><img src="https://trendshift.io/api/badge/repositories/12122" alt="browserbase%2Fstagehand | Trendshift" style="width: 250px; height: 55px;" width="250" height="55"/></a>
</p>

<p align="center">
  <a href="https://deepwiki.com/browserbase/stagehand">
    <img alt="Ask DeepWiki" src="https://deepwiki.com/badge.svg" />
  </a>
</p>

<p align="center">
If you're looking for the Python implementation, you can find it
<a href="https://github.com/browserbase/stagehand-python">here</a>.
</p>

<div align="center" style="display: flex; align-items: center; justify-content: center; gap: 4px; margin-bottom: 0;">
  <b>Vibe code</b>
  <span style="font-size: 1.05em;"> Stagehand with </span>
  <a href="https://director.ai" style="display: flex; align-items: center;">
    <span>Director</span>
  </a>
  <span> </span>
  <picture>
    <img alt="Director" src="../../media/director_icon.svg" width="25" />
  </picture>
</div>

## What is Stagehand?

Stagehand is a browser automation framework used to control web browsers with natural language and code. By combining the power of AI with the precision of code, Stagehand makes web automation flexible, maintainable, and actually reliable.

## Why Stagehand?

Most existing browser automation tools either require you to write low-level code in a framework like Selenium, Playwright, or Puppeteer, or use high-level agents that can be unpredictable in production. By letting developers choose what to write in code vs. natural language (and bridging the gap between the two) Stagehand is the natural choice for browser automations in production.

1. **Choose when to write code vs. natural language**: use AI when you want to navigate unfamiliar pages, and use code when you know exactly what you want to do.

2. **Go from AI-driven to repeatable workflows**: Stagehand lets you preview AI actions before running them, and also helps you easily cache repeatable actions to save time and tokens.

3. **Write once, run forever**: Stagehand's auto-caching combined with self-healing remembers previous actions, runs without LLM inference, and knows when to involve AI whenever the website changes and your automation breaks.

## Getting Started

Get started with Stagehand in one line of code, or check out our [Quickstart Guide](https://docs.stagehand.dev/v3/first-steps/quickstart) for more information:

```bash
npx create-browser-app
```

## Example

Here's how to build a sample browser automation with Stagehand:

```typescript
// Stagehand's CDP engine provides an optimized, low level interface to the browser built for automation
const page = stagehand.context.pages()[0];
await page.goto("https://github.com/browserbase");

// Use act() to execute individual actions
await stagehand.act("click on the stagehand repo");

// Use agent() for multi-step tasks
const agent = stagehand.agent();
await agent.execute("Get to the latest PR");

// Use extract() to get structured data from the page
const { author, title } = await stagehand.extract(
  "extract the author and title of the PR",
  z.object({
    author: z.string().describe("The username of the PR author"),
    title: z.string().describe("The title of the PR"),
  }),
);
```

## Documentation

Visit [docs.stagehand.dev](https://docs.stagehand.dev) to view the full documentation.

### Build and Run from Source

```bash
git clone https://github.com/browserbase/stagehand.git
cd stagehand
pnpm install
pnpm run build
pnpm run example # run the blank script at ./examples/example.ts
```

Stagehand is best when you have an API key for an LLM provider and Browserbase credentials. To add these to your project, run:

```bash
cp .env.example .env
nano .env # Edit the .env file to add API keys
```

### Installing from a branch

You can install and build Stagehand directly from a GitHub branch using [gitpkg](https://github.com/EqualMa/gitpkg).

In your project's `package.json` set:

```json
"@browserbasehq/stagehand": "https://gitpkg.now.sh/browserbase/stagehand/packages/core?<branchName>",
```

## Contributing

> [!NOTE]
> We highly value contributions to Stagehand! For questions or support, please join our [Discord community](https://stagehand.dev/discord).

At a high level, we're focused on improving reliability, extensibility, speed, and cost in that order of priority. If you're interested in contributing, **bug fixes and small improvements are the best way to get started**. For more involved features, we strongly recommend reaching out to [Miguel Gonzalez](https://x.com/miguel_gonzf) or [Paul Klein](https://x.com/pk_iv) in our [Discord community](https://stagehand.dev/discord) before starting to ensure that your contribution aligns with our goals.

<!-- For more information, please see our [Contributing Guide](https://docs.stagehand.dev/examples/contributing). -->

## Acknowledgements

We'd like to thank the following people for their major contributions to Stagehand:

- [Paul Klein](https://github.com/pkiv)
- [Sean McGuire](https://github.com/seanmcguire12)
- [Miguel Gonzalez](https://github.com/miguelg719)
- [Sameel Arif](https://github.com/sameelarif)
- [Thomas Katwan](https://github.com/tkattkat)
- [Filip Michalsky](https://github.com/filip-michalsky)
- [Anirudh Kamath](https://github.com/kamath)
- [Jeremy Press](https://x.com/jeremypress)
- [Navid Pour](https://github.com/navidpour)

## License

Licensed under the MIT License.

Copyright 2025 Browserbase, Inc.


================================================
FILE: packages/core/examples/2048.ts
================================================
import { Stagehand } from "../lib/v3/index.js";
import { z } from "zod";

async function example() {
  console.log("🎮 Starting 2048 bot...");
  const stagehand = new Stagehand({
    env: "LOCAL",
    verbose: 1,
  });

  console.log("🌟 Initializing Stagehand...");
  await stagehand.init();
  const page = stagehand.context.pages()[0];
  try {
    console.log("🌐 Navigating to 2048...");
    await page.goto("https://ovolve.github.io/2048-AI/");
    // Main game loop
    while (true) {
      console.log("🔄 Game loop iteration...");
      // Add a small delay for UI updates
      await new Promise((resolve) => setTimeout(resolve, 300));
      // Get current game state
      const gameState = await stagehand.extract(
        `Extract the current game state:
          1. Score from the score counter
          2. All tile values in the 4x4 grid (empty spaces as 0)
          3. Highest tile value present`,
        z.object({
          score: z.number(),
          highestTile: z.number(),
          grid: z.array(z.array(z.number())),
        }),
      );
      const transposedGrid = gameState.grid[0].map((_, colIndex) =>
        gameState.grid.map((row) => row[colIndex]),
      );
      const grid = transposedGrid.map((row, rowIndex) => ({
        [`row${rowIndex + 1}`]: row,
      }));
      console.log("Game State:", {
        score: gameState.score,
        highestTile: gameState.highestTile,
        grid: grid,
      });
      // Analyze board and decide next move
      const analysis = await stagehand.extract(
        `Based on the current game state:
          - Score: ${gameState.score}
          - Highest tile: ${gameState.highestTile}
          - Grid: This is a 4x4 matrix ordered by row (top to bottom) and column (left to right). The rows are stacked vertically, and tiles can move vertically between rows or horizontally between columns:\n${grid
            .map((row) => {
              const rowName = Object.keys(row)[0];
              return `             ${rowName}: ${row[rowName].join(", ")}`;
            })
            .join("\n")}
          What is the best move (up/down/left/right)? Consider:
          1. Keeping high value tiles in corners (bottom left, bottom right, top left, top right)
          2. Maintaining a clear path to merge tiles
          3. Avoiding moves that could block merges
          4. Only adjacent tiles of the same value can merge
          5. Making a move will move all tiles in that direction until they hit a tile of a different value or the edge of the board
          6. Tiles cannot move past the edge of the board
          7. Each move must move at least one tile`,
        z.object({
          move: z.enum(["up", "down", "left", "right"]),
          confidence: z.number(),
          reasoning: z.string(),
        }),
      );
      console.log("Move Analysis:", analysis);
      const moveKey = {
        up: "ArrowUp",
        down: "ArrowDown",
        left: "ArrowLeft",
        right: "ArrowRight",
      }[analysis.move];
      await page.keyPress(moveKey);
      console.log("🎯 Executed move:", analysis.move);
    }
  } catch (error) {
    console.error("❌ Error in game loop:", error);
    const isGameOver = await page.evaluate(() => {
      return document.querySelector(".game-over") !== null;
    });
    if (isGameOver) {
      console.log("🏁 Game Over!");
      return;
    }
    throw error; // Re-throw non-game-over errors
  }
}
// Script entry point: start the bot as soon as the module is loaded.
(async function runExample() {
  await example();
})();


================================================
FILE: packages/core/examples/CHANGELOG.md
================================================
# @browserbasehq/stagehand-examples

## 1.0.9

### Patch Changes

- Updated dependencies [[`09b5e1e`](https://github.com/browserbase/stagehand/commit/09b5e1e9c23c845903686db6665cc968ac34efbb), [`e3734b9`](https://github.com/browserbase/stagehand/commit/e3734b9c98352d5f0a4eca49791b0bbf2130ab41), [`8244ab2`](https://github.com/browserbase/stagehand/commit/8244ab247cd679962685ae2f7c54e874ce1fa614), [`be85b19`](https://github.com/browserbase/stagehand/commit/be85b19679a826f19702e00f0aae72fce1118ec8), [`88d1565`](https://github.com/browserbase/stagehand/commit/88d1565c65bb65a104fea2d5f5e862bbbda69677), [`ab5d6ed`](https://github.com/browserbase/stagehand/commit/ab5d6ede19aabc059badc4247f1cb2c6c9e71bae)]:
  - @browserbasehq/stagehand@2.5.0

## 1.0.8

### Patch Changes

- Updated dependencies [[`9e8c173`](https://github.com/browserbase/stagehand/commit/9e8c17374fdc8fbe7f26e6cf802c36bd14f11039)]:
  - @browserbasehq/stagehand@2.4.4

## 1.0.7

### Patch Changes

- Updated dependencies [[`f45afdc`](https://github.com/browserbase/stagehand/commit/f45afdccc8680650755fee66ffbeac32b41e075d), [`261bba4`](https://github.com/browserbase/stagehand/commit/261bba43fa79ac3af95328e673ef3e9fced3279b), [`8de7bd8`](https://github.com/browserbase/stagehand/commit/8de7bd8635c2051cd8025e365c6c8aa83d81c7e7), [`3d80421`](https://github.com/browserbase/stagehand/commit/3d804210a106a6828c7fa50f8b765b10afd4cc6a), [`0ead63d`](https://github.com/browserbase/stagehand/commit/0ead63d6526f6c286362b74b6407c8bebc900e69), [`8422828`](https://github.com/browserbase/stagehand/commit/8422828c4cd5fd5ebcf348cfbdb40c768bb76dd9), [`b769206`](https://github.com/browserbase/stagehand/commit/b7692060f98a2f49aeeefb90d8789ed034b08ec2), [`72d2683`](https://github.com/browserbase/stagehand/commit/72d2683202af7e578d98367893964b33e0828de5)]:
  - @browserbasehq/stagehand@2.4.3

## 1.0.6

### Patch Changes

- Updated dependencies [[`6b4e6e3`](https://github.com/browserbase/stagehand/commit/6b4e6e3f31d5496cf15728e9018eddeb04839542), [`e77d018`](https://github.com/browserbase/stagehand/commit/e77d0188683ebf596dfb78dfafbbca1dc32993f0), [`c20adb9`](https://github.com/browserbase/stagehand/commit/c20adb95539fed8c56a4aa413262a9c65a8e6474), [`b86df93`](https://github.com/browserbase/stagehand/commit/b86df93b9136aae96292121a29c25f3d74d84bf7), [`023c2c2`](https://github.com/browserbase/stagehand/commit/023c2c273b46d3792d7e5d3c902089487b16b531), [`8c28647`](https://github.com/browserbase/stagehand/commit/8c2864755ecd05c8f7de235d4198deec0dd5f78e), [`87e09c6`](https://github.com/browserbase/stagehand/commit/87e09c618940f364ec8af00455a19a17ec63cbd3), [`a611115`](https://github.com/browserbase/stagehand/commit/a61111525d70b450bdfc43f112380f44899c9e97), [`69913fe`](https://github.com/browserbase/stagehand/commit/69913fe1dfb8201ae2aeffa5f049fb46ab02cbc2), [`b1b83a1`](https://github.com/browserbase/stagehand/commit/b1b83a1d334fe76e5f5f9dd32dc92c16b7d40ce6), [`be8497c`](https://github.com/browserbase/stagehand/commit/be8497cb6b142cc893cea9692b8c47bd19514c60), [`98704c9`](https://github.com/browserbase/stagehand/commit/98704c9ed225ca25bbde4bb3dc286936e9c54471), [`04978bd`](https://github.com/browserbase/stagehand/commit/04978bdd30d2edcbc69eb9fd91358a16975ea2eb)]:
  - @browserbasehq/stagehand@2.4.2

## 1.0.5

### Patch Changes

- Updated dependencies [[`8a43c5a`](https://github.com/browserbase/stagehand/commit/8a43c5a86d4da40cfaedd9cf2e42186928bdf946), [`890ffcc`](https://github.com/browserbase/stagehand/commit/890ffccac5e0a60ade64a46eb550c981ffb3e84a), [`64c1072`](https://github.com/browserbase/stagehand/commit/64c10727bda50470483a3eb175c02842db0923a1), [`b077d3f`](https://github.com/browserbase/stagehand/commit/b077d3f48a97f47a71ccc79ae39b41e7f07f9c04), [`8bcb5d7`](https://github.com/browserbase/stagehand/commit/8bcb5d77debf6bf7601fd5c090efd7fde75c5d5e), [`7bf10c5`](https://github.com/browserbase/stagehand/commit/7bf10c55b267078fe847c1d7f7a60d604f9c7c94)]:
  - @browserbasehq/stagehand@2.4.1

## 1.0.4

### Patch Changes

- Updated dependencies [[`124e0d3`](https://github.com/browserbase/stagehand/commit/124e0d3bb54ddb6738ede6d7aa99a945ef1cacd1), [`6a18c1e`](https://github.com/browserbase/stagehand/commit/6a18c1ee1e46d55c6e90c4d5572e17ed8daa140c), [`1660751`](https://github.com/browserbase/stagehand/commit/1660751cd14cb5b27d44f8167216afb8d1c3c45c), [`cadac9d`](https://github.com/browserbase/stagehand/commit/cadac9da09123d12e5d496a0e8b12660964c1b33), [`759da55`](https://github.com/browserbase/stagehand/commit/759da55775eb2df81d56ae18c0f386fd9b02a9f0), [`a175a51`](https://github.com/browserbase/stagehand/commit/a175a519b8c14300db6f1ed30709e113d18e99db), [`8527a80`](https://github.com/browserbase/stagehand/commit/8527a80522c3eedb9516a6caa1a0e4e4be981a3d), [`55fca2f`](https://github.com/browserbase/stagehand/commit/55fca2f7da63cc0ef6e27b45a33f63c666cdce7e)]:
  - @browserbasehq/stagehand@2.4.0

## 1.0.3

### Patch Changes

- Updated dependencies [[`12a99b3`](https://github.com/browserbase/stagehand/commit/12a99b398d8a4c3eea3ca69a3cf793faaaf4aea3), [`2451797`](https://github.com/browserbase/stagehand/commit/2451797f64c0efa4a72fd70265110003c8d0a6cd), [`1d631a5`](https://github.com/browserbase/stagehand/commit/1d631a57a197390f672b718ae5199991ab27cfb1), [`9c398bb`](https://github.com/browserbase/stagehand/commit/9c398bb9ec2d10bdb53ad5aa7e3b58cce24fdb2b), [`c19ad7f`](https://github.com/browserbase/stagehand/commit/c19ad7f1e082e91fdeaa9c2ef63767a5a2b3a195)]:
  - @browserbasehq/stagehand@2.3.1

## 1.0.2

### Patch Changes

- Updated dependencies [[`5680d25`](https://github.com/browserbase/stagehand/commit/5680d2509352c383ad502c9f4fabde01fa638833), [`4de92a8`](https://github.com/browserbase/stagehand/commit/4de92a8af461fc95063faf39feee1d49259f58ba), [`6ef6073`](https://github.com/browserbase/stagehand/commit/6ef60730cab0ad9025f44b6eeb2c83751d1dcd35)]:
  - @browserbasehq/stagehand@2.3.0

## 1.0.1

### Patch Changes

- Updated dependencies [[`be8652e`](https://github.com/browserbase/stagehand/commit/be8652e770b57fdb3299fa0b2efa4eb0e816434e), [`6b413b7`](https://github.com/browserbase/stagehand/commit/6b413b7ad00b13ca0bd53ee2e7393023821408b6), [`7eafbd9`](https://github.com/browserbase/stagehand/commit/7eafbd9b1a73b37effa444929767df7c592caf02), [`1b50aa6`](https://github.com/browserbase/stagehand/commit/1b50aa61cf0a429dd6cb2760a08f7f698a50454b), [`f2b7f1f`](https://github.com/browserbase/stagehand/commit/f2b7f1f284eef1f96753319b66c7d0b273a6f8cd), [`c8d672f`](https://github.com/browserbase/stagehand/commit/c8d672f7c410c256defbc2e87ead99239837aa28), [`bebf204`](https://github.com/browserbase/stagehand/commit/bebf2044502333c694743078c5b0c9deae11fb79), [`37d6810`](https://github.com/browserbase/stagehand/commit/37d6810a704773d0383a86f98f5f17c7d5b21975)]:
  - @browserbasehq/stagehand@2.2.1


================================================
FILE: packages/core/examples/actionable_observe_example.ts
================================================
/**
 * This example shows how to use actionable observe()
 *
 * You can use observe to get a cache-able Playwright action as JSON, then pass that JSON to act() to perform the action.
 *
 * This is useful for:
 * - Previewing actions before running them
 * - Saving actions to a file and replaying them later
 * - Hiding sensitive information from LLMs
 *
 * For more on caching, see: https://docs.stagehand.dev/examples/caching
 * Also check out the form_filling_sensible.ts example for a more complex example of using observe() to fill out a form.
 */

import { Action, Stagehand } from "../lib/v3/index.js";

/**
 * Drives the apartments.com filter UI with the observe() -> act() pattern.
 *
 * For every instruction the script waits three seconds, asks observe() for a
 * matching action and replays the first result through act(). Once all steps
 * have run it reads the page URL and reports whether it contains the expected
 * filtered-search URL.
 *
 * The Stagehand session is closed even when a step fails, and a step for which
 * observe() finds nothing fails with an explicit error instead of handing
 * `undefined` to act().
 */
async function example() {
  const stagehand = new Stagehand({
    env: "BROWSERBASE",
    verbose: 1,
  });
  await stagehand.init();

  // Executed strictly in this order; each one is observed, then acted upon.
  const instructions = [
    "find the 'all filters' button",
    "find the '1+' button in the 'beds' section",
    "find the 'apartments' button in the 'home type' section",
    "find the pet policy dropdown to click on.",
    "find the 'Dog Friendly' option to click on",
    "find the 'see results' section",
  ];

  let currentUrl: string;
  try {
    const page = stagehand.context.pages()[0];

    await page.goto("https://www.apartments.com/san-francisco-ca/");

    for (const instruction of instructions) {
      // Pause before each observation so the previous action can take effect
      await new Promise((resolve) => setTimeout(resolve, 3000));

      const observations = await stagehand.observe(instruction);
      const observation: Action | undefined = observations[0];
      if (!observation) {
        throw new Error(
          `observe() returned no action for instruction: "${instruction}"`,
        );
      }
      await stagehand.act(observation);
    }

    // Capture the URL while the session is still open
    currentUrl = page.url();
  } finally {
    // Release the remote browser session on success and on failure alike
    await stagehand.close();
  }

  if (
    currentUrl.includes(
      "https://www.apartments.com/apartments/san-francisco-ca/min-1-bedrooms-pet-friendly-dog/",
    )
  ) {
    console.log("✅ Success! we made it to the correct page");
  } else {
    console.log(
      "❌ Whoops, looks like we didn't make it to the correct page. " +
        "\nThanks for testing out this new Stagehand feature!" +
        "\nReach us on Discord if you have any feedback/questions/suggestions!",
    );
  }
}

// Script entry point: run the walkthrough as soon as the module is loaded.
(async function runExample() {
  await example();
})();


================================================
FILE: packages/core/examples/agent-custom-tools.ts
================================================
/**
 * This example shows how to pass custom tools to stagehand agent (both CUA and non-CUA)
 */
import { z } from "zod";
import { tool } from "ai";
import { Stagehand } from "../lib/v3/index.js";
import chalk from "chalk";

// Stand-in for a real weather service; replace with your own API/tool logic.
// The location argument is accepted but ignored: every call resolves to the
// same canned reading.
// eslint-disable-next-line @typescript-eslint/no-unused-vars
async function fetchWeatherAPI(location: string) {
  const cannedReading = { temp: 70, conditions: "sunny" };
  return cannedReading;
}

// Weather lookup exposed to the agent, declared in the AI SDK tool format.
// Takes a `location` string and returns it alongside the temperature and
// conditions reported by fetchWeatherAPI.
const getWeather = tool({
  description: "Get the current weather in a location",
  inputSchema: z.object({
    location: z.string().describe("The location to get weather for"),
  }),
  execute: async ({ location }) => {
    // Your custom logic here
    const { temp, conditions } = await fetchWeatherAPI(location);
    return { location, temperature: temp, conditions };
  },
});

/**
 * Runs the custom-tools demo: starts a local Stagehand session, opens Google,
 * creates a CUA agent that has access to the `getWeather` tool, and asks it a
 * weather question. Errors raised while the agent runs are logged, and the
 * browser is always closed afterwards.
 */
async function main() {
  console.log(
    `\n${chalk.bold("Stagehand 🤘 Computer Use Agent (CUA) Demo")}\n`,
  );

  // Initialize Stagehand
  const stagehand = new Stagehand({
    env: "LOCAL",
    verbose: 2,
    experimental: true, // You must enable experimental mode to use custom tools / MCP integrations
    model: "anthropic/claude-sonnet-4-5",
  });
  await stagehand.init();

  try {
    const page = stagehand.context.pages()[0];

    // Navigate first: the system prompt below interpolates page.url(), so the
    // page must already be loaded for the agent to be told where it really is.
    await page.goto("https://www.google.com");

    // Create a computer use agent
    const agent = stagehand.agent({
      mode: "cua",
      model: {
        modelName: "anthropic/claude-sonnet-4-5-20250929",
        apiKey: process.env.ANTHROPIC_API_KEY,
      },
      systemPrompt: `You are a helpful assistant that can use a web browser.
      You are currently on the following page: ${page.url()}.
      Do not ask follow up questions, the user will trust your judgement. Today's date is ${new Date().toLocaleDateString()}.`,
      tools: {
        getWeather, // Pass the tools to the agent
      },
    });

    // Non-CUA alternative: omit `mode` and `model` to use the default agent.
    // const agent = stagehand.agent({
    //   systemPrompt: `You are a helpful assistant that can use a web browser.
    //   You are currently on the following page: ${page.url()}.
    //   Do not ask follow up questions, the user will trust your judgement. Today's date is ${new Date().toLocaleDateString()}.`,
    //   // Pass the tools to the agent
    //   tools: {
    //     getWeather: getWeather,
    //   },
    // });

    // Define the instruction for the CUA
    const instruction = "What's the weather in San Francisco?";
    console.log(`Instruction: ${chalk.white(instruction)}`);

    // Execute the instruction
    const result = await agent.execute({
      instruction,
      maxSteps: 20,
    });

    console.log(`${chalk.green("✓")} Execution complete`);
    console.log(`${chalk.yellow("⤷")} Result:`);
    console.log(chalk.white(JSON.stringify(result, null, 2)));
  } catch (error) {
    console.log(`${chalk.red("✗")} Error: ${error}`);
    if (error instanceof Error && error.stack) {
      // Drop the first stack line; it repeats the message printed above.
      console.log(chalk.dim(error.stack.split("\n").slice(1).join("\n")));
    }
  } finally {
    // Close the browser
    await stagehand.close();
  }
}

// Last-resort handler for errors that escape main() (e.g. from init() or close()).
main().catch((error) => {
  console.log(`${chalk.red("✗")} Unhandled error in main function`);
  console.log(chalk.red(error));
  // Report the failure to the shell/CI instead of exiting with status 0.
  process.exitCode = 1;
});


================================================
FILE: packages/core/examples/agent_stream_example.ts
================================================
import { Stagehand } from "../lib/v3/index.js";
import chalk from "chalk";

// Load environment variables
/**
 * Runs the streaming-agent demo: opens Amazon in a local browser, executes an
 * agent created with `stream: true`, writes the streamed text to stdout as it
 * arrives, then prints the final result. The browser is always closed.
 */
async function main() {
  console.log(`\n${chalk.bold("Stagehand 🤘 Agent Streaming Example")}\n`);
  // Initialize Stagehand
  const stagehand = new Stagehand({
    env: "LOCAL",
    verbose: 0,
    cacheDir: "stagehand-agent-cache",
    logInferenceToFile: false,
    experimental: true,
  });

  await stagehand.init();

  try {
    const page = stagehand.context.pages()[0];
    await page.goto("https://amazon.com");

    // Create a streaming agent with stream: true in the config
    const agent = stagehand.agent({
      model: "anthropic/claude-sonnet-4-5-20250929",
      stream: true, // This makes execute() return AgentStreamResult
    });

    const agentRun = await agent.execute({
      instruction: "go to amazon, and search for shampoo, stop after searching",
      maxSteps: 20,
    });
    // stream the text
    for await (const delta of agentRun.textStream) {
      process.stdout.write(delta);
    }
    // stream everything ( toolcalls, messages, etc.)
    // for await (const delta of agentRun.fullStream) {
    //   console.log(delta);
    // }

    const finalResult = await agentRun.result;
    console.log("Final Result:", finalResult);
  } catch (error) {
    console.log(`${chalk.red("✗")} Error: ${error}`);
  } finally {
    // Close the browser so the local session is not left running.
    await stagehand.close();
  }
}
// Script entry point; the returned promise is intentionally not awaited.
void main();


================================================
FILE: packages/core/examples/cua-example.ts
================================================
/**
 * This example shows how to use a computer use agent (CUA) to navigate a web page and extract data.
 *
 * To learn more about the CUA, see: https://docs.stagehand.dev/examples/computer_use
 *
 * NOTE: YOU MUST CONFIGURE BROWSER DIMENSIONS TO USE COMPUTER USE!
 * Check out stagehand.config.ts for more information.
 */
import { Stagehand } from "../lib/v3/index.js";
import chalk from "chalk";

/**
 * Runs the CUA demo: starts a local Stagehand session, opens the Browserbase
 * careers page, and lets a computer-use agent fill in (but not submit) a job
 * application. Errors raised while the agent runs are logged, and the browser
 * is always closed afterwards.
 */
async function main() {
  console.log(
    `\n${chalk.bold("Stagehand 🤘 Computer Use Agent (CUA) Demo")}\n`,
  );

  // Initialize Stagehand
  const stagehand = new Stagehand({
    env: "LOCAL",
    verbose: 2,
  });
  await stagehand.init();

  try {
    const page = stagehand.context.pages()[0];

    // Navigate to the Browserbase careers page first: the system prompt below
    // interpolates page.url(), so the page must already be loaded for the
    // agent to be told where it really is.
    await page.goto("https://www.browserbase.com/careers");

    // Create a computer use agent
    const agent = stagehand.agent({
      mode: "cua",
      model: {
        modelName: "google/gemini-3-flash-preview",
        apiKey: process.env.GEMINI_API_KEY ?? process.env.GOOGLE_API_KEY,
      },
      systemPrompt: `You are a helpful assistant that can use a web browser.
      You are currently on the following page: ${page.url()}.
      Do not ask follow up questions, the user will trust your judgement. Today's date is ${new Date().toLocaleDateString()}.`,
    });

    // Define the instruction for the CUA
    const instruction =
      "Apply for the first engineer position with mock data. Don't submit the form. You're on the right page";
    console.log(`Instruction: ${chalk.white(instruction)}`);

    // Execute the instruction
    const result = await agent.execute({
      instruction,
      maxSteps: 20,
    });
    // NOTE(review): the 30s pause presumably leaves time to inspect the
    // browser before it is closed — confirm.
    await new Promise((resolve) => setTimeout(resolve, 30000));

    console.log(`${chalk.green("✓")} Execution complete`);
    console.log(`${chalk.yellow("⤷")} Result:`);
    console.log(chalk.white(JSON.stringify(result, null, 2)));
  } catch (error) {
    console.log(`${chalk.red("✗")} Error: ${error}`);
    if (error instanceof Error && error.stack) {
      // Drop the first stack line; it repeats the message printed above.
      console.log(chalk.dim(error.stack.split("\n").slice(1).join("\n")));
    }
  } finally {
    // Close the browser
    await stagehand.close();
  }
}

// Last-resort handler for errors that escape main() (e.g. from init() or close()).
main().catch((error) => {
  console.log(`${chalk.red("✗")} Unhandled error in main function`);
  console.log(chalk.red(error));
  // Report the failure to the shell/CI instead of exiting with status 0.
  process.exitCode = 1;
});


================================================
FILE: packages/core/examples/custom_client_aisdk.ts
================================================
/**
 * This example shows how to use the Vercel AI SDK to power the Stagehand LLM Client.
 *
 * You will need to reference the AI SDK Client in /external_clients/aisdk.ts
 *
 * To learn more about the Vercel AI SDK, see: https://sdk.vercel.ai/docs
 */
import { Stagehand } from "../lib/v3/index.js";
import { AISdkClient } from "./external_clients/aisdk.js";
import { z } from "zod";
import { openai } from "@ai-sdk/openai";

/**
 * Extracts the top Hacker News story and clicks it, using a Stagehand
 * instance whose LLM calls go through the AI SDK client.
 * The Browserbase session is closed even if a step throws.
 */
async function example() {
  const stagehand = new Stagehand({
    env: "BROWSERBASE",
    verbose: 1,
    llmClient: new AISdkClient({
      model: openai("gpt-4o"),
    }),
  });

  await stagehand.init();

  try {
    const page = stagehand.context.pages()[0];

    await page.goto("https://news.ycombinator.com");

    const { story } = await stagehand.extract(
      "extract the title of the top story on the page",
      z.object({
        story: z.string().describe("the top story on the page"),
      }),
    );

    console.log("The top story is:", story);
    await stagehand.act("click the first story");
  } finally {
    // Always release the remote browser session, including on failure.
    await stagehand.close();
  }
}

// Script entry point: run the example as soon as the module loads.
void (async function run() {
  await example();
})();


================================================
FILE: packages/core/examples/custom_client_langchain.ts
================================================
/**
 * This example shows how to use the Langchain client with Stagehand.
 *
 * You will need to reference the Langchain Client in /external_clients/langchain.ts
 */
import { z } from "zod";
import { Stagehand } from "../lib/v3/index.js";
import { LangchainClient } from "./external_clients/langchain.js";
import { ChatOpenAI } from "@langchain/openai";

/**
 * Extracts the top Hacker News story and clicks it, using a Stagehand
 * instance whose LLM calls go through the LangChain client.
 * The Browserbase session is closed even if a step throws.
 */
async function example() {
  const stagehand = new Stagehand({
    env: "BROWSERBASE",
    verbose: 1,
    llmClient: new LangchainClient(
      new ChatOpenAI({
        model: "gpt-4o",
      }),
    ),
  });
  await stagehand.init();

  try {
    const page = stagehand.context.pages()[0];
    await page.goto("https://news.ycombinator.com");
    const { story } = await stagehand.extract(
      "extract the title of the top story on the page",
      z.object({
        story: z.string().describe("the top story on the page"),
      }),
    );
    console.log("The top story is:", story);
    await stagehand.act("click the first story");
  } finally {
    // Always release the remote browser session, including on failure.
    await stagehand.close();
  }
}
// Script entry point: run the example as soon as the module loads.
void (async function run() {
  await example();
})();


================================================
FILE: packages/core/examples/custom_client_openai.ts
================================================
/**
 * This example shows how to use a custom OpenAI client with Stagehand.
 *
 * The OpenAI API provides a simple, type-safe, and composable way to build AI applications.
 *
 * You will need to reference the Custom OpenAI Client in /external_clients/customOpenAI.ts
 */
import { Stagehand } from "../lib/v3/index.js";
import { z } from "zod";
import { CustomOpenAIClient } from "./external_clients/customOpenAI.js";
import OpenAI from "openai";

/**
 * Opens the Hacker News "new" page and extracts three stories, using a
 * Stagehand instance whose LLM calls go through the custom OpenAI client.
 * The Browserbase session is closed even if a step throws.
 */
async function example() {
  const stagehand = new Stagehand({
    env: "BROWSERBASE",
    verbose: 1,
    llmClient: new CustomOpenAIClient({
      modelName: "gpt-4o-mini",
      client: new OpenAI({
        apiKey: process.env.OPENAI_API_KEY,
      }),
    }),
  });
  await stagehand.init();

  try {
    const page = stagehand.context.pages()[0];
    await page.goto("https://news.ycombinator.com");
    await stagehand.act("click on the 'new' link");

    const headlines = await stagehand.extract(
      "Extract the top 3 stories from the Hacker News homepage.",
      z.object({
        stories: z.array(
          z.object({
            title: z.string(),
            url: z.string(),
            points: z.number(),
          }),
        ),
      }),
    );

    console.log(headlines);
  } finally {
    // Always release the remote browser session, including on failure.
    await stagehand.close();
  }
}

// Script entry point: run the example as soon as the module loads.
void (async function run() {
  await example();
})();


================================================
FILE: packages/core/examples/example.ts
================================================
import { Stagehand } from "../lib/v3/index.js";

/**
 * Scratch example: extracts text from inside an iframe on the first page,
 * then opens a second page and drives its form through extract/act/observe,
 * passing the page explicitly to each call.
 *
 * Add your code here!
 */
async function example(stagehand: Stagehand) {
  // First page: read a title out of the embedded iframe.
  const firstPage = stagehand.context.pages()[0];
  await firstPage.goto(
    "https://browserbase.github.io/stagehand-eval-sites/sites/iframe-hn/",
  );
  const firstResult = await stagehand.extract(
    "grab the the first title from inside the iframe",
  );
  console.log(firstResult.extraction);

  // Second page: every call below targets it via the `page` option.
  const secondPage = await stagehand.context.newPage();
  await secondPage.goto(
    "https://browserbase.github.io/stagehand-eval-sites/sites/iframe-same-proc/",
  );
  await stagehand.extract(
    "extract the placeholder text on the your name field",
    { page: secondPage },
  );
  await stagehand.act("fill the your name field with the text 'John Doe'", {
    page: secondPage,
  });

  // Observe first, then replay each suggested action in order.
  const colorSteps = await stagehand.observe(
    "select blue as the favorite color on the dropdown",
    { page: secondPage },
  );
  for (const step of colorSteps) {
    await stagehand.act(step, { page: secondPage, timeout: 30_000 });
  }
}

// Script entry point: build a Browserbase-backed Stagehand, run the example,
// and close the session whether or not the example succeeds.
void (async function run() {
  const session = new Stagehand({
    env: "BROWSERBASE",
    apiKey: process.env.BROWSERBASE_API_KEY,
    projectId: process.env.BROWSERBASE_PROJECT_ID,
    model: {
      modelName: "openai/gpt-5",
      apiKey: process.env.MODEL_API_KEY,
    },
    verbose: 2,
  });

  try {
    await session.init();
    await example(session);
  } finally {
    await session.close();
  }
})();


================================================
FILE: packages/core/examples/external_clients/aisdk.ts
================================================
export { AISdkClient } from "../../lib/v3/external_clients/aisdk.js";


================================================
FILE: packages/core/examples/external_clients/customOpenAI.ts
================================================
export { CustomOpenAIClient } from "../../lib/v3/external_clients/customOpenAI.js";


================================================
FILE: packages/core/examples/external_clients/langchain.ts
================================================
import { BaseChatModel } from "@langchain/core/language_models/chat_models";
import {
  CreateChatCompletionOptions,
  LLMClient,
  AvailableModel,
} from "../../lib/v3/index.js";
import {
  AIMessage,
  BaseMessageLike,
  HumanMessage,
  SystemMessage,
} from "@langchain/core/messages";
import { ChatCompletion } from "openai/resources";
import { toJsonSchema } from "../../lib/v3/zodCompat.js";

/**
 * LLMClient implementation that delegates chat completions to a LangChain
 * `BaseChatModel`.
 */
export class LangchainClient extends LLMClient {
  public type = "langchainClient" as const;
  private model: BaseChatModel;

  /**
   * @param model - LangChain chat model to delegate to. Its `name` is passed
   *   to the base class constructor as the model name.
   */
  constructor(model: BaseChatModel) {
    super(model.name as AvailableModel);
    this.model = model;
  }

  /**
   * Converts the incoming messages to LangChain messages and invokes the model.
   *
   * When `options.response_model` is set, its schema is converted with
   * `toJsonSchema` and the model is invoked through `withStructuredOutput`;
   * otherwise `options.tools` is bound with `bindTools` before invoking.
   *
   * @returns An object `{ data, usage }` cast to `T`, where `data` is the
   *   model response and every `usage` token count is 0.
   */
  async createChatCompletion<T = ChatCompletion>({
    options,
  }: CreateChatCompletionOptions): Promise<T> {
    const formattedMessages: BaseMessageLike[] = options.messages.map(
      (message) => {
        // Multi-part content needs per-role conversion; plain content is passed through below.
        if (Array.isArray(message.content)) {
          if (message.role === "system") {
            // System messages keep only their text parts, joined with newlines;
            // parts without a `text` field contribute an empty string.
            return new SystemMessage(
              message.content
                .map((c) => ("text" in c ? c.text : ""))
                .join("\n"),
            );
          }

          // Re-shape each part: image_url parts become { type: "image", image: <url> },
          // everything else becomes { type: "text", text }.
          const content = message.content.map((content) =>
            "image_url" in content
              ? { type: "image", image: content.image_url.url }
              : { type: "text", text: content.text },
          );

          if (message.role === "user") return new HumanMessage({ content });

          // Remaining roles are sent as an AIMessage with text only:
          // each image part is replaced by the placeholder "[Image]".
          const textOnlyParts = content.map((part) => ({
            type: "text" as const,
            text: part.type === "image" ? "[Image]" : part.text,
          }));

          return new AIMessage({ content: textOnlyParts });
        }

        // Non-array content is forwarded unchanged as a role/content pair.
        return {
          role: message.role,
          content: message.content,
        };
      },
    );

    if (options.response_model) {
      //ref string no longer needed, this is now default behavior
      const responseSchema = toJsonSchema(options.response_model.schema);
      const structuredModel = this.model.withStructuredOutput(responseSchema);
      const response = await structuredModel.invoke(formattedMessages);

      return {
        data: response,
        usage: {
          prompt_tokens: 0, // Langchain doesn't provide token counts by default
          completion_tokens: 0,
          total_tokens: 0,
        },
      } as T;
    }

    // No structured output requested: bind the caller's tools and invoke directly.
    // NOTE(review): options.tools is passed as-is; confirm it is always defined here.
    const modelWithTools = this.model.bindTools(options.tools);
    const response = await modelWithTools.invoke(formattedMessages);

    return {
      data: response,
      usage: {
        prompt_tokens: 0, // Langchain doesn't provide token counts by default
        completion_tokens: 0,
        total_tokens: 0,
      },
    } as T;
  }
}


================================================
FILE: packages/core/examples/form_filling_sensible.ts
================================================
/**
 * This example shows you how to use observe() to get a cacheable Playwright action as JSON, then pass that JSON to act() to perform the action.
 *
 * In this specific example, we use observe() to get multiple actions, then iterate through each action to fill the form with sensitive data at lightning speed.
 */
import { Stagehand } from "../lib/v3/index.js";
import chalk from "chalk";

/**
 * Fills the 1040.com estimate form with locally held values.
 *
 * observe() proposes one action per form field; each action's description is
 * matched against a keyword table to find a standard field name, the matching
 * local value is substituted as the action argument, and the actions are then
 * replayed with act(). The Browserbase session is closed even if a step throws.
 */
async function formFillingSensible() {
  const stagehand = new Stagehand({
    env: "BROWSERBASE",
    verbose: 1,
  });
  await stagehand.init();

  try {
    const page = stagehand.context.pages()[0];

    // Go to the website and wait for it to load
    await page.goto("https://file.1040.com/estimate/", {
      waitUntil: "networkidle",
      timeoutMs: 30000,
    });

    // Observe the form fields with suggested actions
    const observed = await stagehand.observe(
      "fill all the form fields in the page with mock data. In the description include the field name",
    );

    // Print the initial stagehand candidate suggestions
    console.log(
      `${chalk.green("Observe:")} Form fields found:\n${observed
        .map((r) => `${chalk.yellow(r.description)} -> ${chalk.gray(r.selector)}`)
        .join("\n")}`,
    );

    // 1+ keywords per form field, used to standardize field names
    const keywords: { [key: string]: string[] } = {
      age: ["old"],
      dependentsUnder17: ["under age 17", "child", "minor"],
      dependents17to23: ["17-23", "school", "student"],
      wages: ["wages", "W-2 Box 1"],
      federalTax: ["federal tax", "Box 2"],
      stateTax: ["state tax", "Box 17"],
    };

    const escapeRegExp = (text: string): string =>
      text.replace(/[.*+?^${}()|[\]\\]/g, "\\$&");

    // Pre-compile one case-insensitive matcher per term. Both sides are
    // lowercased (String.prototype.includes is case-sensitive, so terms such
    // as "Box 2" could never match a lowercased description). Terms ending in
    // a digit must not be followed by another digit, so "box 1" does not
    // match inside "box 17".
    const matchers = Object.entries(keywords).map(([key, terms]) => ({
      key,
      patterns: terms.map(
        (term) =>
          new RegExp(
            escapeRegExp(term.toLowerCase()) + (/\d$/.test(term) ? "(?!\\d)" : ""),
          ),
      ),
    }));

    // Returns the standard field name for a description, or null if no keyword matches.
    const mapping = (description: string): string | null => {
      const haystack = description.toLowerCase();
      for (const { key, patterns } of matchers) {
        if (patterns.some((pattern) => pattern.test(haystack))) {
          return key;
        }
      }
      return null;
    };

    // Sensitive values to fill in. They are substituted locally into the
    // observed actions rather than being written into the observe() prompt.
    const userInputs: { [key: string]: string } = {
      age: "26",
      dependentsUnder17: "1",
      wages: "54321",
      federalTax: "8345",
      stateTax: "2222",
    };

    // Swap in the local value where a field is recognized; copy instead of
    // mutating the objects returned by observe().
    const updatedFields = observed.map((candidate) => {
      const key = mapping(candidate.description);
      const value = key ? userInputs[key] : undefined;
      return value ? { ...candidate, arguments: [value] } : candidate;
    });

    // List of sensitive-data candidates
    console.log(
      `\n${chalk.green("Sensible Data form inputs:")} Form fields to be filled:\n${updatedFields
        .map(
          (r) =>
            `${chalk.yellow(r.description)} -> ${chalk.blue(r.arguments?.[0] || "no value")}`,
        )
        .join("\n")}`,
    );

    // Fill all the form fields with the updated candidates
    for (const candidate of updatedFields) {
      await stagehand.act(candidate);
    }
  } finally {
    // Always release the remote browser session, including on failure.
    await stagehand.close();
  }
}

// Script entry point: run the form-filling example as soon as the module loads.
void (async function run() {
  await formFillingSensible();
})();


================================================
FILE: packages/core/examples/google_enter.ts
================================================
/**
 * This example shows how to use the Stagehand agent to navigate to Google and search for "Browserbase".
 *
 * It's mainly meant to sanity check using page.act() to press enter, since some LLMs have issues with it.
 */

import { Stagehand } from "../lib/v3/index.js";

/**
 * Opens Google, types "Browserbase" and presses enter through act().
 * The Browserbase session is closed even if a step throws.
 */
async function example() {
  const stagehand = new Stagehand({
    env: "BROWSERBASE",
    verbose: 1,
  });
  await stagehand.init();

  try {
    const page = stagehand.context.pages()[0];
    await page.goto("https://google.com");
    await stagehand.act("type in 'Browserbase'");
    await stagehand.act("press enter");
  } finally {
    // Always release the remote browser session, including on failure.
    await stagehand.close();
  }
}

// Script entry point: run the example as soon as the module loads.
void (async function run() {
  await example();
})();


================================================
FILE: packages/core/examples/instructions.ts
================================================
/**
 * This example shows how to use custom system prompts with Stagehand.
 */
import { Stagehand } from "../lib/v3/index.js";

/**
 * Demonstrates a custom system prompt: the prompt defines a secret trigger
 * phrase and a translate-to-French rule, and two act() calls exercise them
 * on the Browserbase docs site.
 * The Browserbase session is closed even if a step throws.
 */
async function example() {
  const stagehand = new Stagehand({
    env: "BROWSERBASE",
    verbose: 1,
    systemPrompt:
      "if the users says `secret12345`, click on the 'getting started' tab. additionally, if the user says to type something, translate their input into french and type it.",
  });
  await stagehand.init();

  try {
    const page = stagehand.context.pages()[0];
    await page.goto("https://docs.browserbase.com/");

    await stagehand.act("secret12345");

    await stagehand.act("search for 'how to use browserbase'");
  } finally {
    // Always release the remote browser session, including on failure.
    await stagehand.close();
  }
}

// Script entry point: run the example as soon as the module loads.
void (async function run() {
  await example();
})();


================================================
FILE: packages/core/examples/integrations/exa.ts
================================================
import { Stagehand } from "../../lib/v3/index.js";

/**
 * Runs an agent that has the Exa MCP server attached as an integration and
 * asks it to research headphones, then go through a checkout flow in the browser.
 */
async function example(stagehand: Stagehand) {
  const startPage = stagehand.context.pages()[0];
  await startPage.goto("https://www.google.com");

  // The Exa MCP endpoint takes its API key as a query parameter.
  const exaEndpoint = `https://mcp.exa.ai/mcp?exaApiKey=${process.env.EXA_API_KEY}`;

  const researcher = stagehand.agent({
    integrations: [exaEndpoint],
    // Optional: Add custom instructions
    systemPrompt: `You are a helpful assistant that can use a browser as well as external tools such as web search.
    You have access to the Exa search tool to find information on the web.
    When looking for products to buy, make sure to search for current and reliable information.
    Be thorough in your research before making purchase decisions.`,
  });

  const outcome = await researcher.execute(
    "Use one of the tools from Exa to search for the top headphones of 2025. After doing so, use the browser and go through the checkout flow for the best one.",
  );

  console.log(outcome);
}

// Script entry point: create a local Stagehand, run the example, log any
// failure, and close the browser in all cases.
void (async function run() {
  const session = new Stagehand({
    env: "LOCAL",
    model: "openai/gpt-4.1",
    verbose: 1,
    logInferenceToFile: true,
    experimental: true,
  });

  try {
    await session.init();
    await example(session);
  } catch (err) {
    console.error("Error running example:", err);
  } finally {
    await session.close();
  }
})();


================================================
FILE: packages/core/examples/integrations/supabase.ts
================================================
import { connectToMCPServer, Stagehand } from "../../lib/v3/index.js";

/**
 * Connects to the Supabase MCP server, attaches it to an agent as an
 * integration, and asks the agent to search OpenTable and store the first
 * result in a Supabase table.
 */
async function example(stagehand: Stagehand) {
  const startPage = stagehand.context.pages()[0];
  await startPage.goto("https://www.opentable.com/");

  // The Smithery-hosted endpoint takes its API key as a query parameter.
  const supabaseMcp = await connectToMCPServer(
    `https://server.smithery.ai/@supabase-community/supabase-mcp/mcp?api_key=${process.env.SMITHERY_API_KEY}`,
  );

  const assistant = stagehand.agent({
    model: "openai/computer-use-preview",
    integrations: [supabaseMcp],
  });

  const outcome = await assistant.execute(
    "Search for restaurants in New Brunswick, NJ. Then, use the Supabase tools to insert the name of the first result of the search into a table called 'restaurants'.",
  );

  console.log(outcome);
}

// Script entry point: create a local Stagehand, run the example, log any
// failure, and close the browser in all cases.
void (async function run() {
  const session = new Stagehand({
    env: "LOCAL",
    verbose: 1,
  });

  try {
    await session.init();
    await example(session);
  } catch (err) {
    console.error("Error running example:", err);
  } finally {
    await session.close();
  }
})();


================================================
FILE: packages/core/examples/mcp.ts
================================================
// import { Stagehand } from "../lib/v3";
// import StagehandConfig from "@/stagehand.config";
// import chalk from "chalk";
// import { connectToMCPServer } from "../lib/mcp/connection";

// async function main() {
//   console.log(`\n${chalk.bold("Stagehand 🤘 MCP Demo")}\n`);
//   console.log(process.env.NOTION_TOKEN);

//   // Initialize Stagehand
//   const stagehand = new Stagehand({
//     ...StagehandConfig,
//     env: "LOCAL",
//     experimental: true,
//   });
//   await stagehand.init();

//   const notionClient = await connectToMCPServer({
//     command: "npx",
//     args: ["-y", "@notionhq/notion-mcp-server"],
//     env: {
//       NOTION_TOKEN: process.env.NOTION_TOKEN,
//     },
//   });

//   try {
//     const page = stagehand.page;

//     // Create a computer use agent
//     const agent = stagehand.agent({
//       provider: "anthropic",
//       // For Anthropic, use claude-sonnet-4-6 or claude-sonnet-4-5-20250929
//       model: "claude-sonnet-4-6",
//       instructions: `You are a helpful assistant that can use a web browser.
//       You are currently on the following page: ${page.url()}.
//       Do not ask follow up questions, the user will trust your judgement.
//       You have access to the Notion MCP.`,
//       options: {
//         apiKey: process.env.ANTHROPIC_API_KEY,
//       },
//       integrations: [notionClient],
//     });

//     // Navigate to the Browserbase careers page
//     await page.goto("https://www.google.com");

//     // Define the instruction for the CUA
//     const instruction =
//       "Check the Agent Tasks page in notion, read your tasks, perform them and update the notion page with the results.";
//     console.log(`Instruction: ${chalk.white(instruction)}`);

//     // Execute the instruction
//     const result = await agent.execute({
//       instruction,
//       maxSteps: 50,
//     });

//     console.log(`${chalk.green("✓")} Execution complete`);
//     console.log(`${chalk.yellow("⤷")} Result:`);
//     console.log(chalk.white(JSON.stringify(result, null, 2)));
//   } catch (error) {
//     console.log(`${chalk.red("✗")} Error: ${error}`);
//     if (error instanceof Error && error.stack) {
//       console.log(chalk.dim(error.stack.split("\n").slice(1).join("\n")));
//     }
//   } finally {
//     // Close the browser
//     await stagehand.close();
//   }
// }

// main().catch((error) => {
//   console.log(`${chalk.red("✗")} Unhandled error in main function`);
//   console.log(chalk.red(error));
// });


================================================
FILE: packages/core/examples/operator-example.ts
================================================
/**
 * This example shows how to use the Stagehand operator to do simple autonomous tasks.
 *
 * This is built off of our open source project, Open Operator: https://operator.browserbase.com
 *
 * To learn more about Stagehand Agents, see: https://docs.stagehand.dev/concepts/agent
 */
import { Stagehand } from "../lib/v3/index.js";
import chalk from "chalk";

// Load environment variables

/**
 * Runs the operator demo: opens the shadow-DOM eval page in a local browser
 * and lets a default agent carry out a single "click the button" instruction,
 * then prints the result. Errors are logged rather than rethrown.
 */
async function main() {
  console.log(`\n${chalk.bold("Stagehand 🤘 Operator Example")}\n`);

  // Initialize Stagehand
  const session = new Stagehand({
    env: "LOCAL",
    verbose: 2,
    cacheDir: "stagehand-agent-cache",
    logInferenceToFile: false,
  });
  await session.init();

  try {
    const startPage = session.context.pages()[0];
    await startPage.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/shadow-dom/",
    );

    const operator = session.agent();
    const outcome = await operator.execute({
      instruction: "click the button",
      maxSteps: 20,
    });

    console.log(`${chalk.green("✓")} Execution complete`);
    console.log(`${chalk.yellow("⤷")} Result:`);
    console.log(JSON.stringify(outcome, null, 2));
    console.log(chalk.white(outcome.message));
  } catch (err) {
    console.log(`${chalk.red("✗")} Error: ${err}`);
  }
  // NOTE(review): the session is not closed here; the call below is disabled,
  // presumably so the browser stays open for inspection — confirm.
  // await stagehand.close();
}
// Script entry point; the returned promise is intentionally not awaited.
void main();


================================================
FILE: packages/core/examples/oss-cua-example.ts
================================================
/**
 * This example shows how to use a computer use agent (CUA) to navigate a web page and extract data.
 *
 * To learn more about the CUA, see: https://docs.stagehand.dev/examples/computer_use
 *
 * NOTE: YOU MUST CONFIGURE BROWSER DIMENSIONS TO USE COMPUTER USE!
 * Check out stagehand.config.ts for more information.
 */
import { Stagehand } from "../lib/v3/index.js";
import chalk from "chalk";

/**
 * Runs the open-source-model CUA demo: starts a local Stagehand session with
 * a fixed viewport, opens the Browserbase careers page, and lets a
 * computer-use agent fill in (but not submit) a job application. Errors
 * raised while the agent runs are logged, and the browser is always closed.
 */
async function main() {
  console.log(
    `\n${chalk.bold("Stagehand 🤘 Computer Use Agent (CUA) Demo")}\n`,
  );

  // Initialize Stagehand
  const stagehand = new Stagehand({
    env: "LOCAL",
    verbose: 2,
    localBrowserLaunchOptions: {
      viewport: {
        width: 1288,
        height: 711,
      },
      deviceScaleFactor: 1,
    },
  });
  await stagehand.init();

  try {
    const page = stagehand.context.pages()[0];

    // Navigate to the Browserbase careers page first: the system prompt below
    // interpolates page.url(), so the page must already be loaded for the
    // agent to be told where it really is.
    await page.goto("https://www.browserbase.com/careers");

    // Create a computer use agent
    const agent = stagehand.agent({
      mode: "cua",
      model: {
        modelName: "microsoft/fara-7b",
        apiKey: process.env.AZURE_API_KEY,
        baseURL: process.env.AZURE_ENDPOINT,
        /** Alternative model configuration for Fireworks Deployments */
        // modelName: "accounts/...",
        // apiKey: process.env.FIREWORKS_API_KEY,
        // baseURL: "https://api.fireworks.ai/inference/v1",
        // provider: "microsoft", // Important: this routes to the MicrosoftCUAClient
      },
      systemPrompt: `You are a helpful assistant that can use a web browser.
      You are currently on the following page: ${page.url()}.
      Do not ask follow up questions, the user will trust your judgement. Today's date is ${new Date().toLocaleDateString()}. Remember apply buttons are there for a reason.`,
    });

    // Define the instruction for the CUA
    const instruction = `Apply for the first engineer position with mock data on the ${page.url()} page. Don't submit the form.`;
    console.log(`Instruction: ${chalk.white(instruction)}`);

    // Execute the instruction
    const result = await agent.execute({
      instruction,
      maxSteps: 20,
    });
    // NOTE(review): the 30s pause presumably leaves time to inspect the
    // browser before it is closed — confirm.
    await new Promise((resolve) => setTimeout(resolve, 30000));

    console.log(`${chalk.green("✓")} Execution complete`);
    console.log(`${chalk.yellow("⤷")} Result:`);
    console.log(chalk.white(JSON.stringify(result, null, 2)));
  } catch (error) {
    console.log(`${chalk.red("✗")} Error: ${error}`);
    if (error instanceof Error && error.stack) {
      // Drop the first stack line; it repeats the message printed above.
      console.log(chalk.dim(error.stack.split("\n").slice(1).join("\n")));
    }
  } finally {
    // Close the browser
    await stagehand.close();
  }
}

// Last-resort handler for errors that escape main() (e.g. from init() or close()).
main().catch((error) => {
  console.log(`${chalk.red("✗")} Unhandled error in main function`);
  console.log(chalk.red(error));
  // Report the failure to the shell/CI instead of exiting with status 0.
  process.exitCode = 1;
});


================================================
FILE: packages/core/examples/parameterizeApiKey.ts
================================================
import { Stagehand } from "../lib/v3/index.js";
import { z } from "zod";

/**
 * This example shows how to parameterize the API key for the LLM provider.
 *
 * In order to best demonstrate, unset the OPENAI_API_KEY environment variable and
 * set the USE_OPENAI_API_KEY environment variable to your OpenAI API key.
 *
 * export USE_OPENAI_API_KEY=$OPENAI_API_KEY
 * unset OPENAI_API_KEY
 */

/**
 * Opens the Stagehand GitHub repository, clicks through to the contributors
 * and extracts the top one, with the model API key supplied explicitly from
 * USE_OPENAI_API_KEY. The browser is closed even if a step throws.
 */
async function example() {
  const stagehand = new Stagehand({
    env: "LOCAL",
    verbose: 1,
    model: {
      modelName: "gpt-4o",
      apiKey: process.env.USE_OPENAI_API_KEY,
    },
  });

  await stagehand.init();

  try {
    const page = stagehand.context.pages()[0];
    await page.goto("https://github.com/browserbase/stagehand");
    await stagehand.act("click on the contributors");
    const contributor = await stagehand.extract(
      "extract the top contributor",
      z.object({
        username: z.string(),
        url: z.string(),
      }),
    );
    console.log(`Our favorite contributor is ${contributor.username}`);
  } finally {
    // Close the browser so the local session is not left running.
    await stagehand.close();
  }
}

// Script entry point: run the example as soon as the module loads.
void (async function run() {
  await example();
})();


================================================
FILE: packages/core/examples/persist_logs_example.ts
================================================
/**
 * Example: Run a Stagehand agent and persist structured logging events to a user-specified dir.
 */
import path from "node:path";
import { Stagehand } from "../lib/v3/index.js";

/**
 * Runs a short agent task in a local browser after setting
 * BROWSERBASE_CONFIG_DIR to <cwd>/examples/logs. The browser is closed
 * whether or not the task succeeds.
 */
async function main() {
  // Set the config directory before the Stagehand instance is constructed.
  process.env.BROWSERBASE_CONFIG_DIR = path.resolve(
    process.cwd(),
    "examples",
    "logs",
  );

  const session = new Stagehand({
    env: "LOCAL",
    verbose: 1,
  });
  await session.init();

  try {
    const startPage = session.context.pages()[0];
    await startPage.goto("https://www.google.com");

    const searcher = session.agent();
    await searcher.execute({
      instruction:
        "Search for Browserbase and stop after the results are visible.",
      maxSteps: 10,
    });
  } finally {
    // All logs can be found at logs/sessions/$SESSION_ID/session.json, or agent_events.log etc
    await session.close();
  }
}

// Surface any failure from main() and mark the process as failed.
main().catch((err) => {
  process.exitCode = 1;
  console.error(err);
});


================================================
FILE: packages/core/examples/tsconfig.json
================================================
{
  "extends": "../tsconfig.json",
  "include": ["*.ts"],
  "exclude": ["node_modules"]
}


================================================
FILE: packages/core/examples/v3/cuaReplay.ts
================================================
import { Stagehand } from "../../lib/v3/index.js";
import { v3Logger } from "../../lib/v3/logger.js";

/**
 * Runs the login demo once against Browserbase and reports how long it took.
 *
 * @param runNumber - 1 is logged as the cache-building run; any other value
 *   is logged as a cache-using run.
 * @returns The elapsed seconds (measured from function entry until
 *   `agent.execute` resolves), the agent's `success` flag, and the full
 *   agent result.
 */
async function runDemo(runNumber: number) {
  const startTime = Date.now();

  v3Logger({
    level: 1,
    category: "demo",
    message: `RUN ${runNumber}: ${runNumber === 1 ? "BUILDING CACHE" : "USING CACHE"}`,
  });

  const stagehand = new Stagehand({
    env: "BROWSERBASE",
    disableAPI: false,
    verbose: 1,
    cacheDir: "cua-agent-cache",
  });

  await stagehand.init();

  try {
    const page = stagehand.context.pages()[0];

    await page.goto("https://v0-modern-login-flow.vercel.app/", {
      waitUntil: "networkidle",
    });

    const agent = stagehand.agent({
      mode: "cua",
      model: {
        modelName: "anthropic/claude-sonnet-4-20250514",
        apiKey: process.env.ANTHROPIC_API_KEY!,
      },
    });

    const result = await agent.execute({
      instruction: `Sign in with the email address 'test@browserbaser.com' and the password 'stagehand=goated'`,
      maxSteps: 20,
    });

    // Stop the clock before teardown so close() time is not counted.
    const duration = (Date.now() - startTime) / 1000;

    return {
      duration,
      success: result.success,
      result,
    };
  } finally {
    // Always close the session, even when navigation or the agent throws.
    await stagehand.close();
  }
}

/**
 * Runs the demo twice (run 1, a 2-second pause, then run 2) and logs a
 * table comparing the two durations.
 */
async function main() {
  const coldRun = await runDemo(1);

  v3Logger({
    level: 1,
    category: "demo",
    message: "⏳ Waiting 2 seconds before cached run...",
  });
  await new Promise((resolve) => setTimeout(resolve, 2000));

  v3Logger({
    level: 1,
    category: "demo",
    message: "Starting second run with cache...",
  });
  const cachedRun = await runDemo(2);

  // Pre-format every value that is interpolated into the report below.
  const coldCell = `${coldRun.duration.toFixed(2)}s`.padEnd(16);
  const cachedCell = `${cachedRun.duration.toFixed(2)}s`.padEnd(16);
  const speedupPct = (
    (1 - cachedRun.duration / coldRun.duration) *
    100
  ).toFixed(1);
  const secondsSaved = (coldRun.duration - cachedRun.duration).toFixed(2);

  v3Logger({
    level: 1,
    category: "demo",
    message: `
╔════════════════════════════════════════════════════════════╗
║                  📊 PERFORMANCE COMPARISON                 ║
╚════════════════════════════════════════════════════════════╝

┌─────────────────────┬──────────────────┬──────────────────┐
│     Metric          │   Run 1 (Cold)   │  Run 2 (Cached)  │
├─────────────────────┼──────────────────┼──────────────────┤
│ Duration            │ ${coldCell} │ ${cachedCell} │
└─────────────────────┴──────────────────┴──────────────────┘

 Performance Comparison:
   • Speed: ${speedupPct}% faster with cache
   • Time saved: ${secondsSaved} seconds

 Insights:
   • First run establishes the CUA action cache
   • Second run reuses cached actions for instant execution
   • Zero LLM tokens used on cached run`,
  });
}

// Log the failure and mark the process as failed, so a crashed demo does not
// exit with status 0.
main().catch((error: unknown) => {
  console.error(error);
  process.exitCode = 1;
});


================================================
FILE: packages/core/examples/v3/deepLocator.ts
================================================
import { Stagehand } from "../../lib/v3/index.js";

/**
 * Fills two form inputs, each addressed by a single deep XPath that passes
 * through a shadow host and an iframe.
 */
async function example(stagehand: Stagehand) {
  const [page] = stagehand.context.pages();
  await page.goto(
    "https://browserbase.github.io/stagehand-eval-sites/sites/oopif-in-closed-shadow-dom/",
  );

  // crossing OOPIF & shadow root boundaries with deep locator
  const fills = [
    [
      "/html/body/shadow-host//section/iframe/html/body/main/section[1]/form/div/div[1]/input",
      "nunya",
    ],
    [
      "/html/body/shadow-host//section/iframe/html/body/main/section[1]/form/div/div[2]/input",
      "business",
    ],
  ] as const;

  // Fill sequentially, in the listed order.
  for (const [xpath, value] of fills) {
    await page.deepLocator(xpath).fill(value);
  }
}

/** Entry point: start a local Stagehand instance and run the example. */
async function run(): Promise<void> {
  const stagehand = new Stagehand({
    env: "LOCAL",
    verbose: 0,
    model: "openai/gpt-4.1",
  });

  await stagehand.init();
  await example(stagehand);
}

void run();


================================================
FILE: packages/core/examples/v3/dropdown.ts
================================================
import { Stagehand } from "../../lib/v3/index.js";

/**
 * Issues one `act()` call against the scroll-dropdown test page and prints
 * every action contained in the result.
 */
async function example(stagehand: Stagehand) {
  const [page] = stagehand.context.pages();
  await page.goto(
    "https://browserbase.github.io/stagehand-eval-sites/sites/scroll-dropdown/",
  );

  const { actions } = await stagehand.act(
    "choose 'Peach' from the favorite colour dropdown",
  );

  console.log(
    `\n\nThis act() call took ${actions.length} steps. Here are the actions:`,
  );

  actions.forEach((action) => {
    console.log(`\naction: `, action);
  });
}

/** Entry point: start a local Stagehand instance and run the example. */
async function run(): Promise<void> {
  const stagehand = new Stagehand({
    env: "LOCAL",
    verbose: 0,
    model: "google/gemini-2.5-flash",
  });

  await stagehand.init();
  await example(stagehand);
}

void run();


================================================
FILE: packages/core/examples/v3/highlight.ts
================================================
import { Stagehand } from "../../lib/v3/index.js";

/**
 * Highlights a button in red for 20 seconds, locating it with a deep XPath
 * that passes through an iframe and a `shadow-demo` element.
 */
async function example(stagehand: Stagehand) {
  const [page] = stagehand.context.pages();
  await page.goto(
    "https://browserbase.github.io/stagehand-eval-sites/sites/closed-shadow-root-in-oopif/",
  );

  const button = page.deepLocator(
    "xpath=/html/body/main/section/iframe/html/body/shadow-demo//div/button",
  );
  const red = { r: 255, g: 0, b: 0 };

  await button.highlight({ durationMs: 20000, contentColor: red });
}

/** Entry point: start a local Stagehand instance and run the example. */
async function run(): Promise<void> {
  const stagehand = new Stagehand({
    env: "LOCAL",
    verbose: 0,
    model: "google/gemini-2.5-flash",
  });

  await stagehand.init();
  await example(stagehand);
}

void run();


================================================
FILE: packages/core/examples/v3/patchright.ts
================================================
import { Stagehand } from "../../lib/v3/index.js";
import { chromium } from "patchright-core";
import { z } from "zod";

/**
 * Attaches Patchright to the Stagehand browser over CDP, navigates with the
 * Patchright page, then runs `act` and `extract` through Stagehand.
 */
async function example(stagehand: Stagehand) {
  const cdpBrowser = await chromium.connectOverCDP({
    wsEndpoint: stagehand.connectURL(),
  });

  const [defaultContext] = cdpBrowser.contexts();
  const [issuePage] = defaultContext.pages();
  await issuePage.goto("https://github.com/microsoft/playwright/issues/30261");

  // Hand the Patchright page to Stagehand explicitly for this action.
  await stagehand.act("scroll to the bottom of the page", { page: issuePage });

  // page arg not required
  const reason = await stagehand.extract(
    "extract the reason why playwright doesn't expose frame IDs",
    z.string(),
  );
  console.log(reason);
}

/** Entry point: start a local Stagehand instance and run the example. */
async function run(): Promise<void> {
  const stagehand = new Stagehand({
    env: "LOCAL",
    verbose: 0,
    model: "openai/gpt-4.1",
  });

  await stagehand.init();
  await example(stagehand);
}

void run();


================================================
FILE: packages/core/examples/v3/playwright.ts
================================================
import { Stagehand } from "../../lib/v3/index.js";
import { chromium } from "playwright-core";
import { z } from "zod";

/**
 * Opens two docs pages through Playwright (attached over CDP) and runs one
 * Stagehand extraction per page concurrently.
 */
async function example(stagehand: Stagehand) {
  const browser = await chromium.connectOverCDP({
    wsEndpoint: stagehand.connectURL(),
  });
  const [context] = browser.contexts();

  const [introPage] = context.pages();
  await introPage.goto("https://docs.stagehand.dev/first-steps/introduction");

  const observabilityPage = await context.newPage();
  await observabilityPage.goto(
    "https://docs.stagehand.dev/configuration/observability",
  );

  // Start both extractions before awaiting either, so they run in parallel.
  const primitivesJob = stagehand.extract(
    "extract the names of the four stagehand primitives",
    z.array(z.string()),
    { page: introPage },
  );
  const featuresJob = stagehand.extract(
    "extract the list of session dashboard features",
    z.array(z.string()),
    { page: observabilityPage },
  );
  const [primitives, features] = await Promise.all([
    primitivesJob,
    featuresJob,
  ]);

  console.log(primitives);
  console.log(features);
}

// Entry point: start a Browserbase-backed Stagehand instance, run the
// example, and always close the session afterwards so it is not left running
// when the example finishes or throws.
(async () => {
  const stagehand = new Stagehand({
    env: "BROWSERBASE",
    verbose: 1,
    model: "openai/gpt-4.1",
  });
  await stagehand.init();
  try {
    await example(stagehand);
  } finally {
    await stagehand.close();
  }
})();


================================================
FILE: packages/core/examples/v3/puppeteer.ts
================================================
import { Stagehand } from "../../lib/v3/index.js";
import puppeteer from "puppeteer-core";

/**
 * Attaches Puppeteer to the Stagehand browser, asks Stagehand to observe the
 * "next page" button on the Puppeteer page, and acts on the first suggestion.
 */
async function example(stagehand: Stagehand) {
  const browser = await puppeteer.connect({
    browserWSEndpoint: stagehand.connectURL(),
    defaultViewport: null,
  });

  const [ppPage] = await browser.pages();
  await ppPage.goto("https://www.browserbase.com/blog");

  const [nextPageAction] = await stagehand.observe(
    "find the next page button",
    { page: ppPage },
  );

  await stagehand.act(nextPageAction);
}

/** Entry point: start a local Stagehand instance and run the example. */
async function run(): Promise<void> {
  const stagehand = new Stagehand({
    env: "LOCAL",
    verbose: 0,
    model: "openai/gpt-4.1",
  });

  await stagehand.init();
  await example(stagehand);
}

void run();


================================================
FILE: packages/core/examples/v3/recordVideo.ts
================================================
import path from "node:path";
import { mkdir } from "node:fs/promises";
import { Stagehand } from "../../lib/v3/index.js";
import { chromium } from "playwright-core";
import { z } from "zod";

/**
 * Records a Playwright video of a short Stagehand session.
 *
 * Creates a video-recording browser context (1280x720, saved under
 * `<cwd>/artifacts/stagehand-videos`), runs one `act` and one `extract`,
 * closes the context, and prints where the video was written.
 */
async function recordPlaywrightVideo(stagehand: Stagehand): Promise<void> {
  const browser = await chromium.connectOverCDP({
    wsEndpoint: stagehand.connectURL(),
  });

  const outputDir = path.resolve(
    process.cwd(),
    "artifacts",
    "stagehand-videos",
  );
  await mkdir(outputDir, { recursive: true });

  const recordVideo = {
    dir: outputDir,
    size: { width: 1280, height: 720 },
  };
  const context = await browser.newContext({ recordVideo });

  const page = await context.newPage();
  await page.goto("https://docs.stagehand.dev/first-steps/quickstart", {
    waitUntil: "domcontentloaded",
  });

  await stagehand.act("click the introduction div in the first steps section");

  const extraction = await stagehand.extract(
    "list the four Stagehand primitives that are described on the page",
    z.object({
      primitives: z.array(z.string()),
    }),
    { page },
  );

  console.log("Stagehand primitives:", extraction.primitives.join(", "));

  // Grab the video handle first; its path is read only after the context closes.
  const video = page.video();
  await context.close();

  if (!video) {
    console.log("Video recording was not enabled for this context.");
    return;
  }

  const savedTo = await video.path();
  console.log(`Playwright saved the video to ${savedTo}`);
}

/**
 * Entry point: start a local Stagehand instance, record the video, and close
 * Stagehand afterwards. Errors from `close()` are deliberately ignored.
 */
async function run(): Promise<void> {
  const stagehand = new Stagehand({
    env: "LOCAL",
    verbose: 1,
    model: "google/gemini-2.5-flash",
  });

  try {
    await stagehand.init();
    await recordPlaywrightVideo(stagehand);
  } finally {
    await stagehand.close().catch(() => {});
  }
}

void run();


================================================
FILE: packages/core/examples/v3/returnXpath.ts
================================================
import { Stagehand } from "../../lib/v3/index.js";

/**
 * Clicks at fixed page coordinates, asks for the XPath of what was clicked,
 * and then fills that element through a deep locator.
 */
async function example(stagehand: Stagehand) {
  const [page] = stagehand.context.pages();
  await page.goto(
    "https://browserbase.github.io/stagehand-eval-sites/sites/oopif-in-closed-shadow-dom/",
  );

  const clickedXpath = await page.click(286, 628, { returnXpath: true });

  // use the xpath that was returned from our coordinate click
  const target = page.deepLocator(clickedXpath);
  await target.fill("hellooooooooo");
}

/** Entry point: start a local Stagehand instance and run the example. */
async function run(): Promise<void> {
  const stagehand = new Stagehand({
    env: "LOCAL",
    verbose: 0,
    model: "openai/gpt-4.1",
  });

  await stagehand.init();
  await example(stagehand);
}

void run();


================================================
FILE: packages/core/examples/v3/shadowRoot.ts
================================================
import { Stagehand } from "../../lib/v3/index.js";

/**
 * Clicks the same button twice, first via an XPath and then (after a
 * reload) via a CSS selector, pausing 3 seconds after the first click and
 * after the reload.
 */
async function example(stagehand: Stagehand) {
  const pause = (ms: number) =>
    new Promise((resolve) => setTimeout(resolve, ms));

  const [page] = stagehand.context.pages();
  await page.goto(
    "https://browserbase.github.io/stagehand-eval-sites/sites/shadow-dom-closed/",
  );

  // clicking in closed mode shadow root with an xpath
  const byXpath = page.locator("/html/body/shadow-demo//div/button");
  await byXpath.click();
  await pause(3000);

  await page.reload();
  await pause(3000);

  // clicking in closed mode shadow root with css selector
  const byCss = page.locator("div > button");
  await byCss.click();
}

/** Entry point: start a local Stagehand instance and run the example. */
async function run(): Promise<void> {
  const stagehand = new Stagehand({
    env: "LOCAL",
    verbose: 0,
    model: "openai/gpt-4.1",
  });

  await stagehand.init();
  await example(stagehand);
}

void run();


================================================
FILE: packages/core/examples/v3/targetedExtract.ts
================================================
import { Stagehand } from "../../lib/v3/index.js";
import { z } from "zod";

/**
 * Highlights a paragraph inside an iframe for 5 seconds, then runs an
 * extraction scoped to a specific element via the `selector` option.
 */
async function example(stagehand: Stagehand) {
  const [page] = stagehand.context.pages();
  await page.goto(
    "https://ambarc.github.io/web-element-test/stagehand-breaking-test.html",
  );

  const paragraph = page.deepLocator(
    "/html/body/div[2]/div[3]/iframe/html/body/p",
  );
  await paragraph.highlight({
    durationMs: 5000,
    contentColor: { r: 255, g: 0, b: 0 },
  });

  // selector: "// body > div.test-container > div:nth-child(3) > iframe >> body > p:nth-child(3)",
  const scope = { selector: "/html/body/div[2]/div[3]/iframe/html/body/p[2]" };
  const reason = await stagehand.extract(
    "extract the reason why script injection fails",
    z.string(),
    scope,
  );
  console.log(reason);
}

/**
 * Entry point: start a local Stagehand instance (with inference logging to
 * file enabled) and run the example.
 */
async function run(): Promise<void> {
  const stagehand = new Stagehand({
    env: "LOCAL",
    verbose: 0,
    model: "openai/gpt-4.1",
    logInferenceToFile: true,
  });

  await stagehand.init();
  await example(stagehand);
}

void run();


================================================
FILE: packages/core/examples/v3/v3_agent.ts
================================================
import chalk from "chalk";
import { V3 } from "../../lib/v3/index.js";

const INSTRUCTION = "scroll down and click on the last hn story";

/**
 * Runs a non-CUA agent against the iframe-hn test page and prints the
 * result. Any error raised after init is caught and printed, not rethrown.
 */
async function main() {
  console.log(`\n${chalk.bold("Stagehand V3 🤘 Operator Example")}\n`);

  // Initialize Stagehand
  const v3 = new V3({ env: "LOCAL", verbose: 2 });
  await v3.init();

  try {
    const [startPage] = v3.context.pages();
    await startPage.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/iframe-hn/",
    );

    // Alternative configuration kept from the original example:
    // {
    //   model: "computer-use-preview-2025-03-11",
    //   provider: "openai",
    // }
    const agent = v3.agent({
      cua: false,
      model: "google/gemini-2.0-flash",
      executionModel: "google/gemini-2.0-flash",
    });

    // Execute the agent
    console.log(`${chalk.cyan("↳")} Instruction: ${INSTRUCTION}`);
    const outcome = await agent.execute({
      instruction: INSTRUCTION,
      maxSteps: 20,
    });

    console.log(`${chalk.green("✓")} Execution complete`);
    console.log(`${chalk.yellow("⤷")} Result:`);
    console.log(JSON.stringify(outcome, null, 2));
    console.log(chalk.white(outcome.message));
  } catch (error) {
    console.log(`${chalk.red("✗")} Error: ${error}`);
  }

  // NOTE(review): the instance is never closed; the call below is disabled in
  // this example. Confirm that is intentional.
  // await v3.close();
}

// Fire-and-forget entry point; main() reports its own errors after init.
void main();


================================================
FILE: packages/core/examples/v3_example.ts
================================================
import { V3 } from "../lib/v3/index.js";
import { z } from "zod";

/**
 * Loads an apartments.com search page and extracts every listing's price
 * and address, then prints the listings and their count.
 */
async function example(v3: V3) {
  const [page] = v3.context.pages();
  await page.goto("https://www.apartments.com/san-francisco-ca/2-bedrooms/", {
    waitUntil: "load",
  });

  // Shape of a single listing in the extraction result.
  const listingSchema = z.object({
    price: z.string().describe("The price of the listing"),
    address: z.string().describe("The address of the listing"),
  });

  const { listings } = await v3.extract(
    "Extract all the apartment listings with their prices and their addresses.",
    z.object({
      listings: z.array(listingSchema),
    }),
  );

  console.log(listings);
  console.log(`found ${listings.length} listings`);
}

/**
 * Entry point: start a local V3 instance with an extract cache directory
 * and run the example.
 */
async function run(): Promise<void> {
  const v3 = new V3({
    env: "LOCAL",
    verbose: 2,
    logInferenceToFile: false,
    model: "google/gemini-2.0-flash",
    cacheDir: "stagehand-extract-cache",
  });

  await v3.init();
  await example(v3);
}

void run();


================================================
FILE: packages/core/examples/wordle.ts
================================================
import { Stagehand } from "../lib/v3/index.js";

/**
 * Opens Wordle in a Browserbase session, dismisses the intro dialogs, and
 * submits the guess "WORDS" one key press at a time.
 *
 * The session is closed in a `finally` block so that a failing `act` call
 * does not leave it running.
 */
async function example() {
  const stagehand = new Stagehand({
    env: "BROWSERBASE",
    verbose: 1,
  });
  await stagehand.init();

  try {
    const page = stagehand.context.pages()[0];
    await page.goto("https://www.nytimes.com/games/wordle/index.html");
    await stagehand.act("click 'Continue'");
    await stagehand.act("click 'Play'");
    await stagehand.act("click cross sign on top right of 'How To Play' card");
    const word = "WORDS";
    // Key presses must happen in order, so await each one before the next.
    for (const letter of word) {
      await stagehand.act(`press ${letter}`);
    }
    await stagehand.act("press enter");
  } finally {
    await stagehand.close();
  }
}

/** Entry point: run the Wordle example. */
async function run(): Promise<void> {
  await example();
}

void run();


================================================
FILE: packages/core/lib/CHANGELOG.md
================================================
# @browserbasehq/stagehand-lib

## 2.4.1

### Patch Changes

- [#1027](https://github.com/browserbase/stagehand/pull/1027) [`455b61f`](https://github.com/browserbase/stagehand/commit/455b61fb6f7a34ae50d7e7c76c1d639241e213d6) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - Fixed small issue with module-level state guard for the Playwright selectors.register call

## 2.4.0

### Minor Changes

- [#778](https://github.com/browserbase/stagehand/pull/778) [`df570b6`](https://github.com/browserbase/stagehand/commit/df570b67e46febcaf7282ffb65dd5707e2808152) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - iframe support

### Patch Changes

- [#809](https://github.com/browserbase/stagehand/pull/809) [`03ebebc`](https://github.com/browserbase/stagehand/commit/03ebebc0317f92d8de77285cc2e66dc0131fe9fe) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - log NoObjectGenerated error details

- [#801](https://github.com/browserbase/stagehand/pull/801) [`1d4f0ab`](https://github.com/browserbase/stagehand/commit/1d4f0abca47bf47ae8b7aeb53f3cd1155a7e5448) Thanks [@miguelg719](https://github.com/miguelg719)! - Default use API to true

- [#798](https://github.com/browserbase/stagehand/pull/798) [`d86200b`](https://github.com/browserbase/stagehand/commit/d86200bd5bde4c5ba113ca89e28ab86c14a8304e) Thanks [@miguelg719](https://github.com/miguelg719)! - Fix pino logging memory leak by reusing worker

## 2.3.0

### Minor Changes

- [#731](https://github.com/browserbase/stagehand/pull/731) [`393c8e0`](https://github.com/browserbase/stagehand/commit/393c8e05d016086e481c0043ee6b084c61886cad) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - make extract() with no arguments return the hybrid tree instead of text-rendered webpage

- [#737](https://github.com/browserbase/stagehand/pull/737) [`6ef6073`](https://github.com/browserbase/stagehand/commit/6ef60730cab0ad9025f44b6eeb2c83751d1dcd35) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - deprecate useTextExtract and remove functionality

### Patch Changes

- [#741](https://github.com/browserbase/stagehand/pull/741) [`5680d25`](https://github.com/browserbase/stagehand/commit/5680d2509352c383ad502c9f4fabde01fa638833) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - use `safeParse` for zod validation

- [#740](https://github.com/browserbase/stagehand/pull/740) [`28840a7`](https://github.com/browserbase/stagehand/commit/28840a7d3fec89a490984582fb37fa3d007c0349) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - don't log deprecation warning when onlyVisible is undefined

- [#755](https://github.com/browserbase/stagehand/pull/755) [`ba687ab`](https://github.com/browserbase/stagehand/commit/ba687abdfb598f839ddfec0442d3d7b6b696b0a3) Thanks [@miguelg719](https://github.com/miguelg719)! - Fix context init error on undefined context

- [#789](https://github.com/browserbase/stagehand/pull/789) [`c5ff8ce`](https://github.com/browserbase/stagehand/commit/c5ff8ce2d7467b70a450ca52bc3e03b15280ce1b) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - fix noisy useTextExtract deprecation log

- [#757](https://github.com/browserbase/stagehand/pull/757) [`628e534`](https://github.com/browserbase/stagehand/commit/628e534ea6d7ca081bad6c32167c7d53d4772eed) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - optimize CDP calls when building hybrid tree

- [#772](https://github.com/browserbase/stagehand/pull/772) [`64d331d`](https://github.com/browserbase/stagehand/commit/64d331dc2eba86675a8b148d361897f55f170703) Thanks [@miguelg719](https://github.com/miguelg719)! - Fixes an issue with the new tab intercepts for invalid urls

- [#770](https://github.com/browserbase/stagehand/pull/770) [`d312a43`](https://github.com/browserbase/stagehand/commit/d312a43672fe2865abcf184a712a759a12f5b9d1) Thanks [@miguelg719](https://github.com/miguelg719)! - Removed default chromium flags that delay browser launching

- [#753](https://github.com/browserbase/stagehand/pull/753) [`fbca400`](https://github.com/browserbase/stagehand/commit/fbca4003a547dc5eee0c0be5edc5e98c1f4d8c22) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - fix `stagehand.history`

- [#745](https://github.com/browserbase/stagehand/pull/745) [`c54afab`](https://github.com/browserbase/stagehand/commit/c54afab0e43a2144eecbc56df7f33c5e444ceed5) Thanks [@miguelg719](https://github.com/miguelg719)! - Add an identifier for client language/runtime

- [#768](https://github.com/browserbase/stagehand/pull/768) [`58b06eb`](https://github.com/browserbase/stagehand/commit/58b06eb2fdfb1a9cd84c03f46655ab0ea00ee07f) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - fix: page.evaluate: Execution context was destroyed, most likely because of a navigation

- [#758](https://github.com/browserbase/stagehand/pull/758) [`98e1356`](https://github.com/browserbase/stagehand/commit/98e13566846a547003e4c9aebbe4f95eff653bba) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - rm unused functions

- [#781](https://github.com/browserbase/stagehand/pull/781) [`8d239ce`](https://github.com/browserbase/stagehand/commit/8d239cec7a835d35243b2b00c3c00c1b66c05b5e) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - fix variable parsing issue with gpt-4.1

- [#761](https://github.com/browserbase/stagehand/pull/761) [`e1f7074`](https://github.com/browserbase/stagehand/commit/e1f7074be23c82ae897386d5e5e132ff8cb4120a) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - build xpaths on node side instead of using injected JS

## 2.2.1

### Patch Changes

- [#729](https://github.com/browserbase/stagehand/pull/729) [`fc24f84`](https://github.com/browserbase/stagehand/commit/fc24f848ee0f300182e88993dfe8d68025d69fcb) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - fix "failed to inject helper scripts" log on stagehand.close()


================================================
FILE: packages/core/lib/inference.ts
================================================
import { z } from "zod";
import { LogLine } from "./v3/types/public/logs.js";
import { ChatMessage, LLMClient } from "./v3/llm/LLMClient.js";
import { getEnvTimeoutMs, withTimeout } from "./v3/timeoutConfig.js";
import {
  buildActSystemPrompt,
  buildExtractSystemPrompt,
  buildExtractUserPrompt,
  buildMetadataPrompt,
  buildMetadataSystemPrompt,
  buildObserveSystemPrompt,
  buildObserveUserMessage,
} from "./prompt.js";
import { appendSummary, writeTimestampedTxtFile } from "./inferenceLogUtils.js";
import type {
  InferStagehandSchema,
  StagehandZodObject,
} from "./v3/zodCompat.js";
import { SupportedUnderstudyAction } from "./v3/types/private/handlers.js";

// Re-export for backward compatibility
export type { LLMParsedResponse, LLMUsage } from "./v3/llm/LLMClient.js";

/**
 * Applies the timeout read from the "LLM_MAX_MS" setting to a pending LLM call.
 *
 * @param promise - the in-flight LLM request
 * @param operation - short name of the call; passed to `withTimeout` as
 *   `LLM <operation>`
 * @returns whatever `withTimeout` returns for the wrapped promise
 */
function withLlmTimeout<T>(promise: Promise<T>, operation: string): Promise<T> {
  const timeoutMs = getEnvTimeoutMs("LLM_MAX_MS");
  const label = `LLM ${operation}`;
  return withTimeout(promise, timeoutMs, label);
}

/**
 * Runs a two-step LLM extraction over a DOM representation.
 *
 * Step 1 asks the model to produce data matching `schema`. Step 2 sends the
 * instruction and the extracted data back to the model and asks for
 * `progress` / `completed` metadata. Both calls go through `withLlmTimeout`.
 *
 * When `logInferenceToFile` is true, the messages and response of each call
 * are written with `writeTimestampedTxtFile` and a per-call summary entry is
 * appended with `appendSummary`.
 *
 * @param instruction - what to extract
 * @param domElements - string form of the page content handed to the prompt builder
 * @param schema - schema the extraction response must follow
 * @param llmClient - client used for both chat completions
 * @param logger - passed through to `createChatCompletion`
 * @param userProvidedInstructions - optional extra instructions for the system prompt
 * @param logInferenceToFile - enable file logging of calls/responses (default false)
 * @returns the extracted data spread at the top level, plus `metadata`
 *   (`completed`, `progress`), token counts summed over both calls, and the
 *   summed inference time in milliseconds
 */
export async function extract<T extends StagehandZodObject>({
  instruction,
  domElements,
  schema,
  llmClient,
  logger,
  userProvidedInstructions,
  logInferenceToFile = false,
}: {
  instruction: string;
  domElements: string;
  schema: T;
  llmClient: LLMClient;
  userProvidedInstructions?: string;
  logger: (message: LogLine) => void;
  logInferenceToFile?: boolean;
}) {
  // Schema for the second ("metadata") call.
  const metadataSchema = z.object({
    progress: z
      .string()
      .describe(
        "progress of what has been extracted so far, as concise as possible",
      ),
    completed: z
      .boolean()
      .describe(
        "true if the goal is now accomplished. Use this conservatively, only when sure that the goal has been completed.",
      ),
  });

  type ExtractionResponse = InferStagehandSchema<T>;
  type MetadataResponse = z.infer<typeof metadataSchema>;

  const isUsingAnthropic = llmClient.type === "anthropic";
  const isGPT5 = llmClient.modelName.includes("gpt-5"); // TODO: remove this as we update support for gpt-5 configuration options

  const extractCallMessages: ChatMessage[] = [
    buildExtractSystemPrompt(isUsingAnthropic, userProvidedInstructions),
    buildExtractUserPrompt(instruction, domElements, isUsingAnthropic),
  ];

  // Log the outgoing extraction request; keep file name and timestamp for the summary entry.
  let extractCallFile = "";
  let extractCallTimestamp = "";
  if (logInferenceToFile) {
    const { fileName, timestamp } = writeTimestampedTxtFile(
      "extract_summary",
      "extract_call",
      {
        modelCall: "extract",
        messages: extractCallMessages,
      },
    );
    extractCallFile = fileName;
    extractCallTimestamp = timestamp;
  }

  // Call 1: the extraction itself, timed for the inference_time_ms figures.
  const extractStartTime = Date.now();
  const extractionResponse = await withLlmTimeout(
    llmClient.createChatCompletion<ExtractionResponse>({
      options: {
        messages: extractCallMessages,
        response_model: {
          schema,
          name: "Extraction",
        },
        // Models whose name contains "gpt-5" get temperature 1; all others 0.1.
        temperature: isGPT5 ? 1 : 0.1,
        top_p: 1,
        frequency_penalty: 0,
        presence_penalty: 0,
      },
      logger,
    }),
    "extract",
  );
  const extractEndTime = Date.now();

  const { data: extractedData, usage: extractUsage } = extractionResponse;

  // Only assigned (and only read) inside the logging branch below.
  let extractResponseFile: string;
  if (logInferenceToFile) {
    const { fileName } = writeTimestampedTxtFile(
      "extract_summary",
      "extract_response",
      {
        modelResponse: "extract",
        rawResponse: extractedData,
      },
    );
    extractResponseFile = fileName;

    // Missing usage fields are recorded as 0.
    appendSummary("extract", {
      extract_inference_type: "extract",
      timestamp: extractCallTimestamp,
      LLM_input_file: extractCallFile,
      LLM_output_file: extractResponseFile,
      prompt_tokens: extractUsage?.prompt_tokens ?? 0,
      completion_tokens: extractUsage?.completion_tokens ?? 0,
      reasoning_tokens: extractUsage?.reasoning_tokens ?? 0,
      cached_input_tokens: extractUsage?.cached_input_tokens ?? 0,
      inference_time_ms: extractEndTime - extractStartTime,
    });
  }

  // The metadata prompt is built from the instruction and the data just extracted.
  const metadataCallMessages: ChatMessage[] = [
    buildMetadataSystemPrompt(),
    buildMetadataPrompt(instruction, extractedData),
  ];

  // Log the outgoing metadata request.
  let metadataCallFile = "";
  let metadataCallTimestamp = "";
  if (logInferenceToFile) {
    const { fileName, timestamp } = writeTimestampedTxtFile(
      "extract_summary",
      "metadata_call",
      {
        modelCall: "metadata",
        messages: metadataCallMessages,
      },
    );
    metadataCallFile = fileName;
    metadataCallTimestamp = timestamp;
  }

  // Call 2: progress/completed metadata, with the same sampling options as call 1.
  const metadataStartTime = Date.now();
  const metadataResponse = await withLlmTimeout(
    llmClient.createChatCompletion<MetadataResponse>({
      options: {
        messages: metadataCallMessages,
        response_model: {
          name: "Metadata",
          schema: metadataSchema,
        },
        temperature: isGPT5 ? 1 : 0.1,
        top_p: 1,
        frequency_penalty: 0,
        presence_penalty: 0,
      },
      logger,
    }),
    "extract metadata",
  );
  const metadataEndTime = Date.now();

  const {
    data: {
      completed: metadataResponseCompleted,
      progress: metadataResponseProgress,
    },
    usage: metadataResponseUsage,
  } = metadataResponse;

  // Only assigned (and only read) inside the logging branch below.
  let metadataResponseFile: string;
  if (logInferenceToFile) {
    const { fileName } = writeTimestampedTxtFile(
      "extract_summary",
      "metadata_response",
      {
        modelResponse: "metadata",
        completed: metadataResponseCompleted,
        progress: metadataResponseProgress,
      },
    );
    metadataResponseFile = fileName;

    appendSummary("extract", {
      extract_inference_type: "metadata",
      timestamp: metadataCallTimestamp,
      LLM_input_file: metadataCallFile,
      LLM_output_file: metadataResponseFile,
      prompt_tokens: metadataResponseUsage?.prompt_tokens ?? 0,
      completion_tokens: metadataResponseUsage?.completion_tokens ?? 0,
      reasoning_tokens: metadataResponseUsage?.reasoning_tokens ?? 0,
      cached_input_tokens: metadataResponseUsage?.cached_input_tokens ?? 0,
      inference_time_ms: metadataEndTime - metadataStartTime,
    });
  }

  // Aggregate usage and timing across both calls; absent usage counts as 0.
  const totalPromptTokens =
    (extractUsage?.prompt_tokens ?? 0) +
    (metadataResponseUsage?.prompt_tokens ?? 0);

  const totalCompletionTokens =
    (extractUsage?.completion_tokens ?? 0) +
    (metadataResponseUsage?.completion_tokens ?? 0);

  const totalInferenceTimeMs =
    extractEndTime - extractStartTime + (metadataEndTime - metadataStartTime);
  const totalReasoningTokens =
    (extractUsage?.reasoning_tokens ?? 0) +
    (metadataResponseUsage?.reasoning_tokens ?? 0);
  const totalCachedInputTokens =
    (extractUsage?.cached_input_tokens ?? 0) +
    (metadataResponseUsage?.cached_input_tokens ?? 0);

  // Keys listed after the spread take precedence over same-named fields in extractedData.
  return {
    ...extractedData,
    metadata: {
      completed: metadataResponseCompleted,
      progress: metadataResponseProgress,
    },
    prompt_tokens: totalPromptTokens,
    completion_tokens: totalCompletionTokens,
    reasoning_tokens: totalReasoningTokens,
    cached_input_tokens: totalCachedInputTokens,
    inference_time_ms: totalInferenceTimeMs,
  };
}

/**
 * Asks the LLM which elements of the accessibility tree match an instruction.
 *
 * A system message and a user message are built from the inputs, a structured
 * completion is requested against a Zod schema, and the matched elements are
 * returned together with token usage and the wall-clock inference time.
 *
 * Inputs (all passed as one options object):
 * - `instruction`: what the caller wants to find on the page.
 * - `domElements`: the serialized tree, embedded verbatim in the user message.
 * - `llmClient`: client used for the completion; its `modelName` decides the
 *   sampling temperature.
 * - `userProvidedInstructions`: optional text forwarded to the system prompt builder.
 * - `logger`: forwarded to the LLM client.
 * - `logInferenceToFile`: when true, the request and the response are written to
 *   timestamped files and a row is appended to the "observe" summary.
 * - `supportedActions`: forwarded to the system prompt builder only; the schema's
 *   `method` enum is always built from `SupportedUnderstudyAction`.
 *
 * @returns `elements` (empty array when the response has none), the four token
 *   counters (0 when the client reports no usage) and `inference_time_ms`.
 */
export async function observe({
  instruction,
  domElements,
  llmClient,
  userProvidedInstructions,
  logger,
  logInferenceToFile = false,
  supportedActions,
}: {
  instruction: string;
  domElements: string;
  llmClient: LLMClient;
  userProvidedInstructions?: string;
  logger: (message: LogLine) => void;
  logInferenceToFile?: boolean;
  supportedActions?: string[];
}) {
  // TODO: remove this as we update support for gpt-5 configuration options
  const usesGpt5 = llmClient.modelName.includes("gpt-5");

  // Shape of a single candidate element returned by the model.
  const matchedElementSchema = z.object({
    elementId: z
      .string()
      .regex(/^\d+-\d+$/)
      .describe(
        "the ID string associated with the element. Never include surrounding square brackets. This field must follow the format of 'number-number'.",
      ),
    description: z
      .string()
      .describe("a description of the accessible element and its purpose"),
    method: z
      .enum(
        // Use Object.values() for Zod v3 compatibility - z.enum() in v3 doesn't accept TypeScript enums directly
        Object.values(SupportedUnderstudyAction) as unknown as readonly [
          string,
          ...string[],
        ],
      )
      .describe(
        "the candidate method/action to interact with the element. Select one of the available Understudy interaction methods.",
      ),
    arguments: z.array(
      z
        .string()
        .describe(
          "the arguments to pass to the method. For example, for a click, the arguments are empty, but for a fill, the arguments are the value to fill in.",
        ),
    ),
  });

  const observeSchema = z.object({
    elements: z
      .array(matchedElementSchema)
      .describe("an array of accessible elements that match the instruction"),
  });

  type ObserveResponse = z.infer<typeof observeSchema>;

  const systemMessage = buildObserveSystemPrompt(
    userProvidedInstructions,
    supportedActions,
  );
  const userMessage = buildObserveUserMessage(instruction, domElements);
  const messages: ChatMessage[] = [systemMessage, userMessage];

  // Record the outgoing request first so the summary row can point at it later.
  const requestLog = logInferenceToFile
    ? writeTimestampedTxtFile("observe_summary", "observe_call", {
        modelCall: "observe",
        messages,
      })
    : { fileName: "", timestamp: "" };

  const startedAt = Date.now();
  const completion = await llmClient.createChatCompletion<ObserveResponse>({
    options: {
      messages,
      response_model: {
        schema: observeSchema,
        name: "Observation",
      },
      temperature: usesGpt5 ? 1 : 0.1,
      top_p: 1,
      frequency_penalty: 0,
      presence_penalty: 0,
    },
    logger,
  });
  const inferenceTimeMs = Date.now() - startedAt;

  const { data: observeData, usage } = completion;

  // Missing usage fields are reported as zero.
  const tokenUsage = {
    prompt_tokens: usage?.prompt_tokens ?? 0,
    completion_tokens: usage?.completion_tokens ?? 0,
    reasoning_tokens: usage?.reasoning_tokens ?? 0,
    cached_input_tokens: usage?.cached_input_tokens ?? 0,
  };

  if (logInferenceToFile) {
    const responseLog = writeTimestampedTxtFile(
      "observe_summary",
      "observe_response",
      {
        modelResponse: "observe",
        rawResponse: observeData,
      },
    );

    appendSummary("observe", {
      observe_inference_type: "observe",
      timestamp: requestLog.timestamp,
      LLM_input_file: requestLog.fileName,
      LLM_output_file: responseLog.fileName,
      ...tokenUsage,
      inference_time_ms: inferenceTimeMs,
    });
  }

  // Coerce description/method to plain strings; ids and arguments pass through.
  const elements =
    observeData.elements?.map((el) => ({
      elementId: el.elementId,
      description: String(el.description),
      method: String(el.method),
      arguments: el.arguments,
    })) ?? [];

  return {
    elements,
    ...tokenUsage,
    inference_time_ms: inferenceTimeMs,
  };
}

/**
 * Asks the LLM for the single element (and interaction method) that best
 * matches an action instruction.
 *
 * A system message and a user message are built from the inputs, a structured
 * completion is requested against a Zod schema, and the chosen element is
 * returned together with token usage, timing and the model's `twoStep` flag.
 *
 * Inputs (all passed as one options object):
 * - `instruction`: the action the caller wants to perform.
 * - `domElements`: the serialized tree, embedded verbatim in the user message.
 * - `llmClient`: client used for the completion; its `modelName` decides the
 *   sampling temperature.
 * - `userProvidedInstructions`: optional text forwarded to the system prompt builder.
 * - `logger`: forwarded to the LLM client.
 * - `logInferenceToFile`: when true, the request and the response are written to
 *   timestamped files and a row is appended to the "act" summary.
 *
 * @returns `element`, the four token counters (0 when the client reports no
 *   usage), `inference_time_ms` and `twoStep` exactly as the model returned it.
 */
export async function act({
  instruction,
  domElements,
  llmClient,
  userProvidedInstructions,
  logger,
  logInferenceToFile = false,
}: {
  instruction: string;
  domElements: string;
  llmClient: LLMClient;
  userProvidedInstructions?: string;
  logger: (message: LogLine) => void;
  logInferenceToFile?: boolean;
}) {
  // TODO: remove this as we update support for gpt-5 configuration options
  const usesGpt5 = llmClient.modelName.includes("gpt-5");

  // Allowed values for the `method` field.
  // Use Object.values() for Zod v3 compatibility - z.enum() in v3 doesn't accept TypeScript enums directly
  const methodNames = Object.values(
    SupportedUnderstudyAction,
  ) as unknown as readonly [string, ...string[]];

  const actSchema = z.object({
    elementId: z
      .string()
      .regex(/^\d+-\d+$/)
      .describe(
        "the ID string associated with the element. Never include surrounding square brackets. This field must follow the format of 'number-number'.",
      ),
    description: z
      .string()
      .describe("a description of the accessible element and its purpose"),
    method: z
      .enum(methodNames)
      .describe(
        "the candidate method/action to interact with the element. Select one of the available Understudy interaction methods.",
      ),
    arguments: z.array(
      z
        .string()
        .describe(
          "the arguments to pass to the method. For example, for a click, the arguments are empty, but for a fill, the arguments are the value to fill in.",
        ),
    ),
    twoStep: z.boolean(),
  });

  type ActResponse = z.infer<typeof actSchema>;

  const systemMessage = buildActSystemPrompt(userProvidedInstructions);
  // The user message format is shared with observe().
  const userMessage = buildObserveUserMessage(instruction, domElements);
  const messages: ChatMessage[] = [systemMessage, userMessage];

  // Record the outgoing request first so the summary row can point at it later.
  const requestLog = logInferenceToFile
    ? writeTimestampedTxtFile("act_summary", "act_call", {
        modelCall: "act",
        messages,
      })
    : { fileName: "", timestamp: "" };

  const startedAt = Date.now();
  const completion = await llmClient.createChatCompletion<ActResponse>({
    options: {
      messages,
      response_model: {
        schema: actSchema,
        name: "act",
      },
      temperature: usesGpt5 ? 1 : 0.1,
      top_p: 1,
      frequency_penalty: 0,
      presence_penalty: 0,
    },
    logger,
  });
  const inferenceTimeMs = Date.now() - startedAt;

  const { data: actData, usage } = completion;

  // Missing usage fields are reported as zero.
  const tokenUsage = {
    prompt_tokens: usage?.prompt_tokens ?? 0,
    completion_tokens: usage?.completion_tokens ?? 0,
    reasoning_tokens: usage?.reasoning_tokens ?? 0,
    cached_input_tokens: usage?.cached_input_tokens ?? 0,
  };

  if (logInferenceToFile) {
    const responseLog = writeTimestampedTxtFile("act_summary", "act_response", {
      modelResponse: "act",
      rawResponse: actData,
    });

    appendSummary("act", {
      act_inference_type: "act",
      timestamp: requestLog.timestamp,
      LLM_input_file: requestLog.fileName,
      LLM_output_file: responseLog.fileName,
      ...tokenUsage,
      inference_time_ms: inferenceTimeMs,
    });
  }

  return {
    // Coerce description/method to plain strings; id and arguments pass through.
    element: {
      elementId: actData.elementId,
      description: String(actData.description),
      method: String(actData.method),
      arguments: actData.arguments,
    },
    ...tokenUsage,
    inference_time_ms: inferenceTimeMs,
    twoStep: actData.twoStep,
  };
}


================================================
FILE: packages/core/lib/inferenceLogUtils.ts
================================================
import fs from "fs";
import path from "path";

/**
 * Makes sure `<cwd>/inference_summary` exists and returns its absolute path.
 *
 * The directory is only created when `fs.existsSync` reports it missing.
 */
function ensureInferenceSummaryDir(): string {
  const summaryRoot = path.join(process.cwd(), "inference_summary");
  const alreadyPresent = fs.existsSync(summaryRoot);
  if (!alreadyPresent) {
    fs.mkdirSync(summaryRoot, { recursive: true });
  }
  return summaryRoot;
}

/**
 * Appends `entry` to the `<inferenceType>_summary` array stored in
 * `<inferenceType>_summary.json` and rewrites the whole file as
 * 2-space-indented JSON.
 *
 * The current contents are loaded through `readSummaryFile`, so a missing or
 * unparsable file starts over from an empty array.
 *
 * @param inferenceType - summary family, e.g. "act", "observe" or "extract"
 * @param entry - row to append
 */
export function appendSummary<T>(inferenceType: string, entry: T) {
  const summary = readSummaryFile<T>(inferenceType);
  summary[`${inferenceType}_summary`].push(entry);

  const serialized = JSON.stringify(summary, null, 2);
  fs.writeFileSync(getSummaryJsonPath(inferenceType), serialized);
}

/**
 * Builds a filename-friendly timestamp from the current UTC time.
 *
 * The ISO string (e.g. `2024-01-02T03:04:05.678Z`) is reduced to its digits,
 * with the date and time halves joined by an underscore: `20240102_030405678`.
 */
function getTimestamp(): string {
  const [datePart, timePart] = new Date().toISOString().split("T");
  const digitsOnly = (text: string): string => text.replace(/[^0-9]/g, "");
  return `${digitsOnly(datePart)}_${digitsOnly(timePart)}`;
}

/**
 * Serializes `data` as pretty-printed JSON and writes it to
 * `inference_summary/<directory>/<timestamp>_<prefix>.txt`.
 *
 * Escaped `\n` sequences in the JSON text are turned into real line breaks, so
 * the file is meant for reading and is not guaranteed to be valid JSON.
 *
 * @param directory - sub-directory of `inference_summary`, created if missing
 * @param prefix - label placed after the timestamp in the file name
 * @param data - value to serialize
 * @returns the file name (not the full path) and the timestamp used in it
 */
export function writeTimestampedTxtFile(
  directory: string,
  prefix: string,
  data: unknown,
): { fileName: string; timestamp: string } {
  const targetDir = path.join(ensureInferenceSummaryDir(), directory);
  if (!fs.existsSync(targetDir)) {
    fs.mkdirSync(targetDir, { recursive: true });
  }

  const timestamp = getTimestamp();
  const fileName = `${timestamp}_${prefix}.txt`;

  // Unescape "\n" so multi-line strings (prompts, DOM dumps) are readable.
  const readableJson = JSON.stringify(data, null, 2).replace(/\\n/g, "\n");
  fs.writeFileSync(path.join(targetDir, fileName), readableJson);

  return { fileName, timestamp };
}

/**
 * Resolves the location of the `<inferenceType>_summary.json` file, creating
 * its containing directory when it does not exist yet.
 *
 * Example: `inferenceType = "act"` yields
 *   `<cwd>/inference_summary/act_summary/act_summary.json`
 */
function getSummaryJsonPath(inferenceType: string): string {
  const summaryName = `${inferenceType}_summary`;
  const summaryDir = path.join(ensureInferenceSummaryDir(), summaryName);

  const dirExists = fs.existsSync(summaryDir);
  if (!dirExists) {
    fs.mkdirSync(summaryDir, { recursive: true });
  }

  return path.join(summaryDir, `${summaryName}.json`);
}

/**
 * Loads `<inferenceType>_summary.json` and returns its parsed contents.
 *
 * The file is expected to be an object whose `<inferenceType>_summary` key
 * holds an array, e.g. for "act":
 * {
 *   "act_summary": [ ... ]
 * }
 *
 * Whenever the file is missing, cannot be read or parsed, or does not have
 * that array, a fresh `{ "<inferenceType>_summary": [] }` is returned instead.
 */
function readSummaryFile<T>(inferenceType: string): Record<string, T[]> {
  const summaryPath = getSummaryJsonPath(inferenceType);

  // Top-level array key, e.g. "act_summary", "observe_summary", "extract_summary"
  const arrayKey = `${inferenceType}_summary`;
  const emptySummary = (): Record<string, T[]> => ({ [arrayKey]: [] });

  if (!fs.existsSync(summaryPath)) {
    return emptySummary();
  }

  try {
    const parsed = JSON.parse(fs.readFileSync(summaryPath, "utf8"));
    const hasExpectedShape =
      parsed && typeof parsed === "object" && Array.isArray(parsed[arrayKey]);
    if (hasExpectedShape) {
      return parsed;
    }
  } catch {
    // Best effort: an unreadable or corrupt summary is treated as empty.
  }

  return emptySummary();
}


================================================
FILE: packages/core/lib/logger.ts
================================================
import pino from "pino";
import { LogLine } from "./v3/types/public/logs.js";

// Translation from Stagehand's numeric verbosity levels to Pino level names:
//   0 -> "error" (critical/important messages)
//   1 -> "info"  (standard information)
//   2 -> "debug" (detailed debugging information)
const levelMapping: Record<number, pino.Level> = {
  0: "error",
  1: "info",
  2: "debug",
};

// Configuration options accepted by createLogger and StagehandLogger.
export interface LoggerOptions {
  // Request the "pino-pretty" transport; createLogger ignores this in test environments.
  pretty?: boolean;
  // Initial Pino level; createLogger falls back to "info" when omitted.
  level?: pino.Level;
  // Passed to pino() as its second (destination stream) argument.
  destination?: pino.DestinationStream;
  // Force Pino on (true) or off (false). When omitted, StagehandLogger uses Pino
  // only if no external logger was supplied. Pino is always off in test environments.
  usePino?: boolean;
}

/**
 * Creates a configured Pino logger instance.
 *
 * The base configuration uses `options.level` (default "info"), drops the
 * pid/hostname bindings and logs objects in browser builds.
 *
 * When `options.pretty` is set and we are not in a test environment, the
 * logger is created with the "pino-pretty" transport. Pino resolves the
 * transport target while the logger is being constructed, so that
 * construction is what gets guarded: if it throws (typically because
 * pino-pretty is not installed), a warning is printed and a plain logger is
 * returned instead. Errors from building the plain logger are not caught.
 *
 * @param options - see LoggerOptions; `usePino` is not read here
 * @returns the Pino logger
 */
export function createLogger(options: LoggerOptions = {}) {
  const loggerConfig: pino.LoggerOptions = {
    level: options.level || "info",
    base: undefined, // Don't include pid and hostname
    browser: {
      asObject: true,
    },
    // Disable worker threads to avoid issues in tests
    transport: undefined,
  };

  // Pretty printing is opt-in and never used in test environments.
  if (options.pretty && !isTestEnvironment()) {
    const prettyConfig: pino.LoggerOptions = {
      ...loggerConfig,
      transport: {
        target: "pino-pretty",
        options: {
          colorize: true,
          translateTime: "SYS:standard",
          ignore: "pid,hostname",
        },
      },
    };

    try {
      // The transport target is resolved inside pino(), so the call itself
      // must be inside the try block for the fallback to be reachable.
      return pino(prettyConfig, options.destination);
    } catch {
      console.warn(
        "pino-pretty not available, falling back to standard logging",
      );
    }
  }

  return pino(loggerConfig, options.destination);
}

/**
 * Reports whether the process looks like a test or CI run.
 *
 * True when any of these holds:
 *   - NODE_ENV is exactly "test"
 *   - JEST_WORKER_ID is set (any value)
 *   - PLAYWRIGHT_TEST_BASE_DIR is set (any value)
 *   - CI is exactly "true"
 */
function isTestEnvironment(): boolean {
  const { NODE_ENV, JEST_WORKER_ID, PLAYWRIGHT_TEST_BASE_DIR, CI } =
    process.env;

  if (NODE_ENV === "test") return true;
  if (JEST_WORKER_ID !== undefined) return true;
  if (PLAYWRIGHT_TEST_BASE_DIR !== undefined) return true;

  // CI environments count as test environments too.
  return CI === "true";
}

/**
 * Logger used by Stagehand. It accepts LogLine objects and routes each one to
 * Pino, to a caller-supplied logger callback, and/or to the console.
 *
 * ROUTING (decided once in the constructor, applied on every `log` call):
 *
 * Test environments (as reported by isTestEnvironment):
 *   - Pino is never used.
 *   - External logger provided -> only the external logger is called.
 *   - No external logger -> lines are printed through console.*.
 *
 * Non-test environments:
 *   - usePino === true  -> emit via Pino and also call the external logger when present.
 *   - usePino === false -> no Pino; external logger when present, otherwise console.
 *   - usePino omitted   -> external logger when present (Pino off); otherwise Pino.
 *
 * SHARED PINO INSTANCE:
 * All instances that use Pino share one static Pino logger. It is created by
 * the first such instance, from that instance's options; options passed to
 * later instances do not reconfigure it. The original design note gives the
 * reason: with the `pino-pretty` transport, one logger per Stagehand instance
 * spawned one worker thread each and caused memory/RSS growth in processes
 * that create and dispose many Stagehand objects.
 *
 * Because the Pino logger is shared, `setVerbosity` on any instance changes
 * the Pino level seen by every other instance.
 */
export class StagehandLogger {
  /** The single Pino logger reused by every instance that has Pino enabled. */
  private static sharedPinoLogger: pino.Logger | null = null;

  private logger?: pino.Logger;
  private verbose: 0 | 1 | 2;
  private externalLogger?: (logLine: LogLine) => void;
  private usePino: boolean;
  private isTest: boolean;

  /**
   * @param options - logger options; `usePino` drives routing, the rest is
   *   only used if this instance ends up creating the shared Pino logger
   * @param externalLogger - optional callback that receives raw LogLine objects
   */
  constructor(
    options: LoggerOptions = {},
    externalLogger?: (logLine: LogLine) => void,
  ) {
    this.verbose = 1; // Default verbosity level
    this.externalLogger = externalLogger;
    this.isTest = isTestEnvironment();

    if (this.isTest) {
      // Tests never go through Pino.
      this.usePino = false;
    } else if (typeof options.usePino === "boolean") {
      // An explicit choice always wins outside of tests.
      this.usePino = options.usePino;
    } else {
      // No explicit choice: Pino only when nobody supplied their own logger.
      this.usePino = typeof externalLogger !== "function";
    }

    if (this.usePino) {
      const shared = StagehandLogger.sharedPinoLogger ?? createLogger(options);
      StagehandLogger.sharedPinoLogger = shared;
      this.logger = shared;
    }
  }

  /**
   * Sets how chatty this logger is (0 = errors only, 1 = info, 2 = debug) and,
   * when Pino is in use, applies the matching level to the Pino logger.
   */
  setVerbosity(level: 0 | 1 | 2) {
    this.verbose = level;

    if (!this.usePino || !this.logger) {
      return;
    }

    if (level === 0) {
      this.logger.level = "error";
    } else if (level === 1) {
      this.logger.level = "info";
    } else if (level === 2) {
      this.logger.level = "debug";
    }
  }

  /**
   * Emits one LogLine according to the routing rules described on the class.
   * Lines whose level (default 1) exceeds the current verbosity are dropped.
   */
  log(logLine: LogLine): void {
    const level = logLine.level ?? 1;
    if (level > this.verbose) {
      return;
    }

    // Nobody else will show this line (no external logger, and Pino is either
    // disabled or we are in a test run), so print it ourselves and stop here
    // to avoid duplicate output.
    const nobodyElseListens =
      !this.externalLogger && (!this.usePino || this.isTest);
    if (nobodyElseListens) {
      this.writeToConsole(logLine);
      return;
    }

    if (this.usePino && this.logger) {
      const fields = {
        category: logLine.category,
        timestamp: logLine.timestamp || new Date().toISOString(),
        ...this.formatAuxiliaryData(logLine.auxiliary),
      };

      // Unknown levels, and any Pino level without its own case, go out as info.
      switch (levelMapping[level] || "info") {
        case "error":
          this.logger.error(fields, logLine.message);
          break;
        case "debug":
          this.logger.debug(fields, logLine.message);
          break;
        case "warn":
          this.logger.warn(fields, logLine.message);
          break;
        case "trace":
          this.logger.trace(fields, logLine.message);
          break;
        default:
          this.logger.info(fields, logLine.message);
      }
    }

    // A user-provided logger (e.g. EvalLogger, custom loggers) always gets the
    // raw line when present, regardless of whether Pino also emitted it.
    this.externalLogger?.(logLine);
  }

  /**
   * Console fallback: prints `[timestamp] LEVEL: message`, followed by one
   * indented `key: value` line per auxiliary field (objects pretty-printed).
   */
  private writeToConsole(logLine: LogLine): void {
    const level = logLine.level ?? 1;
    const ts = logLine.timestamp ?? new Date().toISOString();
    const label = level === 0 ? "ERROR" : level === 2 ? "DEBUG" : "INFO";

    const lines = [`[${ts}] ${label}: ${logLine.message}`];

    if (logLine.auxiliary) {
      const fields = this.formatAuxiliaryData(logLine.auxiliary);
      for (const [key, value] of Object.entries(fields)) {
        const rendered =
          typeof value === "object" && value !== null
            ? // Indent continuation lines so nested JSON lines up under the key.
              JSON.stringify(value, null, 2).replace(/\n/g, "\n    ")
            : String(value);
        lines.push(`    ${key}: ${rendered}`);
      }
    }

    const output = lines.join("\n");
    if (level === 0) {
      console.error(output);
    } else if (level === 1) {
      console.log(output);
    } else if (level === 2) {
      console.debug(output);
    }
  }

  /**
   * Turns the string-encoded auxiliary map of a LogLine back into typed values
   * keyed by field name. Undefined values and empty objects/arrays are left out.
   */
  private formatAuxiliaryData(auxiliary?: LogLine["auxiliary"]) {
    const decoded: Record<string, unknown> = {};
    if (!auxiliary) return decoded;

    for (const [key, { value, type }] of Object.entries(auxiliary)) {
      let parsed: unknown;

      if (type === "integer") {
        parsed = parseInt(value, 10);
      } else if (type === "float") {
        parsed = parseFloat(value);
      } else if (type === "boolean") {
        parsed = value === "true";
      } else if (type === "object") {
        try {
          parsed = JSON.parse(value);
        } catch {
          // Not valid JSON: keep the raw string.
          parsed = value;
        }
      } else {
        parsed = value;
      }

      if (parsed === undefined) continue;

      if (typeof parsed === "object" && parsed !== null) {
        const size = Array.isArray(parsed)
          ? parsed.length
          : Object.keys(parsed).length;
        if (size === 0) continue;
      }

      decoded[key] = parsed;
    }

    return decoded;
  }

  /** Logs `message` at level 0 (error) with optional structured data. */
  error(message: string, data?: Record<string, unknown>): void {
    const auxiliary = this.convertToAuxiliary(data);
    this.log({ message, level: 0, auxiliary });
  }

  /** Logs `message` at level 1, tagged with category "warning". */
  warn(message: string, data?: Record<string, unknown>): void {
    const auxiliary = this.convertToAuxiliary(data);
    this.log({ message, level: 1, category: "warning", auxiliary });
  }

  /** Logs `message` at level 1 (info) with optional structured data. */
  info(message: string, data?: Record<string, unknown>): void {
    const auxiliary = this.convertToAuxiliary(data);
    this.log({ message, level: 1, auxiliary });
  }

  /** Logs `message` at level 2 (debug) with optional structured data. */
  debug(message: string, data?: Record<string, unknown>): void {
    const auxiliary = this.convertToAuxiliary(data);
    this.log({ message, level: 2, auxiliary });
  }

  /**
   * Encodes a plain object into the LogLine auxiliary format: each value is
   * stored as a string next to a type tag. Undefined values are skipped;
   * objects (including null and arrays) are JSON-encoded.
   */
  private convertToAuxiliary(
    data?: Record<string, unknown>,
  ): LogLine["auxiliary"] {
    if (!data) return undefined;

    const auxiliary: LogLine["auxiliary"] = {};

    for (const [key, value] of Object.entries(data)) {
      if (value === undefined) continue;

      const jsType = typeof value;

      let tag: "integer" | "float" | "boolean" | "object" | "string";
      if (jsType === "number") {
        tag = Number.isInteger(value) ? "integer" : "float";
      } else if (jsType === "boolean") {
        tag = "boolean";
      } else if (jsType === "object") {
        tag = "object";
      } else {
        tag = "string";
      }

      auxiliary[key] = {
        value: jsType === "object" ? JSON.stringify(value) : String(value),
        type: tag,
      };
    }

    return auxiliary;
  }
}


================================================
FILE: packages/core/lib/modelUtils.ts
================================================
import { ClientOptions, ModelConfiguration } from "./v3/types/public/model.js";
import {
  AVAILABLE_CUA_MODELS,
  AvailableCuaModel,
} from "./v3/types/public/agent.js";

/**
 * Pulls the model name out of either accepted model format.
 *
 * @param model - a model string, or an object carrying a `modelName`
 * @returns the string itself, or the object's `modelName`; `undefined` when
 *   `model` is missing or an empty string
 */
export function extractModelName(
  model?: string | { modelName: string; [key: string]: unknown },
): string | undefined {
  if (typeof model === "string") {
    return model === "" ? undefined : model;
  }
  return model ? model.modelName : undefined;
}

/**
 * Splits a `provider/model` string at its first slash.
 *
 * Only the first slash separates the two parts, so "a/b/c" gives provider "a"
 * and modelName "b/c". A string without any slash gives an empty provider and
 * the whole string as modelName.
 */
export function splitModelName(model: string): {
  provider: string;
  modelName: string;
} {
  const slashAt = model.indexOf("/");
  if (slashAt === -1) {
    return { provider: "", modelName: model };
  }
  return {
    provider: model.slice(0, slashAt),
    modelName: model.slice(slashAt + 1),
  };
}

/**
 * Normalizes a model reference (string or configuration object) into its
 * provider, model name, client options and CUA flag.
 *
 * - Client options are every field of a configuration object except
 *   `modelName`; a plain string yields empty options.
 * - If the options carry an explicit `provider`, that provider is used and the
 *   model name is passed through unsplit. Otherwise the model string is split
 *   at its first "/" into provider and model name.
 * - `isCua` is true when a provider was given explicitly, or when the full
 *   model string is listed in AVAILABLE_CUA_MODELS.
 */
export function resolveModel(model: string | ModelConfiguration): {
  provider: string;
  modelName: string;
  clientOptions: ClientOptions;
  isCua: boolean;
} {
  const modelString = extractModelName(model)!;

  // Everything except modelName on a configuration object is a client option.
  const clientOptions =
    typeof model === "string"
      ? {}
      : (() => {
          // eslint-disable-next-line @typescript-eslint/no-unused-vars
          const { modelName: _, ...rest } = model;
          return rest;
        })();

  const hasExplicitProvider = clientOptions.provider !== undefined;

  // An explicit provider means the model name must not be split.
  const { provider, modelName } = hasExplicitProvider
    ? { provider: clientOptions.provider as string, modelName: modelString }
    : splitModelName(modelString);

  const isCua =
    hasExplicitProvider ||
    AVAILABLE_CUA_MODELS.includes(modelString as AvailableCuaModel);

  return { provider, modelName, clientOptions, isCua };
}


================================================
FILE: packages/core/lib/prompt.ts
================================================
import { ChatMessage } from "./v3/llm/LLMClient.js";
import type { Variables } from "./v3/types/public/agent.js";

/**
 * Renders the "Custom Instructions Provided by the User" prompt section.
 *
 * @param userProvidedInstructions - free-form text supplied by the user
 * @returns the section, starting with two line breaks and ending with the
 *   user's text; an empty string when no instructions were given
 */
export function buildUserInstructionsString(
  userProvidedInstructions?: string,
): string {
  if (!userProvidedInstructions) {
    return "";
  }

  const sectionLines = [
    "\n\n# Custom Instructions Provided by the User",
    "    ", // whitespace-only line, kept exactly as in the prompt text
    "Please keep the user's instructions in mind when performing actions. If the user's instructions are not relevant to the current task, ignore them.",
    "",
    "User Instructions:",
    `${userProvidedInstructions}`,
  ];

  return sectionLines.join("\n");
}

// extract
/**
 * Builds the system message for an extraction call.
 *
 * The prompt is assembled from fixed sentences, optionally a repeated reminder
 * to use the `print_extracted_data` tool, guidance on extracting links by
 * element ID, and optionally the user's custom instructions. Every run of
 * whitespace in the final text (including inside the user's instructions) is
 * collapsed to a single space.
 *
 * @param isUsingPrintExtractedDataTool - adds the tool-only reminder when true
 * @param userProvidedInstructions - optional custom instructions to append
 */
export function buildExtractSystemPrompt(
  isUsingPrintExtractedDataTool: boolean = false,
  userProvidedInstructions?: string,
): ChatMessage {
  const toolReminder =
    "ONLY print the content using the print_extracted_data tool provided.";

  const sentences: string[] = [
    "You are extracting content on behalf of a user.",
    "If a user asks you to extract a 'list' of information, or 'all' information,",
    "YOU MUST EXTRACT ALL OF THE INFORMATION THAT THE USER REQUESTS.",
    "You will be given:",
    "1. An instruction",
    "2. A list of DOM elements to extract from.",
    "Print the exact text from the DOM elements with all symbols, characters, and endlines as is.",
    "Print null or an empty string if no new information is found.",
  ];

  if (isUsingPrintExtractedDataTool) {
    // The reminder is intentionally stated twice.
    sentences.push(toolReminder, toolReminder);
  }

  sentences.push(
    "If a user is attempting to extract links or URLs, you MUST respond with ONLY the IDs of the link elements.",
    // The trailing space is part of the prompt text.
    "Do not attempt to extract links directly from the text unless absolutely necessary. ",
  );

  const userInstructions = buildUserInstructionsString(
    userProvidedInstructions,
  );

  let rawPrompt = sentences.join("\n");
  if (userInstructions) {
    rawPrompt += `\n\n${userInstructions}`;
  }

  return {
    role: "system",
    content: rawPrompt.replace(/\s+/g, " "),
  };
}

/**
 * Builds the user message for an extraction call: the instruction on the
 * first line, the DOM text after it, and (optionally) a repeated reminder to
 * answer only through the `print_extracted_data` tool.
 *
 * @param instruction - what to extract
 * @param domElements - DOM text to extract from, embedded verbatim
 * @param isUsingPrintExtractedDataTool - appends the tool-only reminder when true
 */
export function buildExtractUserPrompt(
  instruction: string,
  domElements: string,
  isUsingPrintExtractedDataTool: boolean = false,
): ChatMessage {
  const lines = [`Instruction: ${instruction}`, `DOM: ${domElements}`];

  if (isUsingPrintExtractedDataTool) {
    const toolReminder =
      "ONLY print the content using the print_extracted_data tool provided.";
    // The reminder is intentionally stated twice.
    lines.push(toolReminder, toolReminder);
  }

  return {
    role: "user",
    content: lines.join("\n"),
  };
}

// System prompt for the follow-up "metadata" call that judges whether an
// extraction is complete. Kept as one literal so the wording stays in one place.
const metadataSystemPrompt = `You are an AI assistant tasked with evaluating the progress and completion status of an extraction task.
Analyze the extraction response and determine if the task is completed or if more information is needed.
Strictly abide by the following criteria:
1. Once the instruction has been satisfied by the current extraction response, ALWAYS set completion status to true and stop processing, regardless of remaining chunks.
2. Only set completion status to false if BOTH of these conditions are true:
   - The instruction has not been satisfied yet
   - There are still chunks left to process (chunksTotal > chunksSeen)`;

/**
 * Wraps the fixed metadata prompt in a system chat message.
 */
export function buildMetadataSystemPrompt(): ChatMessage {
  const systemMessage: ChatMessage = {
    role: "system",
    content: metadataSystemPrompt,
  };
  return systemMessage;
}

/**
 * Builds the user message for the metadata (completion check) call.
 *
 * @param instruction - the original extraction instruction
 * @param extractionResponse - what was extracted; embedded as 2-space-indented JSON
 */
export function buildMetadataPrompt(
  instruction: string,
  extractionResponse: object,
): ChatMessage {
  const extractedJson = JSON.stringify(extractionResponse, null, 2);
  const content = `Instruction: ${instruction}\nExtracted content: ${extractedJson}`;

  return { role: "user", content };
}

// observe
/**
 * Builds the system message for an observe call.
 *
 * The fixed prompt text (with the optional "Supported actions: ..." list
 * spliced in) has every run of whitespace collapsed to a single space. The
 * user's custom instructions, if any, are appended afterwards without
 * collapsing, separated by a blank line.
 *
 * @param userProvidedInstructions - optional custom instructions to append
 * @param supportedActions - action names to list in the prompt; omitted when empty
 */
export function buildObserveSystemPrompt(
  userProvidedInstructions?: string,
  supportedActions?: string[],
): ChatMessage {
  let actionsSuffix = "";
  if (supportedActions?.length) {
    actionsSuffix = `\n\nSupported actions: ${supportedActions.join(", ")}`;
  }

  // The leading empty entry keeps the prompt starting with whitespace.
  const promptLines = [
    "",
    "You are helping the user automate the browser by finding elements based on what the user wants to observe in the page.",
    "",
    "You will be given:",
    "1. a instruction of elements to observe",
    "2. a hierarchical accessibility tree showing the semantic structure of the page. The tree is a hybrid of the DOM and the accessibility tree.",
    "",
    "Return an array of elements that match the instruction if they exist, otherwise return an empty array.",
    `When returning elements, include the appropriate method from the supported actions list.${actionsSuffix}. When choosing non-left click actions, provide right or middle as the argument.`,
  ];
  const basePrompt = promptLines.join("\n").replace(/\s+/g, " ");

  const customInstructions = buildUserInstructionsString(
    userProvidedInstructions,
  );

  return {
    role: "system",
    content: customInstructions
      ? `${basePrompt}\n\n${customInstructions}`
      : basePrompt,
  };
}

/**
 * Builds the user message shared by observe and act calls: the instruction,
 * then an "Accessibility Tree:" header followed by the tree on its own lines.
 *
 * @param instruction - what to look for / do
 * @param domElements - serialized tree, embedded verbatim
 */
export function buildObserveUserMessage(
  instruction: string,
  domElements: string,
): ChatMessage {
  const content = [
    `instruction: ${instruction}`,
    "Accessibility Tree: ",
    `${domElements}`,
    "", // message ends with a line break
  ].join("\n");

  return { role: "user", content };
}

/**
 * Builds the system message for an act call.
 *
 * The fixed prompt text has every run of whitespace collapsed to a single
 * space. The user's custom instructions, if any, are appended afterwards
 * without collapsing, separated by a blank line.
 *
 * @param userProvidedInstructions - optional custom instructions to append
 */
export function buildActSystemPrompt(
  userProvidedInstructions?: string,
): ChatMessage {
  // The leading empty entry keeps the prompt starting with whitespace.
  const promptLines = [
    "",
    "You are helping the user automate the browser by finding elements based on what action the user wants to take on the page",
    "",
    "You will be given:",
    "1. a user defined instruction about what action to take",
    "2. a hierarchical accessibility tree showing the semantic structure of the page. The tree is a hybrid of the DOM and the accessibility tree.",
    "",
    "Return the element that matches the instruction if it exists. Otherwise, return an empty object.",
  ];
  const basePrompt = promptLines.join("\n").replace(/\s+/g, " ");

  const customInstructions = buildUserInstructionsString(
    userProvidedInstructions,
  );

  return {
    role: "system",
    content: customInstructions
      ? `${basePrompt}\n\n${customInstructions}`
      : basePrompt,
  };
}

/**
 * Builds the instruction text sent to the model for a single act step.
 *
 * @param action - The user's natural-language action.
 * @param supportedActions - Method names the model may choose from.
 * @param variables - Optional variables; only their names (as `%name%`) are
 *   exposed in the prompt, never their values.
 * @returns The full instruction string.
 */
export function buildActPrompt(
  action: string,
  supportedActions: string[],
  variables?: Variables,
): string {
  const actionList = supportedActions.join(", ");

  const basePrompt = `Find the most relevant element to perform an action on given the following action: ${action}.  
  IF AND ONLY IF the action EXPLICITLY includes the word 'dropdown' and implies choosing/selecting an option from a dropdown, ignore the 'General Instructions' section, and follow the 'Dropdown Specific Instructions' section carefully.
  
  General Instructions: 
    Provide an action for this element such as ${actionList}. Remember that to users, buttons and links look the same in most cases.
    When choosing non-left click actions, provide right or middle as the argument
    If the action is completely unrelated to a potential action to be taken on the page, return an empty object. 
    ONLY return one action. If multiple actions are relevant, return the most relevant one. 
    If the user is asking to scroll to a position on the page, e.g., 'halfway' or 0.75, etc, you must return the argument formatted as the correct percentage, e.g., '50%' or '75%', etc.
    If the user is asking to scroll to the next chunk/previous chunk, choose the nextChunk/prevChunk method. No arguments are required here.
    If the action implies a key press, e.g., 'press enter', 'press a', 'press space', etc., always choose the press method with the appropriate key as argument — e.g. 'a', 'Enter', 'Space'. Do not choose a click action on an on-screen keyboard. Capitalize the first character like 'Enter', 'Tab', 'Escape' only for special keys. 
  
  Dropdown Specific Instructions:
    For interacting with dropdowns, there are two specific cases that you need to handle. 
    
    CASE 1: the element is a 'select' element. 
      - choose the selectOptionFromDropdown method,
      - set the argument to the exact text of the option that should be selected,
      - set twoStep to false.
    CASE 2: the element is NOT a 'select' element:
      - do not attempt to directly choose the element from the dropdown. You will need to click to expand the dropdown first. You will achieve this by following these instructions:
        - choose the node that most closely corresponds to the given instruction EVEN if it is a 'StaticText' element, or otherwise does not appear to be interactable.  
        - choose the 'click' method
        - set twoStep to true.
  `;

  // Nothing to append when no variables were supplied.
  const variableKeys = variables ? Object.keys(variables) : [];
  if (variableKeys.length === 0) {
    return basePrompt;
  }

  // Expose variable names only, wrapped as %name% placeholders.
  const placeholders = variableKeys.map((key) => `%${key}%`).join(", ");
  return `${basePrompt} The following variables are available to use in the action: ${placeholders}. Fill the argument variables with the variable name.`;
}

/**
 * Builds the instruction text for the second half of a two-step action
 * (the prompt tells the model that step 1 of 2 has already been completed).
 *
 * @param originalUserAction - The action the user originally asked for.
 * @param previousAction - Description of the step that was just performed.
 * @param supportedActions - Method names the model may choose from.
 * @param variables - Optional variables; only their names (as `%name%`) are
 *   exposed in the prompt, never their values.
 * @returns The full instruction string.
 */
export function buildStepTwoPrompt(
  originalUserAction: string,
  previousAction: string,
  supportedActions: string[],
  variables?: Variables,
): string {
  const actionList = supportedActions.join(", ");

  const basePrompt = `
  The original user action was: ${originalUserAction}.
  You have just taken the following action which completed step 1 of 2: ${previousAction}.
  
  Now, you must find the most relevant element to perform an action on in order to complete step 2 of 2. 
  
  General Instructions: 
  Provide an action for this element such as ${actionList}. Remember that to users, buttons and links look the same in most cases.
  If the action is completely unrelated to a potential action to be taken on the page, return an empty object. 
  ONLY return one action. If multiple actions are relevant, return the most relevant one. 
  If the user is asking to scroll to a position on the page, e.g., 'halfway' or 0.75, etc, you must return the argument formatted as the correct percentage, e.g., '50%' or '75%', etc.
  If the user is asking to scroll to the next chunk/previous chunk, choose the nextChunk/prevChunk method. No arguments are required here.
  If the action implies a key press, e.g., 'press enter', 'press a', 'press space', etc., always choose the press method with the appropriate key as argument — e.g. 'a', 'Enter', 'Space'. Do not choose a click action on an on-screen keyboard. Capitalize the first character like 'Enter', 'Tab', 'Escape' only for special keys. 
  `;

  // Nothing to append when no variables were supplied.
  const variableKeys = variables ? Object.keys(variables) : [];
  if (variableKeys.length === 0) {
    return basePrompt;
  }

  // Expose variable names only, wrapped as %name% placeholders.
  const placeholders = variableKeys.map((key) => `%${key}%`).join(", ");
  return `${basePrompt} The following variables are available to use in the action: ${placeholders}. Fill the argument variables with the variable name.`;
}

/**
 * Builds the system-role chat message for the operator agent.
 *
 * @param goal - The user's goal, embedded under the "Your current goal" heading.
 * @returns A `system` message listing the available tools and guidelines.
 */
export function buildOperatorSystemPrompt(goal: string): ChatMessage {
  const content = `You are a general-purpose agent whose job is to accomplish the user's goal across multiple model calls by running actions on the page.

You will be given a goal and a list of steps that have been taken so far. Your job is to determine if either the user's goal has been completed or if there are still steps that need to be taken.

# Your current goal
${goal}

# CRITICAL: You MUST use the provided tools to take actions. Do not just describe what you want to do - actually call the appropriate tools.

# Available tools and when to use them:
- \`act\`: Use this to interact with the page (click, type, navigate, etc.)
- \`extract\`: Use this to get information from the page
- \`goto\`: Use this to navigate to a specific URL
- \`wait\`: Use this to wait for a period of time
- \`navback\`: Use this to go back to the previous page
- \`refresh\`: Use this to refresh the current page
- \`close\`: Use this ONLY when the task is complete or cannot be achieved
- External tools: Use any additional tools (like search tools) as needed for your goal

# Important guidelines
1. ALWAYS use tools - never just provide text responses about what you plan to do
2. Break down complex actions into individual atomic steps
3. For \`act\` commands, use only one action at a time, such as:
   - Single click on a specific element
   - Type into a single input field
   - Select a single option
4. Avoid combining multiple actions in one instruction
5. If multiple actions are needed, they should be separate steps
6. Only use \`close\` when the task is genuinely complete or impossible to achieve`;

  return { role: "system", content };
}

/**
 * Builds the default system prompt for computer-use agents.
 *
 * @returns The prompt text, including the current date (the date portion of
 *   `Date#toISOString`).
 */
export function buildCuaDefaultSystemPrompt(): string {
  // Everything before the "T" in the ISO timestamp is the calendar date.
  const [today] = new Date().toISOString().split("T");
  return `You are a helpful assistant that can use a web browser.\nDo not ask follow up questions, the user will trust your judgement. Today's date is ${today}.`;
}

/**
 * Builds the system-role chat message for the Google computer-use agent.
 *
 * @returns A `system` message that includes the current date (the date
 *   portion of `Date#toISOString`).
 */
export function buildGoogleCUASystemPrompt(): ChatMessage {
  // Everything before the "T" in the ISO timestamp is the calendar date.
  const [today] = new Date().toISOString().split("T");
  const content = `You are a general-purpose browser agent whose job is to accomplish the user's goal.
Today's date is ${today}.
You have access to a search tool; however, in most cases you should operate within the page/url the user has provided. ONLY use the search tool if you're stuck or the task is impossible to complete within the current page.
You will be given a goal and a list of steps that have been taken so far. Avoid requesting the user for input as much as possible. Good luck!
`;

  return { role: "system", content };
}


================================================
FILE: packages/core/lib/utils.ts
================================================
import { ZodSchemaValidationError } from "./v3/types/public/sdkErrors.js";
import { Schema, Type } from "@google/genai";
import { z, ZodTypeAny } from "zod";
import z3 from "zod/v3";
import { LogLine } from "./v3/types/public/logs.js";
import { ModelProvider } from "./v3/types/public/model.js";
import { ZodPathSegments } from "./v3/types/private/internal.js";
import type { StagehandZodSchema } from "./v3/zodCompat.js";
import { isZod4Schema } from "./v3/zodCompat.js";

// Matches element IDs of the form "<digits>-<digits>" (e.g. "0-432").
const ID_PATTERN = /^\d+-\d+$/;

// Zod factory namespaces keyed by major version. The v3 namespace is cast to
// the v4 typings so callers can use either one through a single type.
const zFactories = {
  v4: z,
  v3: z3 as unknown as typeof z,
};

/**
 * Picks the Zod factory namespace that matches the given schema's version.
 *
 * @param schema - Schema whose version decides the factory.
 * @returns The v4 factory when `isZod4Schema` accepts the schema, else the v3 one.
 */
export function getZFactory(schema: StagehandZodSchema): typeof z {
  if (isZod4Schema(schema)) {
    return zFactories.v4;
  }
  return zFactories.v3;
}

// Normalizes raw schema type tags to the lowercase kind names used throughout
// this module. Both the "Zod*" class-style names and the lowercase tags are
// accepted; `getZodType` falls back to the raw tag for anything not listed.
const TYPE_NAME_MAP: Record<string, string> = {
  ZodString: "string",
  string: "string",
  ZodNumber: "number",
  number: "number",
  ZodBoolean: "boolean",
  boolean: "boolean",
  ZodObject: "object",
  object: "object",
  ZodArray: "array",
  array: "array",
  ZodUnion: "union",
  union: "union",
  ZodIntersection: "intersection",
  intersection: "intersection",
  ZodOptional: "optional",
  optional: "optional",
  ZodNullable: "nullable",
  nullable: "nullable",
  ZodLiteral: "literal",
  literal: "literal",
  ZodEnum: "enum",
  enum: "enum",
  ZodDefault: "default",
  default: "default",
  ZodEffects: "effects",
  effects: "effects",
  pipe: "pipe",
};

/** Reads the `_zod.def` record from a schema, or `undefined` when absent. */
function getZ4Def(schema: StagehandZodSchema) {
  const internals = schema as SchemaInternals;
  return internals._zod?.def as Record<string, unknown> | undefined;
}

/** Reads the `_zod.bag` record from a schema, or `undefined` when absent. */
function getZ4Bag(schema: StagehandZodSchema) {
  const internals = schema as SchemaInternals;
  return internals._zod?.bag as Record<string, unknown> | undefined;
}

/** Reads the `_def` record from a schema, or `undefined` when absent. */
function getZ3Def(schema: StagehandZodSchema) {
  const internals = schema as SchemaInternals;
  return internals._def as Record<string, unknown> | undefined;
}

/**
 * Returns the field map of an object schema.
 *
 * The `_zod.def.shape` value wins when present; otherwise `_def.shape` is
 * used, and invoked first if it is stored as a function.
 *
 * @returns The shape record, or `undefined` when neither def carries one.
 */
function getObjectShape(
  schema: StagehandZodSchema,
): Record<string, StagehandZodSchema> | undefined {
  type Shape = Record<string, StagehandZodSchema>;

  const v4Shape = getZ4Def(schema)?.shape as Shape | undefined;
  if (v4Shape) {
    return v4Shape;
  }

  const v3Shape = getZ3Def(schema)?.shape;
  if (!v3Shape) {
    return undefined;
  }

  // The v3-style def may store the shape lazily behind a thunk.
  return typeof v3Shape === "function"
    ? (v3Shape as () => Shape)()
    : (v3Shape as Shape);
}

/**
 * Returns the element schema of an array schema: `_zod.def.element` when
 * set, otherwise `_def.type`.
 */
function getArrayElement(
  schema: StagehandZodSchema,
): StagehandZodSchema | undefined {
  const element = getZ4Def(schema)?.element ?? getZ3Def(schema)?.type;
  return element as StagehandZodSchema | undefined;
}

/**
 * Returns the wrapped schema of a wrapper schema: `_zod.def.innerType` when
 * set, otherwise `_def.innerType`.
 */
function getInnerType(
  schema: StagehandZodSchema,
): StagehandZodSchema | undefined {
  const inner = getZ4Def(schema)?.innerType ?? getZ3Def(schema)?.innerType;
  return inner as StagehandZodSchema | undefined;
}

/**
 * Returns the member schemas of a union, preferring `_zod.def.options` and
 * falling back to `_def.options`.
 *
 * @returns The options array, or `undefined` when neither def holds an array.
 */
function getUnionOptions(
  schema: StagehandZodSchema,
): StagehandZodSchema[] | undefined {
  const v4Options = getZ4Def(schema)?.options;
  if (Array.isArray(v4Options)) {
    return v4Options as StagehandZodSchema[];
  }

  const v3Options = getZ3Def(schema)?.options;
  if (Array.isArray(v3Options)) {
    return v3Options as StagehandZodSchema[];
  }

  return undefined;
}

/**
 * Returns both operands of an intersection schema.
 *
 * The `_zod.def` record is used when it carries at least one side; otherwise
 * both sides are read from `_def`.
 */
function getIntersectionSides(schema: StagehandZodSchema): {
  left?: StagehandZodSchema;
  right?: StagehandZodSchema;
} {
  const v4Def = getZ4Def(schema);
  // Only consult the fallback def when the first one has neither side.
  const def = v4Def?.left || v4Def?.right ? v4Def : getZ3Def(schema);

  return {
    left: def?.left as StagehandZodSchema | undefined,
    right: def?.right as StagehandZodSchema | undefined,
  };
}

/**
 * Returns the allowed values of an enum schema: the values of
 * `_zod.def.entries` when that is an object, otherwise the `_def.values`
 * array.
 *
 * @returns The enum values, or `undefined` when neither source is usable.
 */
function getEnumValues(schema: StagehandZodSchema): string[] | undefined {
  const entries = getZ4Def(schema)?.entries;
  if (entries && typeof entries === "object") {
    return Object.values(entries as Record<string, string>);
  }

  const values = getZ3Def(schema)?.values;
  if (!Array.isArray(values)) {
    return undefined;
  }
  return values as string[];
}

/**
 * Returns the literal value(s) of a literal schema as an array: the
 * `_zod.def.values` array when present, otherwise `_def.value` wrapped in a
 * one-element array (or an empty array when it is undefined).
 */
function getLiteralValues(schema: StagehandZodSchema): unknown[] {
  const v4Values = getZ4Def(schema)?.values;
  if (Array.isArray(v4Values)) {
    return v4Values as unknown[];
  }

  const single = getZ3Def(schema)?.value;
  return single === undefined ? [] : [single];
}

/**
 * Returns the `checks` array attached to a string schema, preferring
 * `_zod.def.checks` over `_def.checks`; empty when neither is an array.
 */
function getStringChecks(schema: StagehandZodSchema): unknown[] {
  const v4Checks = getZ4Def(schema)?.checks;
  if (Array.isArray(v4Checks)) {
    return v4Checks;
  }

  const v3Checks = getZ3Def(schema)?.checks;
  if (Array.isArray(v3Checks)) {
    return v3Checks;
  }
  return [];
}

/**
 * Returns the string `format` tag of a schema, if any.
 *
 * Sources are consulted in order and the first string wins:
 * `_zod.bag.format`, `_zod.def.format`, then `_def.format`.
 */
function getStringFormat(schema: StagehandZodSchema): string | undefined {
  // Thunks keep each lookup lazy so later sources are only read when needed.
  const sources: Array<() => unknown> = [
    () => getZ4Bag(schema)?.format,
    () => getZ4Def(schema)?.format,
    () => getZ3Def(schema)?.format,
  ];

  for (const read of sources) {
    const format = read();
    if (typeof format === "string") {
      return format;
    }
  }
  return undefined;
}

/**
 * Returns the `in` / `out` schemas stored on `_zod.def` for a pipe schema.
 *
 * @returns Both endpoints when at least one is set; otherwise an empty object.
 */
function getPipeEndpoints(schema: StagehandZodSchema): {
  in?: StagehandZodSchema;
  out?: StagehandZodSchema;
} {
  const def = getZ4Def(schema);
  const hasEndpoint = Boolean(def?.in || def?.out);
  if (!hasEndpoint) {
    return {};
  }

  return {
    in: def?.in as StagehandZodSchema | undefined,
    out: def?.out as StagehandZodSchema | undefined,
  };
}

/** Returns the schema wrapped by an effects schema (`_def.schema`), if any. */
function getEffectsBaseSchema(
  schema: StagehandZodSchema,
): StagehandZodSchema | undefined {
  const def = getZ3Def(schema);
  return def?.schema as StagehandZodSchema | undefined;
}

// Structural view of the internal fields this module reads off a schema:
// `_zod.def` / `_zod.bag` (read by getZ4Def / getZ4Bag) and `_def` (read by
// getZ3Def). Everything is optional because a given schema carries only some.
type SchemaInternals = {
  _zod?: { def?: Record<string, unknown>; bag?: Record<string, unknown> };
  _def?: Record<string, unknown>;
};

/**
 * Validates `data` against `schema` using `safeParse`.
 *
 * @param schema - Schema to validate with.
 * @param data - Value to validate.
 * @returns `true` when the data parses successfully.
 * @throws ZodSchemaValidationError carrying the data and the formatted parse
 *   error when validation fails.
 */
export function validateZodSchema(schema: StagehandZodSchema, data: unknown) {
  const outcome = schema.safeParse(data);

  if (!outcome.success) {
    throw new ZodSchemaValidationError(data, outcome.error.format());
  }
  return true;
}

/**
 * Reports whether the current runtime is Bun.
 *
 * The check is defensive: `process` and `process.versions` may be missing in
 * non-Node-like environments, in which case the answer is `false`.
 *
 * @returns `true` when `process.versions` has a `bun` entry.
 */
export function isRunningInBun(): boolean {
  if (typeof process === "undefined") {
    return false;
  }
  if (typeof process.versions === "undefined") {
    return false;
  }
  return "bun" in process.versions;
}

/*
 * Helper functions for converting between Gemini and Zod schemas
 */

/**
 * Copies nullability and description from a Zod schema onto a Gemini schema.
 *
 * Mutates and returns `geminiSchema`: `nullable` is filled from
 * `zodSchema.isOptional()` only when not already set, and `description` is
 * copied only when the Zod schema has a non-empty one.
 */
function decorateGeminiSchema(
  geminiSchema: Schema,
  zodSchema: z.ZodTypeAny,
): Schema {
  const nullableUnset = geminiSchema.nullable === undefined;
  if (nullableUnset) {
    geminiSchema.nullable = zodSchema.isOptional();
  }

  const description = zodSchema.description;
  if (description) {
    geminiSchema.description = description;
  }

  return geminiSchema;
}

/**
 * Converts a Zod schema into the Gemini `Schema` representation.
 *
 * Arrays and objects are converted recursively; `default`, `nullable` and
 * `optional` wrappers become their inner schema marked `nullable: true`;
 * enums and literals become string enums; a pipe is converted from its input
 * side when one is available. Every other kind (including plain strings and
 * unknown types) is emitted as a string.
 *
 * @param zodSchema - Schema to convert.
 * @returns The equivalent Gemini schema.
 */
export function toGeminiSchema(zodSchema: StagehandZodSchema): Schema {
  const normalizedSchema = zodSchema as z.ZodTypeAny;
  // Applies nullability/description of the current schema to a fresh result.
  const decorate = (partial: Schema): Schema =>
    decorateGeminiSchema(partial, normalizedSchema);

  const kind = getZodType(zodSchema);

  if (kind === "array") {
    const element = getArrayElement(zodSchema) ?? z.any();
    return decorate({ type: Type.ARRAY, items: toGeminiSchema(element) });
  }

  if (kind === "object") {
    const properties: Record<string, Schema> = {};
    const required: string[] = [];

    const shape = getObjectShape(zodSchema);
    if (shape) {
      for (const [key, value] of Object.entries(shape)) {
        properties[key] = toGeminiSchema(value);
        // Only explicitly optional fields are left out of `required`.
        if (getZodType(value) !== "optional") {
          required.push(key);
        }
      }
    }

    return decorate({
      type: Type.OBJECT,
      properties,
      required: required.length > 0 ? required : undefined,
    });
  }

  if (kind === "number") {
    return decorate({ type: Type.NUMBER });
  }

  if (kind === "boolean") {
    return decorate({ type: Type.BOOLEAN });
  }

  if (kind === "enum") {
    return decorate({ type: Type.STRING, enum: getEnumValues(zodSchema) });
  }

  if (kind === "default" || kind === "nullable" || kind === "optional") {
    const inner = getInnerType(zodSchema) ?? z.any();
    return decorate({ ...toGeminiSchema(inner), nullable: true });
  }

  if (kind === "literal") {
    return decorate({
      type: Type.STRING,
      enum: getLiteralValues(zodSchema) as string[],
    });
  }

  if (kind === "pipe") {
    const { in: input } = getPipeEndpoints(zodSchema);
    if (input) {
      return toGeminiSchema(input);
    }
  }

  // Strings, pipes without an input side, standalone transforms and any
  // unknown types are all represented as a plain string.
  return decorate({ type: Type.STRING });
}

/**
 * Returns the normalized kind name of a schema.
 *
 * The raw tag is taken from the first defined value among `_zod.def.type`,
 * `_def.typeName` and `_def.type`, then mapped through `TYPE_NAME_MAP`.
 *
 * @returns The mapped kind, the raw tag when it has no mapping, or
 *   `"unknown"` when no tag is present.
 */
export function getZodType(schema: StagehandZodSchema): string {
  const internals = schema as SchemaInternals & {
    _zod?: { def?: { type?: string } };
  };

  const v4Tag = internals._zod?.def?.type as string | undefined;
  const rawType =
    v4Tag ??
    (internals._def?.typeName as string | undefined) ??
    (internals._def?.type as string | undefined);

  if (rawType) {
    return TYPE_NAME_MAP[rawType] ?? rawType;
  }
  return "unknown";
}

/**
 * Recursively traverses a given Zod schema, scanning for any fields of type `z.string().url()`.
 * Each such field is replaced with an element-ID string schema built by `makeIdStringSchema`
 * (a string constrained to the `frameId-backendId` pattern), not with a number schema.
 *
 * This function is used internally by higher-level utilities (e.g., transforming entire object schemas)
 * and handles nested objects, arrays, unions, intersections, optionals, nullables, pipes and effects.
 * Container schemas are rebuilt only when at least one descendant changed; otherwise the original
 * schema instance is returned so callers can detect changes by identity.
 *
 * @param schema - The Zod schema to transform.
 * @param currentPath - An array of string/number keys representing the current schema path. It is only
 *   threaded through the recursion; the returned segments are built relative to each node.
 * @returns A two-element tuple:
 *   1. The updated Zod schema, with any `.url()` fields replaced by the element-ID string schema.
 *   2. An array of {@link ZodPathSegments} objects representing each replaced field, including the path segments
 *      (object keys, and `"*"` for array items).
 */
export function transformSchema(
  schema: StagehandZodSchema,
  currentPath: Array<string | number>,
): [StagehandZodSchema, ZodPathSegments[]] {
  // Leaf case: a string is replaced when any check or its format marks it as a URL.
  if (isKind(schema, "string")) {
    const checks = getStringChecks(schema);
    const format = getStringFormat(schema);
    const hasUrlCheck =
      checks.some((check) => {
        // A check may expose the URL marker in several shapes; accept any of them.
        const candidate = check as {
          kind?: string;
          format?: string;
          _zod?: { def?: { check?: string; format?: string } };
        };
        return (
          candidate.kind === "url" ||
          candidate.format === "url" ||
          candidate._zod?.def?.check === "url" ||
          candidate._zod?.def?.format === "url"
        );
      }) || format === "url";

    if (hasUrlCheck) {
      // Empty segments: the replaced field is this node itself; parents prepend their keys.
      return [makeIdStringSchema(schema), [{ segments: [] }]];
    }
    return [schema, []];
  }

  // Objects: transform every field and prefix child paths with the field key.
  if (isKind(schema, "object")) {
    const shape = getObjectShape(schema);
    if (!shape) {
      return [schema, []];
    }
    const newShape: Record<string, StagehandZodSchema> = {};
    const urlPaths: ZodPathSegments[] = [];
    let changed = false;

    for (const key of Object.keys(shape)) {
      const child = shape[key];
      const [transformedChild, childPaths] = transformSchema(child, [
        ...currentPath,
        key,
      ]);
      if (transformedChild !== child) {
        changed = true;
      }
      newShape[key] = transformedChild;
      childPaths.forEach((cp) => {
        urlPaths.push({ segments: [key, ...cp.segments] });
      });
    }

    if (changed) {
      // Rebuild with the factory matching the original schema's Zod version.
      const factory = getZFactory(schema);
      return [
        factory.object(newShape as Record<string, z.ZodTypeAny>),
        urlPaths,
      ];
    }
    return [schema, urlPaths];
  }

  // Arrays: transform the element schema and prefix child paths with "*".
  if (isKind(schema, "array")) {
    const itemType = getArrayElement(schema);
    if (!itemType) {
      return [schema, []];
    }
    const [transformedItem, childPaths] = transformSchema(itemType, [
      ...currentPath,
      "*",
    ]);
    const arrayPaths: ZodPathSegments[] = childPaths.map((cp) => ({
      segments: ["*", ...cp.segments],
    }));
    if (transformedItem !== itemType) {
      const factory = getZFactory(schema);
      return [
        factory.array(transformedItem as unknown as z.ZodTypeAny),
        arrayPaths,
      ];
    }
    return [schema, arrayPaths];
  }

  // Unions: transform each option; child paths are passed through without a prefix.
  if (isKind(schema, "union")) {
    const unionOptions = getUnionOptions(schema);
    if (!unionOptions || unionOptions.length === 0) {
      return [schema, []];
    }
    const newOptions: StagehandZodSchema[] = [];
    let changed = false;
    let allPaths: ZodPathSegments[] = [];

    unionOptions.forEach((option, idx) => {
      const [newOption, childPaths] = transformSchema(option, [
        ...currentPath,
        `union_${idx}`,
      ]);
      if (newOption !== option) {
        changed = true;
      }
      newOptions.push(newOption);
      allPaths = [...allPaths, ...childPaths];
    });

    if (changed) {
      const factory = getZFactory(schema);
      return [
        factory.union(
          newOptions as unknown as [
            z.ZodTypeAny,
            z.ZodTypeAny,
            ...z.ZodTypeAny[],
          ],
        ),
        allPaths,
      ];
    }
    return [schema, allPaths];
  }

  // Intersections: transform both sides; child paths are passed through without a prefix.
  if (isKind(schema, "intersection")) {
    const { left, right } = getIntersectionSides(schema);
    if (!left || !right) {
      return [schema, []];
    }
    const [newLeft, leftPaths] = transformSchema(left, [
      ...currentPath,
      "intersection_left",
    ]);
    const [newRight, rightPaths] = transformSchema(right, [
      ...currentPath,
      "intersection_right",
    ]);
    const changed = newLeft !== left || newRight !== right;
    const allPaths = [...leftPaths, ...rightPaths];
    if (changed) {
      const factory = getZFactory(schema);
      return [
        factory.intersection(
          newLeft as unknown as z.ZodTypeAny,
          newRight as unknown as z.ZodTypeAny,
        ),
        allPaths,
      ];
    }
    return [schema, allPaths];
  }

  // Optional wrapper: transform the inner schema and re-wrap it when it changed.
  if (isKind(schema, "optional")) {
    const innerType = getInnerType(schema);
    if (!innerType) {
      return [schema, []];
    }
    const [inner, innerPaths] = transformSchema(innerType, currentPath);
    if (inner !== innerType) {
      return [
        (inner as z.ZodTypeAny).optional() as unknown as StagehandZodSchema,
        innerPaths,
      ];
    }
    return [schema, innerPaths];
  }

  // Nullable wrapper: same treatment as optional.
  if (isKind(schema, "nullable")) {
    const innerType = getInnerType(schema);
    if (!innerType) {
      return [schema, []];
    }
    const [inner, innerPaths] = transformSchema(innerType, currentPath);
    if (inner !== innerType) {
      return [
        (inner as z.ZodTypeAny).nullable() as unknown as StagehandZodSchema,
        innerPaths,
      ];
    }
    return [schema, innerPaths];
  }

  // Pipes (Zod 4 schemas only): transform both endpoints and rebuild the pipe when either changed.
  if (isKind(schema, "pipe") && isZod4Schema(schema)) {
    const { in: inSchema, out: outSchema } = getPipeEndpoints(schema);
    if (!inSchema || !outSchema) {
      return [schema, []];
    }

    const [newIn, inPaths] = transformSchema(inSchema, currentPath);
    const [newOut, outPaths] = transformSchema(outSchema, currentPath);
    const allPaths = [...inPaths, ...outPaths];

    if (newIn !== inSchema || newOut !== outSchema) {
      const result = z.pipe(
        newIn as unknown as z.ZodTypeAny,
        newOut as unknown as z.ZodTypeAny,
      ) as StagehandZodSchema;
      return [result, allPaths];
    }
    return [schema, allPaths];
  }

  // Effects: continue with the wrapped base schema. Note that the result is the
  // (transformed) base schema itself, so the effects wrapper is not preserved.
  if (isKind(schema, "effects")) {
    const baseSchema = getEffectsBaseSchema(schema);
    if (!baseSchema) {
      return [schema, []];
    }
    return transformSchema(baseSchema, currentPath);
  }

  // Any other kind is returned untouched.
  return [schema, []];
}

/**
 * Walks an extracted object along `path` and swaps element IDs for real URLs.
 *
 * A value counts as an ID when it is a number (stringified for the lookup) or
 * a string matching `ID_PATTERN`. IDs missing from `idToUrlMapping` are
 * replaced with an empty string; non-ID values are left untouched. A `"*"`
 * path segment means "every item of the array at this position". The object
 * is mutated in place.
 *
 * @param obj - Object or array to update.
 * @param path - Remaining path segments to follow.
 * @param idToUrlMapping - Lookup from element ID to URL.
 */
export function injectUrls(
  obj: unknown,
  path: Array<string | number>,
  idToUrlMapping: Record<string, string>,
): void {
  if (path.length === 0) return;

  const [head, ...tail] = path;
  const atLeaf = tail.length === 0;

  // Returns the replacement URL for an ID-like value, or undefined when the
  // value is not an ID and must be left as-is.
  const resolveUrl = (value: unknown): string | undefined => {
    let id: string | undefined;
    if (typeof value === "number") {
      id = String(value);
    } else if (typeof value === "string" && ID_PATTERN.test(value)) {
      id = value;
    }
    return id === undefined ? undefined : (idToUrlMapping[id] ?? "");
  };

  if (head === "*") {
    // A wildcard only applies to arrays; anything else is ignored.
    if (!Array.isArray(obj)) return;

    if (atLeaf) {
      for (const [index, entry] of obj.entries()) {
        const url = resolveUrl(entry);
        if (url !== undefined) {
          obj[index] = url;
        }
      }
      return;
    }

    for (const item of obj) {
      injectUrls(item, tail, idToUrlMapping);
    }
    return;
  }

  if (!obj || typeof obj !== "object") return;

  const record = obj as Record<string | number, unknown>;
  if (!atLeaf) {
    injectUrls(record[head], tail, idToUrlMapping);
    return;
  }

  const url = resolveUrl(record[head]);
  if (url !== undefined) {
    record[head] = url;
  }
}

/**
 * Checks whether a schema's normalized kind equals `kind`.
 * Any error raised while inspecting the schema is treated as "no match".
 */
function isKind(s: StagehandZodSchema, kind: string): boolean {
  let actualKind: string;
  try {
    actualKind = getZodType(s);
  } catch {
    return false;
  }
  return actualKind === kind;
}

/**
 * Builds the string schema that stands in for a URL field: a string matching
 * `ID_PATTERN`, described as an element ID. When the original schema has a
 * non-blank description, it is appended to the generated description.
 *
 * @param orig - The URL schema being replaced; also selects the Zod factory.
 */
function makeIdStringSchema(orig: StagehandZodSchema): StagehandZodSchema {
  const base = `This field must be the element-ID in the form 'frameId-backendId' (e.g. "0-432").`;

  const userDesc =
    (orig as unknown as { description?: string }).description ?? "";
  const hasUserDesc = userDesc.trim().length > 0;

  let description = base;
  if (hasUserDesc) {
    description = `${base} that follows this user-defined description: ${userDesc}`;
  }

  return getZFactory(orig).string().regex(ID_PATTERN).describe(description);
}

/**
 * Mapping from LLM provider names to their corresponding environment variable names for API keys.
 * An array value lists several candidate variables; `loadApiKeyFromEnv` uses the first one
 * in the list that is set to a non-empty value.
 */
export const providerEnvVarMap: Partial<
  Record<ModelProvider | string, string | Array<string>>
> = {
  openai: "OPENAI_API_KEY",
  anthropic: "ANTHROPIC_API_KEY",
  google: ["GEMINI_API_KEY", "GOOGLE_GENERATIVE_AI_API_KEY", "GOOGLE_API_KEY"],
  vertex: "GOOGLE_VERTEX_AI_API_KEY",
  groq: "GROQ_API_KEY",
  cerebras: "CEREBRAS_API_KEY",
  togetherai: "TOGETHER_AI_API_KEY",
  mistral: "MISTRAL_API_KEY",
  deepseek: "DEEPSEEK_API_KEY",
  perplexity: "PERPLEXITY_API_KEY",
  azure: "AZURE_API_KEY",
  xai: "XAI_API_KEY",
  google_legacy: "GOOGLE_API_KEY",
};

// Providers with no entry in providerEnvVarMap for which `loadApiKeyFromEnv`
// stays silent instead of logging a "no known environment variable" message.
const providersWithoutApiKey = new Set(["bedrock", "ollama"]);

/**
 * Looks up a provider's API key in the environment.
 *
 * @param provider The name of the provider (e.g., 'openai', 'anthropic').
 * @param logger Logger invoked only when the provider has no known
 *   environment variable and is not in `providersWithoutApiKey`.
 * @returns The first non-empty key found among the provider's environment
 *   variables, or `undefined` when the provider is missing/unknown or no
 *   variable is set.
 */
export function loadApiKeyFromEnv(
  provider: string | undefined,
  logger: (logLine: LogLine) => void,
): string | undefined {
  if (!provider) {
    return undefined;
  }

  const envVarName = providerEnvVarMap[provider];
  if (!envVarName) {
    const keylessProvider = providersWithoutApiKey.has(provider);
    if (!keylessProvider) {
      logger({
        category: "init",
        message: `No known environment variable for provider '${provider}'`,
        level: 0,
      });
    }
    return undefined;
  }

  // Treat the single-name case as a one-element candidate list.
  const candidates = Array.isArray(envVarName) ? envVarName : [envVarName];
  for (const name of candidates) {
    const value = process.env[name];
    if (typeof value === "string" && value.length > 0) {
      return value;
    }
  }

  // Don't log - this is expected when llmClient is provided or API key will be set later
  return undefined;
}

/**
 * Strips a trailing `/text()` step (optionally indexed, e.g. `/text()[2]`)
 * from an XPath-like string. Matching is case-insensitive.
 *
 * @param path - The path to trim, if any.
 * @returns The trimmed path, or `undefined` when no path was given.
 */
export function trimTrailingTextNode(
  path: string | undefined,
): string | undefined {
  if (path == null) {
    return undefined;
  }
  return path.replace(/\/text\(\)(\[\d+\])?$/iu, "");
}

/**
 * Upper-cases the first character of every word in `str`.
 * The remaining characters of each word are left exactly as they were.
 *
 * @param str - Text to convert.
 * @returns The text with each word capitalized.
 */
export function toTitleCase(str: string): string {
  const capitalize = (word: string): string =>
    word.charAt(0).toUpperCase() + word.slice(1);
  return str.replace(/\w\S*/g, capitalize);
}

// TODO: move to separate types file
/**
 * The subset of JSON Schema fields understood by `jsonSchemaToZod`.
 * The shape is recursive through `items` (array element schema) and
 * `properties` (object field schemas).
 */
export interface JsonSchemaProperty {
  type: string;
  enum?: unknown[];
  items?: JsonSchemaProperty;
  properties?: Record<string, JsonSchemaProperty>;
  required?: string[];
  minimum?: number;
  maximum?: number;
  description?: string;
  format?: string; // JSON Schema format field (e.g., "uri", "url", "email", etc.)
}
/** Root JSON Schema node accepted by `jsonSchemaToZod`; same shape as a property. */
export interface JsonSchema extends JsonSchemaProperty {
  type: string;
}

/**
 * Converts a JSON Schema object to a Zod schema.
 *
 * Supported types are `object`, `array`, `string` (with `enum` and the
 * `uri`/`url`, `email` and `uuid` formats), `number` (with `minimum` /
 * `maximum`) and `boolean`; anything else becomes `z.any()`. A `description`
 * is carried over on every supported type.
 *
 * For objects with a `required` list, all fields are first made optional and
 * then the listed ones are made required. Entries in `required` that do not
 * name a declared property are ignored rather than passed on to Zod.
 *
 * @param schema The JSON Schema object to convert
 * @returns A Zod schema equivalent to the input JSON Schema
 */
export function jsonSchemaToZod(schema: JsonSchema): ZodTypeAny {
  switch (schema.type) {
    case "object": {
      if (!schema.properties) {
        const emptyObject = z.object({});
        return schema.description
          ? emptyObject.describe(schema.description)
          : emptyObject;
      }

      const shape: Record<string, ZodTypeAny> = {};
      for (const key in schema.properties) {
        shape[key] = jsonSchemaToZod(schema.properties[key]);
      }
      let zodObject = z.object(shape);
      if (schema.required && Array.isArray(schema.required)) {
        // Only keep names that are real properties: a mask key the object
        // does not declare is meaningless and can be rejected by Zod.
        const requiredFields = schema.required.reduce<Record<string, true>>(
          (acc, field) =>
            Object.prototype.hasOwnProperty.call(shape, field)
              ? { ...acc, [field]: true }
              : acc,
          {},
        );
        zodObject = zodObject.partial().required(requiredFields);
      }
      if (schema.description) {
        zodObject = zodObject.describe(schema.description);
      }
      return zodObject;
    }
    case "array": {
      // Without an item schema, accept elements of any type.
      let zodArray = z.array(
        schema.items ? jsonSchemaToZod(schema.items) : z.any(),
      );
      if (schema.description) {
        zodArray = zodArray.describe(schema.description);
      }
      return zodArray;
    }
    case "string": {
      if (schema.enum) {
        const allowedValues = schema.enum;
        const zodEnumString = z
          .string()
          .refine((val) => allowedValues.includes(val));
        return schema.description
          ? zodEnumString.describe(schema.description)
          : zodEnumString;
      }
      let zodString = z.string();

      // Handle JSON Schema format field
      if (schema.format === "uri" || schema.format === "url") {
        zodString = zodString.url();
      } else if (schema.format === "email") {
        zodString = zodString.email();
      } else if (schema.format === "uuid") {
        zodString = zodString.uuid();
      }
      // Add more format handlers as needed

      if (schema.description) {
        zodString = zodString.describe(schema.description);
      }
      return zodString;
    }
    case "number": {
      let zodNumber = z.number();
      if (schema.minimum !== undefined) {
        zodNumber = zodNumber.min(schema.minimum);
      }
      if (schema.maximum !== undefined) {
        zodNumber = zodNumber.max(schema.maximum);
      }
      if (schema.description) {
        zodNumber = zodNumber.describe(schema.description);
      }
      return zodNumber;
    }
    case "boolean": {
      let zodBoolean = z.boolean();
      if (schema.description) {
        zodBoolean = zodBoolean.describe(schema.description);
      }
      return zodBoolean;
    }
    default:
      return z.any();
  }
}


================================================
FILE: packages/core/lib/v3/agent/AgentClient.ts
================================================
import {
  AgentAction,
  AgentResult,
  AgentType,
  AgentExecutionOptions,
} from "../types/public/agent.js";
import { ClientOptions } from "../types/public/model.js";

/**
 * Abstract base class for agent clients
 * This provides a common interface for all agent implementations
 *
 * Subclasses implement execution, screenshot capture and the setters below;
 * the base class only stores the constructor arguments, an initially empty
 * `clientOptions`, and the optional pre-step hook.
 */
export abstract class AgentClient {
  /** Agent type supplied to the constructor. */
  public type: AgentType;
  /** Model name supplied to the constructor. */
  public modelName: string;
  /** Client options; initialized to an empty object by the constructor. */
  public clientOptions: ClientOptions;
  /** Optional user-provided instructions supplied to the constructor. */
  public userProvidedInstructions?: string;

  /**
   * @param type - Agent type to store on the instance.
   * @param modelName - Model name to store on the instance.
   * @param userProvidedInstructions - Optional user instructions to store.
   */
  constructor(
    type: AgentType,
    modelName: string,
    userProvidedInstructions?: string,
  ) {
    this.type = type;
    this.modelName = modelName;
    this.userProvidedInstructions = userProvidedInstructions;
    this.clientOptions = {};
  }

  /** Runs the agent with the given options and resolves with its result. */
  abstract execute(options: AgentExecutionOptions): Promise<AgentResult>;

  /** Captures a screenshot; the resolved value's shape is implementation-defined. */
  abstract captureScreenshot(
    options?: Record<string, unknown>,
  ): Promise<unknown>;

  /** Informs the client of the viewport dimensions. */
  abstract setViewport(width: number, height: number): void;

  /** Informs the client of the current page URL. */
  abstract setCurrentUrl(url: string): void;

  /** Registers the async callback the client uses to obtain a screenshot string. */
  abstract setScreenshotProvider(provider: () => Promise<string>): void;

  /** Registers the async callback that receives each agent action. */
  abstract setActionHandler(
    handler: (action: AgentAction) => Promise<void>,
  ): void;

  /** Optional hook called at the top of every step in the agent loop. */
  protected preStepHook?: () => Promise<void>;

  /** Stores the pre-step hook, replacing any previously set one. */
  setPreStepHook(handler: () => Promise<void>): void {
    this.preStepHook = handler;
  }

  /**
   * Optional ephemeral context note that should be sent to the next model turn.
   * Clients that do not support this can ignore it.
   */
  addContextNote(note: string): void {
    // Reference the parameter so it is not reported as unused.
    void note;
    // no-op by default
  }
}


================================================
FILE: packages/core/lib/v3/agent/AgentProvider.ts
================================================
import { ToolSet } from "ai/dist";
import { AgentProviderType } from "../types/public/agent.js";
import { LogLine } from "../types/public/logs.js";
import { ClientOptions } from "../types/public/model.js";
import {
  UnsupportedModelError,
  UnsupportedModelProviderError,
} from "../types/public/sdkErrors.js";
import { AgentClient } from "./AgentClient.js";
import { AnthropicCUAClient } from "./AnthropicCUAClient.js";
import { OpenAICUAClient } from "./OpenAICUAClient.js";
import { GoogleCUAClient } from "./GoogleCUAClient.js";
import { MicrosoftCUAClient } from "./MicrosoftCUAClient.js";

// Map model names to their provider types.
// Keys are bare model names (no "provider/" prefix); AgentProvider.getAgentProvider
// strips such a prefix before looking a model up here, and the key list is what
// it reports as the supported models when a lookup fails.
export const modelToAgentProviderMap: Record<string, AgentProviderType> = {
  "computer-use-preview": "openai",
  "computer-use-preview-2025-03-11": "openai",
  "claude-sonnet-4-20250514": "anthropic",
  "claude-sonnet-4-5-20250929": "anthropic",
  "claude-opus-4-5-20251101": "anthropic",
  "claude-opus-4-6": "anthropic",
  "claude-sonnet-4-6": "anthropic",
  "claude-haiku-4-5-20251001": "anthropic",
  "gemini-2.5-computer-use-preview-10-2025": "google",
  "gemini-3-flash-preview": "google",
  "gemini-3-pro-preview": "google",
  "fara-7b": "microsoft",
};

/**
 * Factory for computer-use agent clients.
 *
 * Resolves which provider backs a model (or honours an explicit
 * `clientOptions.provider`) and instantiates the matching client class.
 */
export class AgentProvider {
  private logger: (message: LogLine) => void;

  /**
   * Create a new agent provider.
   * @param logger - Sink for the log lines emitted while resolving clients.
   */
  constructor(logger: (message: LogLine) => void) {
    this.logger = logger;
  }

  /**
   * Build the agent client for a model.
   *
   * @param modelName - Model to run; may carry a "provider/" prefix.
   * @param clientOptions - Client options; a truthy `provider` field overrides
   *   the provider that would otherwise be derived from `modelName`.
   * @param userProvidedInstructions - Optional instructions forwarded to the client.
   * @param tools - Optional custom tools; forwarded to every client except the
   *   Microsoft one, whose constructor is not given them.
   * @returns The provider-specific client instance.
   * @throws UnsupportedModelError when no explicit provider is given and the
   *   model is not listed in `modelToAgentProviderMap` (raised before the
   *   try block, so it is not logged here).
   * @throws UnsupportedModelProviderError when the resolved provider has no
   *   client implementation. Errors raised while constructing a client are
   *   logged at level 0 and rethrown unchanged.
   */
  getClient(
    modelName: string,
    clientOptions?: ClientOptions,
    userProvidedInstructions?: string,
    tools?: ToolSet,
  ): AgentClient {
    // Check if provider is explicitly set in clientOptions
    const explicitProvider = clientOptions?.provider as
      | AgentProviderType
      | undefined;
    const type = explicitProvider || AgentProvider.getAgentProvider(modelName);

    this.logger({
      category: "agent",
      message: `Getting agent client for type: ${type}, model: ${modelName}${explicitProvider ? " (explicit provider)" : ""}`,
      level: 2,
    });

    try {
      switch (type) {
        case "openai":
          return new OpenAICUAClient(
            type,
            modelName,
            userProvidedInstructions,
            clientOptions,
            tools,
          );
        case "anthropic":
          return new AnthropicCUAClient(
            type,
            modelName,
            userProvidedInstructions,
            clientOptions,
            tools,
          );
        case "google":
          return new GoogleCUAClient(
            type,
            modelName,
            userProvidedInstructions,
            clientOptions,
            tools,
          );
        case "microsoft":
          return new MicrosoftCUAClient(
            type,
            modelName,
            userProvidedInstructions,
            clientOptions,
          );
        default:
          // Reachable when an explicit provider string is not one we implement
          throw new UnsupportedModelProviderError(
            ["openai", "anthropic", "google", "microsoft"],
            "Computer Use Agent",
          );
      }
    } catch (error) {
      const errorMessage =
        error instanceof Error ? error.message : String(error);
      this.logger({
        category: "agent",
        message: `Error creating agent client: ${errorMessage}`,
        level: 0,
      });
      throw error;
    }
  }

  /**
   * Look up the provider for a model name.
   *
   * @param modelName - Bare model name, or "provider/model"; when a slash is
   *   present only the segment after the first slash is used for the lookup.
   * @returns The provider registered for the model.
   * @throws UnsupportedModelError when the model is not a key of
   *   `modelToAgentProviderMap`.
   */
  static getAgentProvider(modelName: string): AgentProviderType {
    const normalized = modelName.includes("/")
      ? modelName.split("/")[1]
      : modelName;

    // Own-property check: the `in` operator also matches keys inherited from
    // Object.prototype ("constructor", "toString", ...), which would return a
    // function instead of rejecting the unknown model.
    if (
      Object.prototype.hasOwnProperty.call(modelToAgentProviderMap, normalized)
    ) {
      return modelToAgentProviderMap[normalized];
    }

    throw new UnsupportedModelError(
      Object.keys(modelToAgentProviderMap),
      "Computer Use Agent",
    );
  }
}


================================================
FILE: packages/core/lib/v3/agent/AnthropicCUAClient.ts
================================================
import {
  AgentAction,
  AgentResult,
  AgentType,
  AnthropicContentBlock,
  AnthropicMessage,
  AnthropicTextBlock,
  AnthropicToolResult,
  AgentExecutionOptions,
  ToolUseItem,
} from "../types/public/agent.js";
import { LogLine } from "../types/public/logs.js";
import { ClientOptions } from "../types/public/model.js";
import {
  AgentScreenshotProviderError,
  StagehandClosedError,
} from "../types/public/sdkErrors.js";
import Anthropic from "@anthropic-ai/sdk";
import { ToolSet } from "ai";
import { AgentClient } from "./AgentClient.js";
import { compressConversationImages } from "./utils/imageCompression.js";
import { toJsonSchema } from "../zodCompat.js";
import type { StagehandZodSchema } from "../zodCompat.js";
import {
  FlowLogger,
  extractLlmCuaPromptSummary,
  extractLlmCuaResponseSummary,
} from "../flowlogger/FlowLogger.js";
import { v7 as uuidv7 } from "uuid";

/**
 * One entry of the conversation list handed from step to step:
 * either a complete message or a standalone tool result.
 */
export type ResponseInputItem = AnthropicMessage | AnthropicToolResult;

/**
 * Client for Anthropic's Computer Use API
 * This implementation uses the official Anthropic Messages API for Computer Use
 */
export class AnthropicCUAClient extends AgentClient {
  private apiKey: string;
  private baseURL?: string;
  private client: Anthropic;
  public lastMessageId?: string;
  private currentViewport = { width: 1288, height: 711 };
  private currentUrl?: string;
  private screenshotProvider?: () => Promise<string>;
  private actionHandler?: (action: AgentAction) => Promise<void>;
  private thinkingBudget: number | null = null;
  private tools?: ToolSet;

  /**
   * @param type - Agent type, forwarded to the base class.
   * @param modelName - Model name, forwarded to the base class.
   * @param userProvidedInstructions - Optional instructions, later sent as the
   *   `system` parameter of each request.
   * @param clientOptions - Only `apiKey`, `baseURL` and `thinkingBudget` are read.
   * @param tools - Optional custom tools offered alongside the computer tool.
   */
  constructor(
    type: AgentType,
    modelName: string,
    userProvidedInstructions?: string,
    clientOptions?: ClientOptions,
    tools?: ToolSet,
  ) {
    super(type, modelName, userProvidedInstructions);

    // API key precedence: explicit option, then environment, then empty string
    const optionKey = clientOptions?.apiKey as string;
    this.apiKey = optionKey || process.env.ANTHROPIC_API_KEY || "";

    const optionBaseURL = clientOptions?.baseURL as string;
    this.baseURL = optionBaseURL || undefined;

    // Only a truthy numeric budget enables thinking
    const budget = clientOptions?.thinkingBudget;
    if (budget && typeof budget === "number") {
      this.thinkingBudget = budget;
    }

    // Keep just the options that are handed to the SDK
    this.clientOptions = {
      apiKey: this.apiKey,
    };
    if (this.baseURL) {
      this.clientOptions.baseURL = this.baseURL;
    }

    this.client = new Anthropic(this.clientOptions);

    this.tools = tools;
  }

  /** Record the viewport size that is reported to the model as the display size. */
  setViewport(width: number, height: number): void {
    this.currentViewport = { width, height };
  }

  /** Record the current URL; when set, it is appended as text to computer tool results. */
  setCurrentUrl(url: string): void {
    this.currentUrl = url;
  }

  /**
   * Register the screenshot source used by `captureScreenshot`.
   * The provider's result is prefixed with `data:image/png;base64,`, so it is
   * expected to resolve with the base64 payload only.
   */
  setScreenshotProvider(provider: () => Promise<string>): void {
    this.screenshotProvider = provider;
  }

  /** Register the callback invoked for every action extracted from a model response. */
  setActionHandler(handler: (action: AgentAction) => Promise<void>): void {
    this.actionHandler = handler;
  }

  /** Replace the set of custom tools offered to the model alongside the computer tool. */
  setTools(tools: ToolSet): void {
    this.tools = tools;
  }

  /**
   * Run the Anthropic agent loop for a single instruction.
   *
   * Steps are executed until one of them produces no tool calls or the step
   * limit (`options.maxSteps`, falling back to 10) is reached. Errors raised
   * inside the loop are logged and reported through the returned result
   * rather than thrown.
   * @implements AgentClient.execute
   */
  async execute(executionOptions: AgentExecutionOptions): Promise<AgentResult> {
    const { options, logger } = executionOptions;
    const { instruction } = options;
    const maxSteps = options.maxSteps || 10;

    const actions: AgentAction[] = [];
    const messageList: string[] = [];
    // Running totals across all steps
    const totals = { input_tokens: 0, output_tokens: 0, inference_time_ms: 0 };
    let finalMessage = "";
    let completed = false;

    // Seed the conversation with the initial instruction
    let inputItems: ResponseInputItem[] =
      this.createInitialInputItems(instruction);

    logger({
      category: "agent",
      message: `Starting Anthropic agent execution with instruction: ${instruction}`,
      level: 1,
    });

    try {
      for (let stepIndex = 0; stepIndex < maxSteps && !completed; stepIndex++) {
        await this.preStepHook?.();

        const stepNumber = stepIndex + 1;
        logger({
          category: "agent",
          message: `Executing step ${stepNumber}/${maxSteps}`,
          level: 1,
        });

        const step = await this.executeStep(inputItems, logger);
        totals.input_tokens += step.usage.input_tokens;
        totals.output_tokens += step.usage.output_tokens;
        totals.inference_time_ms += step.usage.inference_time_ms;

        if (step.actions.length > 0) {
          logger({
            category: "agent",
            message: `Step ${stepNumber} performed ${step.actions.length} actions`,
            level: 2,
          });
          actions.push(...step.actions);
        }

        completed = step.completed;

        // Only carry the conversation forward when another step will run
        if (!completed) {
          inputItems = step.nextInputItems;
        }

        // The most recent non-empty message becomes the final message
        if (step.message) {
          messageList.push(step.message);
          finalMessage = step.message;
        }
      }

      logger({
        category: "agent",
        message: `Anthropic agent execution completed: ${completed}, with ${actions.length} total actions performed`,
        level: 1,
      });

      return {
        success: completed,
        actions,
        message: finalMessage,
        completed,
        usage: { ...totals },
      };
    } catch (error) {
      const errorMessage =
        error instanceof Error ? error.message : String(error);
      logger({
        category: "agent",
        message: `Error executing agent task: ${errorMessage}`,
        level: 0,
      });

      // Report the failure together with whatever was accumulated so far
      return {
        success: false,
        actions,
        message: `Failed to execute task: ${errorMessage}`,
        completed: false,
        usage: { ...totals },
      };
    }
  }

  /**
   * Run one turn of the agent loop: query the model, execute the actions it
   * requested, and assemble the conversation for the next turn.
   *
   * @param inputItems - Conversation so far; it is copied, not reassigned.
   * @param logger - Sink for progress and error log lines.
   * @returns The actions found in the response, the concatenated text blocks
   *   (trimmed), whether the step finished the task (no `tool_use` blocks),
   *   the conversation extended with the assistant message and any tool
   *   results, and the token/latency usage of the model call.
   * @throws Rethrows any error after logging it. Failures of individual
   *   actions are logged and swallowed, except `StagehandClosedError`.
   */
  async executeStep(
    inputItems: ResponseInputItem[],
    logger: (message: LogLine) => void,
  ): Promise<{
    actions: AgentAction[];
    message: string;
    completed: boolean;
    nextInputItems: ResponseInputItem[];
    usage: {
      input_tokens: number;
      output_tokens: number;
      inference_time_ms: number;
    };
  }> {
    try {
      // Get response from the model
      const result = await this.getAction(inputItems);
      const content = result.content;
      const usage = {
        input_tokens: result.usage.input_tokens,
        output_tokens: result.usage.output_tokens,
        inference_time_ms: result.usage.inference_time_ms,
      };

      logger({
        category: "agent",
        message: `Received response with ${content.length} content blocks`,
        level: 2,
      });

      // Extract actions from the content
      const stepActions: AgentAction[] = [];
      const toolUseItems: ToolUseItem[] = [];
      let message = "";

      // Process content blocks to find tool use items and text content
      for (const block of content) {
        logger({
          category: "agent",
          message: `Processing block type: ${block.type}, id: ${block.id || "unknown"}`,
          level: 2,
        });

        if (block.type === "tool_use") {
          // Direct handling of tool_use type
          logger({
            category: "agent",
            message: `Found tool_use block: ${JSON.stringify(block)}`,
            level: 2,
          });

          // Cast to ToolUseItem and add to list
          const toolUseItem = block as ToolUseItem;
          toolUseItems.push(toolUseItem);

          logger({
            category: "agent",
            message: `Added tool_use item: ${toolUseItem.name}, action: ${JSON.stringify(toolUseItem.input)}`,
            level: 2,
          });

          // Convert tool use to action and add to actions list
          const action = this.convertToolUseToAction(toolUseItem);
          if (action) {
            logger({
              category: "agent",
              message: `Created action from tool_use: ${toolUseItem.name}, action: ${action.type}`,
              level: 2,
            });
            stepActions.push(action);
          } else if (this.tools && toolUseItem.name in this.tools) {
            // Custom tools have no converted action; record a marker action instead
            stepActions.push({
              type: "custom_tool",
              tool: toolUseItem.name,
              input: toolUseItem.input,
            } as AgentAction);
          }
        } else if (block.type === "text") {
          // Safe to cast here since we've verified it's a text block
          const textBlock = block as unknown as AnthropicTextBlock;
          message += textBlock.text + "\n";

          logger({
            category: "agent",
            message: `Found text block: ${textBlock.text}`,
            level: 2,
          });
        } else {
          logger({
            category: "agent",
            message: `Found unknown block type: ${block.type}`,
            level: 2,
          });
        }
      }

      // Execute actions if an action handler is provided
      if (this.actionHandler && stepActions.length > 0) {
        for (const action of stepActions) {
          try {
            logger({
              category: "agent",
              message: `Executing action: ${action.type}`,
              level: 1,
            });
            await this.actionHandler(action);
          } catch (error) {
            // A closed Stagehand instance aborts the step; other failures are
            // logged and the remaining actions still run
            if (error instanceof StagehandClosedError) {
              throw error;
            }
            const errorMessage =
              error instanceof Error ? error.message : String(error);
            logger({
              category: "agent",
              message: `Error executing action ${action.type}: ${errorMessage}`,
              level: 0,
            });
          }
        }
      }

      // Create the assistant response message with all content blocks
      const assistantMessage: AnthropicMessage = {
        role: "assistant",
        content: content as unknown as AnthropicContentBlock[],
      };

      // Keep track of the conversation history by preserving all previous messages
      // and adding new messages at the end. This is a shallow copy: the message
      // objects themselves are shared with inputItems.
      const nextInputItems: ResponseInputItem[] = [...inputItems];

      // Runs on the prior history only, before this turn's messages are appended
      // (presumably shrinks older screenshots — see utils/imageCompression)
      compressConversationImages(nextInputItems);

      // Add the assistant message with tool_use blocks to the history
      nextInputItems.push(assistantMessage);

      // Generate tool results and add them as a user message
      if (toolUseItems.length > 0) {
        const toolResults = await this.takeAction(toolUseItems, logger);

        if (toolResults.length > 0) {
          // Tool results are AnthropicToolResult[] which are compatible with AnthropicContentBlock[]
          const userToolResultsMessage: AnthropicMessage = {
            role: "user",
            content: toolResults as unknown as AnthropicContentBlock[],
          };
          nextInputItems.push(userToolResultsMessage);
        }
      }

      // The step is completed only if there were no tool_use items
      const completed = toolUseItems.length === 0;

      logger({
        category: "agent",
        message: `Step processed ${toolUseItems.length} tool use items, completed: ${completed}`,
        level: 2,
      });

      return {
        actions: stepActions,
        message: message.trim(),
        completed,
        nextInputItems,
        usage: usage,
      };
    } catch (error) {
      const errorMessage =
        error instanceof Error ? error.message : String(error);
      logger({
        category: "agent",
        message: `Error executing step: ${errorMessage}`,
        level: 0,
      });

      throw error;
    }
  }

  /**
   * Build the opening conversation: a system entry carrying the user-provided
   * instructions followed by the user's instruction.
   *
   * The system entry is filtered out again in `getAction`, which sends the
   * instructions through the top-level `system` parameter instead.
   */
  private createInitialInputItems(instruction: string): AnthropicMessage[] {
    const systemEntry: AnthropicMessage = {
      role: "system",
      content: this.userProvidedInstructions,
    };
    const userEntry: AnthropicMessage = {
      role: "user",
      content: instruction,
    };

    return [systemEntry, userEntry];
  }

  /**
   * Send the conversation to the Anthropic beta Messages API and return the
   * model's reply.
   *
   * System entries in `inputItems` are dropped (the instructions travel in the
   * top-level `system` parameter), the computer tool version and beta flag are
   * chosen from the model name, and custom tools are appended as JSON-schema
   * tool definitions. The request and response are also reported to
   * `FlowLogger`, and the response id is stored in `lastMessageId`.
   *
   * @param inputItems - Conversation so far.
   * @returns The response content blocks, the response id, and usage
   *   (`input_tokens`, `output_tokens`, `inference_time_ms` measured locally
   *   around the API call).
   * @throws Rethrows any failure after writing it to `console.error`.
   */
  async getAction(inputItems: ResponseInputItem[]): Promise<{
    content: AnthropicContentBlock[];
    id: string;
    usage: Record<string, number>;
  }> {
    try {
      // For the API request, we use the inputItems directly
      // These should already be properly formatted as a sequence of user/assistant messages
      const messages: AnthropicMessage[] = [];

      for (const item of inputItems) {
        if ("role" in item) {
          // Skip system messages as Anthropic requires system as a top-level parameter
          if (item.role !== "system") {
            messages.push(item);
          }
        }
        // Note: We don't need special handling for tool_result items here anymore
        // as they should already be properly wrapped in user messages
      }

      // Configure thinking capability if available
      const thinking = this.thinkingBudget
        ? { type: "enabled" as const, budget_tokens: this.thinkingBudget }
        : undefined;

      // The API requires budget_tokens to be strictly below max_tokens, so a
      // fixed 4096 ceiling would reject any thinking budget of 4096 or more.
      // Reserve the usual response allowance on top of the thinking budget.
      const responseTokenAllowance = 4096;
      const maxTokens = thinking
        ? thinking.budget_tokens + responseTokenAllowance
        : responseTokenAllowance;

      // Claude 4.6+ models require the newer computer_20251124 tool version
      const modelBase = this.modelName.includes("/")
        ? this.modelName.split("/")[1]
        : this.modelName;
      const shouldUseNewToolVersion = [
        "claude-opus-4-6",
        "claude-sonnet-4-6",
        "claude-opus-4-5-20251101",
      ].includes(modelBase);

      const computerToolType = shouldUseNewToolVersion
        ? "computer_20251124"
        : "computer_20250124";
      const betaFlag = shouldUseNewToolVersion
        ? "computer-use-2025-11-24"
        : "computer-use-2025-01-24";

      // Create the request parameters
      const requestParams: Record<string, unknown> = {
        model: this.modelName,
        max_tokens: maxTokens,
        messages: messages,
        tools: [
          {
            type: computerToolType,
            name: "computer",
            display_width_px: this.currentViewport.width,
            display_height_px: this.currentViewport.height,
            display_number: 1,
          },
        ],
        betas: [betaFlag],
      };

      // Add custom tools if available
      if (this.tools && Object.keys(this.tools).length > 0) {
        const customTools = Object.entries(this.tools).map(([name, tool]) => {
          const schema = tool.inputSchema as StagehandZodSchema;

          // Convert Zod schema to proper JSON schema format for Anthropic
          const jsonSchema = toJsonSchema(schema) as {
            properties?: Record<string, unknown>;
            required?: string[];
          };

          // Only properties/required are carried over; the type is always "object"
          const inputSchema = {
            type: "object",
            properties: jsonSchema.properties || {},
            required: jsonSchema.required || [],
          };

          return {
            name,
            description: tool.description,
            input_schema: inputSchema,
          };
        });

        requestParams.tools = [
          ...(requestParams.tools as Record<string, unknown>[]),
          ...customTools,
        ];
      }

      // Add system parameter if provided
      if (this.userProvidedInstructions) {
        requestParams.system = this.userProvidedInstructions;
      }

      // Add thinking parameter if available
      if (thinking) {
        requestParams.thinking = thinking;
      }

      // Log LLM request
      const llmRequestId = uuidv7();
      FlowLogger.logLlmRequest({
        requestId: llmRequestId,
        model: this.modelName,
        prompt: extractLlmCuaPromptSummary(messages),
      });

      const startTime = Date.now();
      // Create the message using the Anthropic Messages API
      // @ts-expect-error - The Anthropic SDK types are stricter than what we need
      const response = await this.client.beta.messages.create(requestParams);
      const endTime = Date.now();
      const elapsedMs = endTime - startTime;
      const usage = {
        input_tokens: response.usage.input_tokens,
        output_tokens: response.usage.output_tokens,
        inference_time_ms: elapsedMs,
      };

      // Log LLM response
      FlowLogger.logLlmResponse({
        requestId: llmRequestId,
        model: this.modelName,
        output: extractLlmCuaResponseSummary(response.content),
        inputTokens: response.usage.input_tokens,
        outputTokens: response.usage.output_tokens,
      });

      // Store the message ID for future use
      this.lastMessageId = response.id;

      // Return the content and message ID
      return {
        // Cast the response content to our internal type
        content: response.content as unknown as AnthropicContentBlock[],
        id: response.id,
        usage,
      };
    } catch (error) {
      console.error("Error getting action from Anthropic:", error);
      throw error;
    }
  }

  /**
   * Produce one `tool_result` block per `tool_use` item from the last response.
   *
   * - `computer` items are answered with a fresh screenshot, plus the current
   *   URL as text when one is known.
   * - Items naming a registered custom tool run that tool; the JSON-serialized
   *   return value (or an error description) becomes the result text.
   * - Any other item is answered with the default success text.
   *
   * A failure while handling an item never aborts the batch: the item gets an
   * error result instead (with a screenshot for `computer` items when one can
   * still be captured).
   *
   * @param toolUseItems - Tool calls to answer, in response order.
   * @param logger - Sink for progress and error log lines.
   * @returns Tool results in the same order as `toolUseItems`.
   */
  async takeAction(
    toolUseItems: ToolUseItem[],
    logger: (message: LogLine) => void,
  ): Promise<AnthropicToolResult[]> {
    const toolResults: AnthropicToolResult[] = [];

    logger({
      category: "agent",
      message: `Taking action on ${toolUseItems.length} tool use items`,
      level: 2,
    });

    // Process each tool use item
    for (const item of toolUseItems) {
      try {
        logger({
          category: "agent",
          message: `Processing tool use: ${item.name}, id: ${item.id}, action: ${JSON.stringify(item.input)}`,
          level: 2,
        });

        // TODO: Normalize and migrate to agentHandler

        // For computer tool, capture screenshot and return image
        if (item.name === "computer") {
          // Get action type
          const action = item.input.action as string;
          logger({
            category: "agent",
            message: `Computer action type: ${action}`,
            level: 2,
          });

          // Capture a screenshot for the response
          const screenshot = await this.captureScreenshot();
          logger({
            category: "agent",
            message: `Screenshot captured, length: ${screenshot.length}`,
            level: 2,
          });

          // Create proper image content block for Anthropic
          // (the API expects the bare base64 payload, so drop the data-URL prefix)
          const imageContent = [
            {
              type: "image",
              source: {
                type: "base64",
                media_type: "image/png",
                data: screenshot.replace(/^data:image\/png;base64,/, ""),
              },
            },
          ];

          // Add current URL if available
          if (this.currentUrl) {
            toolResults.push({
              type: "tool_result",
              tool_use_id: item.id,
              content: [
                ...imageContent,
                {
                  type: "text",
                  text: `Current URL: ${this.currentUrl}`,
                },
              ],
            });
          } else {
            toolResults.push({
              type: "tool_result",
              tool_use_id: item.id,
              content: imageContent,
            });
          }

          logger({
            category: "agent",
            message: `Added computer tool result for tool_use_id: ${item.id}`,
            level: 2,
          });
        } else {
          // Handle custom tools
          let toolResult = "Tool executed successfully";
          if (this.tools && item.name in this.tools) {
            try {
              const tool = this.tools[item.name];

              logger({
                category: "agent",
                message: `Executing tool call: ${item.name} with args: ${JSON.stringify(item.input)}`,
                level: 1,
              });

              const result = await tool.execute(item.input, {
                toolCallId: item.id,
                messages: [],
              });

              // JSON.stringify yields undefined (not a string) for undefined or
              // function results; keep the default text in that case so the
              // tool_result always carries a valid text block.
              const serialized: string | undefined = JSON.stringify(result);
              if (serialized !== undefined) {
                toolResult = serialized;
              }

              logger({
                category: "agent",
                message: `Tool ${item.name} completed successfully. Result: ${toolResult}`,
                level: 1,
              });
            } catch (toolError) {
              const errorMessage =
                toolError instanceof Error
                  ? toolError.message
                  : String(toolError);
              toolResult = `Error executing tool: ${errorMessage}`;

              logger({
                category: "agent",
                message: `Error executing tool ${item.name}: ${errorMessage}`,
                level: 0,
              });
            }
          }

          toolResults.push({
            type: "tool_result",
            tool_use_id: item.id,
            content: [
              {
                type: "text",
                text: toolResult,
              },
            ],
          });

          logger({
            category: "agent",
            message: `Added custom tool result for tool ${item.name}, tool_use_id: ${item.id}`,
            level: 2,
          });
        }
      } catch (error) {
        const errorMessage =
          error instanceof Error ? error.message : String(error);

        logger({
          category: "agent",
          message: `Error executing tool use: ${errorMessage}`,
          level: 0,
        });

        try {
          // For computer tool, try to capture a screenshot even on error
          if (item.name === "computer") {
            const screenshot = await this.captureScreenshot();

            toolResults.push({
              type: "tool_result",
              tool_use_id: item.id,
              content: [
                {
                  type: "image",
                  source: {
                    type: "base64",
                    media_type: "image/png",
                    data: screenshot.replace(/^data:image\/png;base64,/, ""),
                  },
                },
                {
                  type: "text",
                  text: `Error: ${errorMessage}`,
                },
              ],
            });

            logger({
              category: "agent",
              message: `Added error tool result with screenshot for tool_use_id: ${item.id}`,
              level: 1,
            });
          } else {
            // For other tools, return an error message as a text content block
            toolResults.push({
              type: "tool_result",
              tool_use_id: item.id,
              content: [
                {
                  type: "text",
                  text: `Error: ${errorMessage}`,
                },
              ],
            });

            logger({
              category: "agent",
              message: `Added error tool result for tool_use_id: ${item.id}`,
              level: 1,
            });
          }
        } catch (screenshotError) {
          // If we can't capture a screenshot, just send the error
          logger({
            category: "agent",
            message: `Error capturing screenshot: ${String(screenshotError)}`,
            level: 0,
          });

          toolResults.push({
            type: "tool_result",
            tool_use_id: item.id,
            content: [
              {
                type: "text",
                text: `Error: ${errorMessage}`,
              },
            ],
          });

          logger({
            category: "agent",
            message: `Added text error tool result for tool_use_id: ${item.id}`,
            level: 1,
          });
        }
      }
    }

    logger({
      category: "agent",
      message: `Prepared ${toolResults.length} tool results for next request`,
      level: 2,
    });

    return toolResults;
  }

  /**
   * Translate a `tool_use` block into an agent action.
   *
   * `computer` calls are mapped by their `action` field; the raw input is
   * always spread last, so any input key that collides with a computed field
   * overrides it. `str_replace_editor` and `bash` calls are forwarded with
   * their input as `params`.
   *
   * @returns The action, or `null` for custom tools, unknown tools, a missing
   *   `action`, or when the conversion itself throws (the error is written to
   *   `console.error`).
   */
  private convertToolUseToAction(item: ToolUseItem): AgentAction | null {
    try {
      const { name, input } = item;

      // Editor and bash tools pass through untouched
      if (name === "str_replace_editor" || name === "bash") {
        return {
          type: name,
          params: input,
        };
      }

      if (name !== "computer") {
        // Registered custom tools are not actions; everything else is unknown
        if (this.tools && name in this.tools) {
          return null;
        }
        console.warn(`Unknown tool name: ${name}`);
        return null;
      }

      const action = input.action as string;
      if (!action) {
        console.warn("Missing action in tool use item:", item);
        return null;
      }

      // Anthropic's [x, y] pair, when present
      const pair = input.coordinate as number[] | undefined;

      // Explicit x/y take priority, then the coordinate pair, then 0
      const explicitFirst = (axis: 0 | 1): number => {
        const explicit = (axis === 0 ? input.x : input.y) as number;
        return explicit || (pair ? pair[axis] : 0);
      };

      // The coordinate pair takes priority, then explicit x/y, then 0
      const coordinateFirst = (axis: 0 | 1): number => {
        if (pair) {
          return pair[axis];
        }
        return ((axis === 0 ? input.x : input.y) as number) || 0;
      };

      switch (action) {
        case "screenshot":
          return { type: "screenshot", ...input };

        case "click":
          return {
            type: "click",
            x: input.x as number,
            y: input.y as number,
            button: (input.button as string) || "left",
            ...input,
          };

        case "type":
          return { type: "type", text: input.text as string, ...input };

        case "keypress":
        case "key":
          return { type: "keypress", keys: [input.text as string], ...input };

        case "double_click":
        case "doubleClick":
          return {
            type: "doubleClick",
            x: explicitFirst(0),
            y: explicitFirst(1),
            ...input,
          };

        case "scroll": {
          // Convert Anthropic's coordinate, scroll_amount and scroll_direction
          // into scroll_x and scroll_y
          const x = explicitFirst(0);
          const y = explicitFirst(1);

          // 100 pixels per unit of scroll_amount; a missing amount counts as 5
          const distance = ((input.scroll_amount as number) || 5) * 100;

          let scroll_x = 0;
          let scroll_y = 0;

          if (input.scroll_direction) {
            switch (input.scroll_direction as string) {
              case "down":
                scroll_y = distance;
                break;
              case "up":
                scroll_y = -distance;
                break;
              case "right":
                scroll_x = distance;
                break;
              case "left":
                scroll_x = -distance;
                break;
            }
          } else {
            // Use direct scroll_x and scroll_y if provided
            scroll_x = (input.scroll_x as number) || 0;
            scroll_y = (input.scroll_y as number) || 0;
          }

          return { type: "scroll", x, y, scroll_x, scroll_y, ...input };
        }

        case "move":
          return {
            type: "move",
            x: coordinateFirst(0),
            y: coordinateFirst(1),
            ...input,
          };

        case "drag":
        case "left_click_drag": {
          // Prefer an explicit path; otherwise build one from the start and
          // end coordinates, or fall back to an empty path
          let path = input.path as { x: number; y: number }[];
          if (!path) {
            if (pair) {
              const start = input.start_coordinate as number[];
              path = [
                { x: start[0], y: start[1] },
                { x: pair[0], y: pair[1] },
              ];
            } else {
              path = [];
            }
          }

          return { type: "drag", path, ...input };
        }

        case "wait":
          return { type: "wait", ...input };

        case "left_click":
          // Convert left_click to regular click
          return {
            type: "click",
            x: coordinateFirst(0),
            y: coordinateFirst(1),
            button: "left",
            ...input,
          };

        default:
          // For other computer actions, use the action type directly
          return { type: action, ...input };
      }
    } catch (error) {
      console.error("Error converting tool use to action:", error);
      return null;
    }
  }

  /**
   * Resolve a PNG data URL for the current screen.
   *
   * A supplied `options.base64Image` is used as-is; otherwise the registered
   * screenshot provider is called. `options.currentUrl` is accepted but not
   * read here.
   *
   * @returns `data:image/png;base64,` followed by the base64 image.
   * @throws AgentScreenshotProviderError when no image was supplied and no
   *   provider is registered; provider failures are written to
   *   `console.error` and rethrown.
   */
  async captureScreenshot(options?: {
    base64Image?: string;
    currentUrl?: string;
  }): Promise<string> {
    const asDataUrl = (base64: string): string =>
      `data:image/png;base64,${base64}`;

    // A caller-supplied image short-circuits the provider
    if (options?.base64Image) {
      return asDataUrl(options.base64Image);
    }

    if (!this.screenshotProvider) {
      throw new AgentScreenshotProviderError(
        "`screenshotProvider` has not been set. " +
          "Please call `setScreenshotProvider()` with a valid function that returns a base64-encoded image",
      );
    }

    try {
      const base64Image = await this.screenshotProvider();
      return asDataUrl(base64Image);
    } catch (error) {
      console.error("Error capturing screenshot:", error);
      throw error;
    }
  }
}


================================================
FILE: packages/core/lib/v3/agent/GoogleCUAClient.ts
================================================
import {
  GoogleGenAI,
  Content,
  Part,
  GenerateContentResponse,
  FunctionCall,
  GenerateContentConfig,
  Tool,
  GoogleGenAIOptions,
} from "@google/genai";
import { LogLine } from "../types/public/logs.js";
import {
  AgentAction,
  AgentResult,
  AgentType,
  AgentExecutionOptions,
  SafetyCheck,
  SafetyConfirmationHandler,
} from "../types/public/agent.js";
import { ClientOptions } from "../types/public/model.js";
import { AgentClient } from "./AgentClient.js";
import {
  AgentScreenshotProviderError,
  LLMResponseError,
  StagehandClosedError,
} from "../types/public/sdkErrors.js";
import { buildGoogleCUASystemPrompt } from "../../prompt.js";
import { compressGoogleConversationImages } from "./utils/imageCompression.js";
import { mapKeyToPlaywright } from "./utils/cuaKeyMapping.js";
import {
  executeGoogleCustomTool,
  isCustomTool,
  convertToolSetToFunctionDeclarations,
} from "./utils/googleCustomToolHandler.js";
import { ToolSet } from "ai";
import {
  FlowLogger,
  extractLlmCuaPromptSummary,
  extractLlmCuaResponseSummary,
} from "../flowlogger/FlowLogger.js";
import { v7 as uuidv7 } from "uuid";

/**
 * Client for Google's Computer Use Assistant API
 * This implementation uses the Google Generative AI SDK for Computer Use
 *
 * The client keeps a running `Content[]` history, asks the model for the next
 * function calls, converts them to Stagehand `AgentAction`s, dispatches them
 * through the registered action handler, and feeds a screenshot back to the
 * model as the function response.
 */
export class GoogleCUAClient extends AgentClient {
  private apiKey: string;
  private client: GoogleGenAI;
  private currentViewport = { width: 1288, height: 711 };
  private currentUrl?: string;
  private screenshotProvider?: () => Promise<string>;
  private actionHandler?: (action: AgentAction) => Promise<void>;
  private history: Content[] = [];
  private environment: "ENVIRONMENT_BROWSER" | "ENVIRONMENT_DESKTOP" =
    "ENVIRONMENT_BROWSER";
  private generateContentConfig: GenerateContentConfig;
  private tools?: ToolSet;
  private baseURL?: string;
  private safetyConfirmationHandler?: SafetyConfirmationHandler;

  /**
   * @param type Agent type forwarded to the base `AgentClient`.
   * @param modelName Model identifier passed to `generateContent`.
   * @param userProvidedInstructions Optional system prompt override.
   * @param clientOptions Optional `apiKey`, `baseURL` and `environment`.
   *   The API key falls back to `GEMINI_API_KEY`,
   *   `GOOGLE_GENERATIVE_AI_API_KEY`, then `GOOGLE_API_KEY`.
   * @param tools Optional custom tools exposed as function declarations.
   */
  constructor(
    type: AgentType,
    modelName: string,
    userProvidedInstructions?: string,
    clientOptions?: ClientOptions,
    tools?: ToolSet,
  ) {
    super(type, modelName, userProvidedInstructions);

    this.tools = tools;
    // Process client options
    this.apiKey =
      (clientOptions?.apiKey as string) ||
      process.env.GEMINI_API_KEY ||
      process.env.GOOGLE_GENERATIVE_AI_API_KEY ||
      process.env.GOOGLE_API_KEY ||
      "";
    this.baseURL = clientOptions?.baseURL as string | undefined;

    // Initialize the Google Generative AI client
    const genAIOptions: GoogleGenAIOptions = {
      apiKey: this.apiKey,
      ...(this.baseURL ? { httpOptions: { baseUrl: this.baseURL } } : {}),
    };
    this.client = new GoogleGenAI(genAIOptions);

    // Get environment if specified
    if (
      clientOptions?.environment &&
      typeof clientOptions.environment === "string"
    ) {
      this.environment = clientOptions.environment as typeof this.environment;
    }

    this.generateContentConfig = {
      temperature: 1,
      topP: 0.95,
      topK: 40,
      maxOutputTokens: 8192,
      // systemInstruction: this.userProvidedInstructions
      //   ? { parts: [{ text: this.userProvidedInstructions }] }
      //   : { parts: [{ text: buildGoogleCUASystemPrompt() }] },
      tools: [
        {
          computerUse: {
            environment: this.environment,
          },
        } as Tool,
      ],
    };

    // Store client options for reference
    this.clientOptions = {
      apiKey: this.apiKey,
      ...(this.baseURL ? { baseURL: this.baseURL } : {}),
    };

    // Initialize tools if provided
    if (this.tools && Object.keys(this.tools).length > 0) {
      this.updateGenerateContentConfig();
    }
  }

  /** Record the viewport size used to scale model coordinates. */
  public setViewport(width: number, height: number): void {
    this.currentViewport = { width, height };
  }

  /** Record the URL reported back to the model in function responses. */
  setCurrentUrl(url: string): void {
    this.currentUrl = url;
  }

  /** Register the callback that returns a base64-encoded screenshot. */
  setScreenshotProvider(provider: () => Promise<string>): void {
    this.screenshotProvider = provider;
  }

  /** Register the callback that performs a converted action. */
  setActionHandler(handler: (action: AgentAction) => Promise<void>): void {
    this.actionHandler = handler;
  }

  /** Replace the custom tool set and rebuild the tool declarations. */
  setTools(tools: ToolSet): void {
    this.tools = tools;
    this.updateGenerateContentConfig();
  }

  /** Register (or clear) the handler consulted for safety decisions. */
  setSafetyConfirmationHandler(handler?: SafetyConfirmationHandler): void {
    this.safetyConfirmationHandler = handler;
  }

  /**
   * Resolve a `safety_decision` attached to a function call.
   *
   * With a registered handler, the decision is wrapped in a single
   * `SafetyCheck` and forwarded; without one it is auto-acknowledged.
   *
   * @returns `"true"` when acknowledged, `undefined` when the handler
   *   rejected the decision.
   */
  private async handleSafetyConfirmation(
    safetyDecision: unknown,
    logger: (message: LogLine) => void,
  ): Promise<string | undefined> {
    const safetyMessage =
      typeof safetyDecision === "object"
        ? JSON.stringify(safetyDecision, null, 2)
        : String(safetyDecision);

    const safetyChecks: SafetyCheck[] = [
      {
        id: "google-safety-decision",
        code: "safety_decision",
        message: safetyMessage,
      },
    ];

    if (this.safetyConfirmationHandler) {
      logger({
        category: "agent",
        message: `Requesting safety confirmation for Google safety decision: ${safetyMessage}`,
        level: 1,
      });

      const response = await this.safetyConfirmationHandler(safetyChecks);

      if (response.acknowledged) {
        logger({
          category: "agent",
          message: `Safety decision acknowledged by user`,
          level: 1,
        });
        return "true";
      } else {
        logger({
          category: "agent",
          message: `Safety decision rejected by user`,
          level: 1,
        });
        return undefined;
      }
    }

    logger({
      category: "agent",
      message: `Auto-acknowledging Google safety decision`,
      level: 2,
    });
    return "true";
  }

  /**
   * Update the generateContentConfig with current tools
   *
   * The `computerUse` tool is always present; custom tools are appended as
   * `functionDeclarations` on the same tool entry when any are registered.
   */
  private updateGenerateContentConfig(): void {
    const functionDeclarations =
      this.tools && Object.keys(this.tools).length > 0
        ? convertToolSetToFunctionDeclarations(this.tools)
        : [];

    this.generateContentConfig = {
      ...this.generateContentConfig,
      tools: [
        {
          computerUse: {
            environment: this.environment,
          },
          ...(functionDeclarations.length > 0 ? { functionDeclarations } : {}),
        } as Tool,
      ],
    };
  }

  /**
   * Execute a task with the Google CUA
   * This is the main entry point for the agent
   *
   * Runs `executeStep` until a step reports completion or `maxSteps`
   * (default 10) is reached, accumulating actions and token usage. Errors
   * thrown by a step are caught and reported as an unsuccessful result.
   *
   * @implements AgentClient.execute
   */
  async execute(executionOptions: AgentExecutionOptions): Promise<AgentResult> {
    const { options, logger } = executionOptions;
    const { instruction } = options;
    const maxSteps = options.maxSteps || 10;

    let currentStep = 0;
    let completed = false;
    const actions: AgentAction[] = [];
    const messageList: string[] = [];
    let finalMessage = "";
    this.history = []; // Clear history for new execution

    // Start with the initial instruction
    await this.initializeHistory(instruction);

    let totalInputTokens = 0;
    let totalOutputTokens = 0;
    let totalInferenceTime = 0;

    try {
      // Execute steps until completion or max steps reached
      while (!completed && currentStep < maxSteps) {
        await this.preStepHook?.();

        logger({
          category: "agent",
          message: `Executing step ${currentStep + 1}/${maxSteps}`,
          level: 1,
        });

        const result = await this.executeStep(logger);
        totalInputTokens += result.usage.input_tokens;
        totalOutputTokens += result.usage.output_tokens;
        totalInferenceTime += result.usage.inference_time_ms;

        // Add actions to the list
        actions.push(...result.actions);

        // Update completion status
        completed = result.completed;

        // Record any message for this step
        if (result.message) {
          messageList.push(result.message);
          finalMessage = result.message;
        }

        // Increment step counter
        currentStep++;
      }

      // Return the final result
      return {
        success: completed,
        actions,
        message: finalMessage,
        completed,
        usage: {
          input_tokens: totalInputTokens,
          output_tokens: totalOutputTokens,
          inference_time_ms: totalInferenceTime,
        },
      };
    } catch (error) {
      const errorMessage =
        error instanceof Error ? error.message : String(error);
      logger({
        category: "agent",
        message: `Error executing agent task: ${errorMessage}`,
        level: 0,
      });

      return {
        success: false,
        actions,
        message: `Failed to execute task: ${errorMessage}`,
        completed: false,
        usage: {
          input_tokens: totalInputTokens,
          output_tokens: totalOutputTokens,
          inference_time_ms: totalInferenceTime,
        },
      };
    }
  }

  /**
   * Initialize conversation history with the initial instruction
   *
   * The system prompt is sent as a leading user message (prefixed with
   * "System prompt: ") rather than through `systemInstruction`.
   */
  private async initializeHistory(instruction: string): Promise<void> {
    const parts: Part[] = [{ text: instruction }];

    // Note: The Python implementation doesn't include the initial screenshot
    // Following the same pattern here

    const systemPromptContent = this.userProvidedInstructions
      ? this.userProvidedInstructions
      : buildGoogleCUASystemPrompt().content;

    this.history = [
      {
        role: "user",
        parts: [
          {
            text: "System prompt: " + systemPromptContent,
          },
        ],
      },
      {
        role: "user",
        parts,
      },
    ];
  }

  /**
   * Execute a single step of the agent
   *
   * One step = one `generateContent` call (with retries), conversion of the
   * returned function calls to actions, dispatch of those actions, and
   * appending of the function responses to the history.
   *
   * NOTE(review): safety confirmation for a `safety_decision` is requested
   * while building the function responses, i.e. after the corresponding
   * actions have already been dispatched. Rejecting the decision therefore
   * only omits the acknowledgement; it does not prevent the action.
   *
   * @throws Rethrows any error raised while generating content or executing
   *   the step (after logging it).
   */
  async executeStep(logger: (message: LogLine) => void): Promise<{
    actions: AgentAction[];
    message: string;
    completed: boolean;
    usage: {
      input_tokens: number;
      output_tokens: number;
      inference_time_ms: number;
    };
  }> {
    try {
      const startTime = Date.now();

      // Compress images in conversation history before sending to the model
      const compressedResult = compressGoogleConversationImages(
        this.history,
        2,
      );
      const compressedHistory = compressedResult.items;

      // Use the SDK's generateContent method with retry logic (matching Python's get_model_response)
      const maxRetries = 5;
      const baseDelayS = 1;
      let lastError: Error | null = null;
      let response: GenerateContentResponse | null = null;

      // Log LLM request
      const llmRequestId = uuidv7();
      FlowLogger.logLlmRequest({
        requestId: llmRequestId,
        model: this.modelName,
        prompt: extractLlmCuaPromptSummary(compressedHistory),
      });

      for (let attempt = 0; attempt < maxRetries; attempt++) {
        try {
          // Add exponential backoff delay for retries
          if (attempt > 0) {
            // `attempt` is the 0-based index of the upcoming try, so the try
            // that just failed is number `attempt` (1-based) and the backoff
            // exponent is `attempt - 1`: 1s, 2s, 4s, 8s.
            const delay = baseDelayS * Math.pow(2, attempt - 1) * 1000; // Convert to ms
            logger({
              category: "agent",
              message: `Generating content failed on attempt ${attempt}. Retrying in ${delay / 1000} seconds...`,
              level: 2,
            });
            await new Promise((resolve) => setTimeout(resolve, delay));
          }

          // Use the SDK's generateContent method - following Python SDK pattern
          response = await this.client.models.generateContent({
            model: this.modelName,
            contents: compressedHistory,
            config: this.generateContentConfig,
          });

          // Check if we have valid response content
          if (!response.candidates || response.candidates.length === 0) {
            throw new LLMResponseError("agent", "Response has no candidates!");
          }

          const candidate = response.candidates[0];
          if (!candidate.content || !candidate.content.parts) {
            const reason = candidate.finishReason || "unknown";
            throw new LLMResponseError(
              "agent",
              `Response has no content (finish reason: ${reason})`,
            );
          }

          // Success - we have a valid response
          break;
        } catch (error) {
          lastError = error instanceof Error ? error : new Error(String(error));
          logger({
            category: "agent",
            message: `API call error: ${lastError.message}`,
            level: 2,
          });

          // If this was the last attempt, throw the error
          if (attempt === maxRetries - 1) {
            logger({
              category: "agent",
              message: `Generating content failed after ${maxRetries} attempts.`,
              level: 0,
            });
            throw lastError;
          }
        }
      }

      if (!response) {
        throw (
          lastError || new Error("Failed to get response after all retries")
        );
      }

      const endTime = Date.now();
      const elapsedMs = endTime - startTime;
      const { usageMetadata } = response;

      // Log LLM response
      FlowLogger.logLlmResponse({
        requestId: llmRequestId,
        model: this.modelName,
        output: extractLlmCuaResponseSummary(response),
        inputTokens: usageMetadata?.promptTokenCount,
        outputTokens: usageMetadata?.candidatesTokenCount,
      });

      // Process the response
      const result = await this.processResponse(response, logger);

      // Add model response to history
      if (response.candidates && response.candidates[0]) {
        // Sanitize any out-of-range coordinates in function calls before adding to history
        // (deep copy via JSON so the original response object is left untouched)
        const sanitizedContent = JSON.parse(
          JSON.stringify(response.candidates[0].content),
        );
        if (sanitizedContent.parts) {
          const coordinateKeys = ["x", "y", "destination_x", "destination_y"];
          for (const part of sanitizedContent.parts) {
            const recordedCall = part.functionCall;
            // Custom tool arguments are user-defined and must not be rewritten
            if (!recordedCall?.args || isCustomTool(recordedCall, this.tools)) {
              continue;
            }
            // Same 0-999 clamp that normalizeCoordinates applies
            for (const key of coordinateKeys) {
              const value = recordedCall.args[key];
              if (typeof value === "number") {
                recordedCall.args[key] = Math.min(999, Math.max(0, value));
              }
            }
          }
        }
        this.history.push(sanitizedContent);
      }

      // Execute actions and collect function responses
      const functionResponses: Part[] = [];

      if (result.actions.length > 0) {
        let hasError = false;
        // Custom-tool function calls already paired with an action; lets
        // repeated calls to the same tool in one turn each get their own
        // function call instead of all binding to the first one.
        const consumedCustomCalls = new Set<FunctionCall>();

        // Execute all actions
        for (let i = 0; i < result.actions.length; i++) {
          const action = result.actions[i];

          logger({
            category: "agent",
            message: `Executing action ${i + 1}/${result.actions.length}: ${action.type}`,
            level: 2,
          });

          // Special handling for open_web_browser - don't execute it
          if (action.type === "open_web_browser") {
            // Set pageUrl for open_web_browser since it doesn't go through action handler
            action.pageUrl = this.currentUrl;
            logger({
              category: "agent",
              message: "Skipping open_web_browser action",
              level: 2,
            });
          } else if (action.type === "custom_tool") {
            const toolName = action.name as string;
            const toolArgs = action.arguments as Record<string, unknown>;

            if (this.tools && toolName in this.tools) {
              const correspondingFunctionCall = result.functionCalls.find(
                (fc) => fc.name === toolName && !consumedCustomCalls.has(fc),
              );

              if (correspondingFunctionCall) {
                consumedCustomCalls.add(correspondingFunctionCall);

                const executionResult = await executeGoogleCustomTool(
                  toolName,
                  toolArgs,
                  this.tools,
                  correspondingFunctionCall,
                  logger,
                );

                functionResponses.push(executionResult.functionResponse);

                if (!executionResult.success) {
                  hasError = true;
                }
              }
            }
          } else if (this.actionHandler) {
            try {
              await this.actionHandler(action);

              // Add a delay between actions to ensure they complete properly
              // Longer delay for typing actions to ensure fields are ready
              if (i < result.actions.length - 1) {
                const nextAction = result.actions[i + 1];
                const isTypingAction =
                  action.type === "type" || nextAction.type === "type";
                const delay = isTypingAction ? 500 : 200;
                await new Promise((resolve) => setTimeout(resolve, delay));
              }
            } catch (actionError) {
              if (actionError instanceof StagehandClosedError) {
                throw actionError;
              }
              logger({
                category: "agent",
                message: `Error executing action ${action.type}: ${actionError}`,
                level: 0,
              });
              hasError = true;
              // Continue processing other actions even if one fails
            }
          }
        }

        // Create function responses for computer use actions (non-custom tools)
        // We need exactly one response per function call, regardless of how many actions were generated
        if (result.functionCalls.length > 0 || hasError) {
          // Filter out custom tool function calls as they've already been handled
          const computerUseFunctionCalls = result.functionCalls.filter(
            (fc) => !isCustomTool(fc, this.tools),
          );

          if (computerUseFunctionCalls.length > 0) {
            try {
              logger({
                category: "agent",
                message: `Taking screenshot after executing ${result.actions.length} actions${hasError ? " (with errors)" : ""}`,
                level: 2,
              });

              const screenshot = await this.captureScreenshot();
              const base64Data = screenshot.replace(
                /^data:image\/png;base64,/,
                "",
              );

              // Create one function response for each computer use function call
              // Following Python SDK pattern: FunctionResponse with parts containing inline_data
              for (const functionCall of computerUseFunctionCalls) {
                let safetyAcknowledgement: string | undefined;
                if (functionCall.args?.safety_decision) {
                  safetyAcknowledgement = await this.handleSafetyConfirmation(
                    functionCall.args.safety_decision,
                    logger,
                  );
                }

                const functionResponsePart: Part = {
                  functionResponse: {
                    name: functionCall.name,
                    response: {
                      url: this.currentUrl || "",
                      ...(safetyAcknowledgement !== undefined
                        ? {
                            safety_acknowledgement: safetyAcknowledgement,
                          }
                        : {}),
                    },
                    parts: [
                      {
                        inlineData: {
                          mimeType: "image/png",
                          data: base64Data,
                        },
                      },
                    ],
                  },
                };
                functionResponses.push(functionResponsePart);
              }
            } catch (error) {
              logger({
                category: "agent",
                message: `Error capturing screenshot: ${error}`,
                level: 0,
              });
            }
          }
        }

        // Add all function responses to history in a single user message
        if (functionResponses.length > 0) {
          logger({
            category: "agent",
            message: `Adding ${functionResponses.length} function responses to history`,
            level: 2,
          });
          this.history.push({
            role: "user",
            parts: functionResponses,
          });
        }
      }

      return {
        actions: result.actions,
        message: result.message,
        completed: result.completed,
        usage: {
          input_tokens: usageMetadata?.promptTokenCount || 0,
          output_tokens: usageMetadata?.candidatesTokenCount || 0,
          inference_time_ms: elapsedMs,
        },
      };
    } catch (error) {
      const errorMessage =
        error instanceof Error ? error.message : String(error);
      logger({
        category: "agent",
        message: `Error executing step: ${errorMessage}`,
        level: 0,
      });

      throw error;
    }
  }

  /**
   * Process the response from Google's API
   *
   * Collects text parts into `message`, collects every function call, and
   * converts each call into one or more actions. A `type_text_at` call
   * expands into click, optional select-all + backspace, type, and an
   * optional Enter keypress.
   *
   * @returns `completed` is true when the model issued no function calls or
   *   reported a finish reason other than "STOP".
   */
  private async processResponse(
    response: GenerateContentResponse,
    logger: (message: LogLine) => void,
  ): Promise<{
    actions: AgentAction[];
    message: string;
    completed: boolean;
    functionCalls: FunctionCall[];
  }> {
    const actions: AgentAction[] = [];
    let message = "";
    const functionCalls: FunctionCall[] = [];

    if (!response.candidates || response.candidates.length === 0) {
      return {
        actions: [],
        message: "No candidates in response",
        completed: true,
        functionCalls: [],
      };
    }
    const candidate = response.candidates[0];

    // Log the raw response for debugging
    logger({
      category: "agent",
      message: `Raw response from Google: ${JSON.stringify(candidate.content, null, 2)}`,
      level: 2,
    });

    // Process all parts - Google can send multiple function calls
    // (a candidate without content is treated as having no parts)
    const responseParts = candidate.content?.parts ?? [];
    for (const part of responseParts) {
      if (part.text) {
        message += part.text + "\n";
        logger({
          category: "agent",
          message: `Reasoning: ${part.text}`,
          level: 1,
        });
      }
      if (part.functionCall) {
        functionCalls.push(part.functionCall);
        logger({
          category: "agent",
          message: `Found function call: ${part.functionCall.name} with args: ${JSON.stringify(part.functionCall.args)}`,
          level: 2,
        });

        // Convert function call to action(s)
        const action = this.convertFunctionCallToAction(part.functionCall);
        if (action) {
          // Special handling for type_text_at - we need to click first
          if (
            part.functionCall.name === "type_text_at" &&
            action.type === "type"
          ) {
            logger({
              category: "agent",
              message: `Adding action: ${JSON.stringify(action)}`,
              level: 2,
            });
            // First add a click action at the same coordinates
            actions.push({
              type: "click",
              x: action.x,
              y: action.y,
              button: "left",
            });

            // If clear_before_typing is true (default), add a select all
            if (action.clearBeforeTyping) {
              // Select all text in the field
              actions.push({
                type: "keypress",
                keys: ["ControlOrMeta+A"],
              });
              actions.push({
                type: "keypress",
                keys: ["Backspace"],
              });
            }

            // Then add the type action
            actions.push(action);
            if (action.pressEnter) {
              actions.push({
                type: "keypress",
                keys: ["Enter"],
              });
            }
          } else {
            actions.push(action);
          }
        } else {
          logger({
            category: "agent",
            message: `Warning: Could not convert function call ${part.functionCall.name} to action`,
            level: 1,
          });
        }
      }
    }

    // Log summary of what we found
    logger({
      category: "agent",
      message: `Found ${functionCalls.length} function calls, converted to ${actions.length} actions`,
      level: 2,
    });

    // Check if task is completed
    // (Boolean() keeps the result a strict boolean when finishReason is unset)
    const completed =
      functionCalls.length === 0 ||
      Boolean(candidate.finishReason && candidate.finishReason !== "STOP");

    return {
      actions,
      message: message.trim(),
      completed,
      functionCalls,
    };
  }

  /**
   * Convert Google function call to Stagehand action
   *
   * @returns The converted action, or `null` when the call has no name, is
   *   not a known computer-use function or registered custom tool, or lacks
   *   arguments it requires (coordinates, keys).
   */
  private convertFunctionCallToAction(
    functionCall: FunctionCall,
  ): AgentAction | null {
    const { name } = functionCall;

    if (!name) {
      return null;
    }

    // Argument-less functions (open_web_browser, go_back, ...) may arrive
    // without an `args` object; treat that as an empty argument set.
    const args: Record<string, unknown> = functionCall.args ?? {};

    switch (name) {
      case "open_web_browser":
        return {
          type: "open_web_browser",
          timestamp: Date.now(),
        };

      case "click_at": {
        const point = this.readPoint(args);
        if (!point) {
          return null;
        }
        return {
          type: "click",
          x: point.x,
          y: point.y,
          button: args.button || "left",
        };
      }

      case "type_text_at": {
        const point = this.readPoint(args);
        if (!point) {
          return null;
        }
        // Google's type_text_at includes press_enter and clear_before_typing parameters
        const pressEnter = (args.press_enter as boolean) ?? false;
        const clearBeforeTyping = (args.clear_before_typing as boolean) ?? true;

        // For type_text_at, we need to click first then type
        // This matches the behavior expected by Google's CUA
        // processResponse expands this into the click/clear/type/enter sequence
        return {
          type: "type",
          text: args.text as string,
          x: point.x,
          y: point.y,
          pressEnter,
          clearBeforeTyping,
        };
      }

      case "key_combination": {
        const rawKeys = args.keys;
        let keyNames: string[];
        if (typeof rawKeys === "string") {
          keyNames = rawKeys.split("+");
        } else if (Array.isArray(rawKeys)) {
          keyNames = rawKeys.map((key) => String(key));
        } else {
          // No usable key list; report the call as unconvertible
          return null;
        }
        const keys = keyNames
          .map((key: string) => key.trim())
          .map((key: string) => mapKeyToPlaywright(key));
        return {
          type: "keypress",
          keys,
        };
      }

      case "scroll_document": {
        const rawDirection = args.direction;
        const direction =
          typeof rawDirection === "string"
            ? rawDirection.toLowerCase()
            : "down";

        // Page keys only cover vertical movement; scroll horizontally from
        // the viewport centre by half the viewport width instead.
        if (direction === "left" || direction === "right") {
          const distance = Math.floor(this.currentViewport.width / 2);
          return {
            type: "scroll",
            x: Math.floor(this.currentViewport.width / 2),
            y: Math.floor(this.currentViewport.height / 2),
            scroll_x: direction === "left" ? -distance : distance,
            scroll_y: 0,
          };
        }

        return {
          type: "keypress",
          keys: [direction === "up" ? "PageUp" : "PageDown"],
        };
      }

      case "scroll_at": {
        const point = this.readPoint(args);
        if (!point) {
          return null;
        }
        const direction = ((args.direction as string) || "down").toLowerCase();
        const magnitude =
          typeof args.magnitude === "number" ? (args.magnitude as number) : 800;

        let scroll_x = 0;
        let scroll_y = 0;
        if (direction === "up") {
          scroll_y = -magnitude;
        } else if (direction === "down") {
          scroll_y = magnitude;
        } else if (direction === "left") {
          scroll_x = -magnitude;
        } else if (direction === "right") {
          scroll_x = magnitude;
        } else {
          // Default to down if unknown direction
          scroll_y = magnitude;
        }

        return {
          type: "scroll",
          x: point.x,
          y: point.y,
          scroll_x,
          scroll_y,
        };
      }

      case "navigate":
        return {
          type: "goto",
          url: args.url as string,
        };

      case "go_back":
        return {
          type: "back",
        };

      case "go_forward":
        return {
          type: "forward",
        };

      case "wait_5_seconds":
        return {
          type: "wait",
          timeMs: 5000, // Google CUA waits for 5 seconds
        };

      case "hover_at": {
        const point = this.readPoint(args);
        if (!point) {
          return null;
        }
        return {
          type: "move",
          x: point.x,
          y: point.y,
        };
      }

      case "search":
        return {
          type: "goto",
          url: "https://www.google.com",
        };

      case "drag_and_drop": {
        const startPoint = this.readPoint(args);
        const endPoint = this.readPoint(args, "destination_x", "destination_y");
        if (!startPoint || !endPoint) {
          return null;
        }
        return {
          type: "drag",
          path: [
            { x: startPoint.x, y: startPoint.y },
            { x: endPoint.x, y: endPoint.y },
          ],
        };
      }

      default:
        if (isCustomTool(functionCall, this.tools)) {
          return {
            type: "custom_tool",
            name,
            arguments: args,
            timestamp: Date.now(),
            pageUrl: this.currentUrl,
          };
        }
        console.warn(`Unsupported Google CUA function: ${name}`);
        return null;
    }
  }

  /**
   * Read a coordinate pair from function-call arguments and scale it to the
   * viewport.
   *
   * @param args Function-call arguments.
   * @param xKey Argument name holding the horizontal coordinate.
   * @param yKey Argument name holding the vertical coordinate.
   * @returns Viewport coordinates, or `null` when either value is missing or
   *   not a finite number (so callers never forward `NaN` to the handler).
   */
  private readPoint(
    args: Record<string, unknown>,
    xKey = "x",
    yKey = "y",
  ): { x: number; y: number } | null {
    const rawX = args[xKey];
    const rawY = args[yKey];
    if (rawX == null || rawY == null) {
      return null;
    }

    const x = Number(rawX);
    const y = Number(rawY);
    if (!Number.isFinite(x) || !Number.isFinite(y)) {
      return null;
    }

    return this.normalizeCoordinates(x, y);
  }

  /**
   * Normalize coordinates from Google's 0-1000 range to viewport dimensions
   *
   * Inputs are clamped to 0-999 before scaling, and results are floored.
   */
  private normalizeCoordinates(x: number, y: number): { x: number; y: number } {
    const clampedX = Math.min(999, Math.max(0, x));
    const clampedY = Math.min(999, Math.max(0, y));
    return {
      x: Math.floor((clampedX / 1000) * this.currentViewport.width),
      y: Math.floor((clampedY / 1000) * this.currentViewport.height),
    };
  }

  /**
   * Produce a PNG data URL for the current screen.
   *
   * `options.currentUrl`, when supplied, is stored as the current URL.
   * `options.base64Image`, when supplied, is wrapped and returned directly;
   * otherwise the registered screenshot provider is invoked.
   *
   * @throws AgentScreenshotProviderError when no image was supplied and no
   *   provider has been registered; provider failures are logged and rethrown.
   */
  async captureScreenshot(options?: {
    base64Image?: string;
    currentUrl?: string;
  }): Promise<string> {
    // Update current URL if provided
    if (options?.currentUrl) {
      this.currentUrl = options.currentUrl;
    }

    // Use provided options if available
    if (options?.base64Image) {
      return `data:image/png;base64,${options.base64Image}`;
    }

    // Use the screenshot provider if available
    if (this.screenshotProvider) {
      try {
        const base64Image = await this.screenshotProvider();
        return `data:image/png;base64,${base64Image}`;
      } catch (error) {
        console.error("Error capturing screenshot:", error);
        throw error;
      }
    }

    throw new AgentScreenshotProviderError(
      "`screenshotProvider` has not been set. " +
        "Please call `setScreenshotProvider()` with a valid function that returns a base64-encoded image",
    );
  }
}


================================================
FILE: packages/core/lib/v3/agent/MicrosoftCUAClient.ts
================================================
import OpenAI from "openai";
import { LogLine } from "../types/public/logs.js";
import {
  AgentAction,
  AgentResult,
  AgentType,
  AgentExecutionOptions,
} from "../types/public/agent.js";
import { ClientOptions } from "../types/public/model.js";
import { AgentClient } from "./AgentClient.js";
import { AgentScreenshotProviderError } from "../types/public/sdkErrors.js";
import { mapKeyToPlaywright } from "./utils/cuaKeyMapping.js";
import { ChatCompletionMessageParam } from "openai/resources/chat/completions";

/**
 * Message types for FARA agent
 *
 * A single chat message exchanged with the model.
 */
interface FaraMessage {
  // Speaker of the message
  role: "system" | "user" | "assistant";
  // Either plain text or a list of typed content parts (text / image)
  content: string | FaraMessageContent[];
}

/**
 * One part of a multi-part FARA message, discriminated by `type`.
 * Both payload fields are optional at the type level; presumably `text` is
 * set for "text" parts and `image_url` for "image_url" parts — confirm
 * against the code that builds these messages.
 */
interface FaraMessageContent {
  type: "text" | "image_url";
  text?: string;
  image_url?: {
    url: string; // data:image/png;base64,...
  };
}

/**
 * FARA function call structure (parsed from XML tags)
 *
 * `arguments.action` names the action to perform; any further keys are
 * action-specific and typed as `unknown`, so they must be narrowed before use.
 */
interface FaraFunctionCall {
  name: string; // Always "computer_use"
  arguments: {
    // Name of the requested action
    action: string;
    // Optional free-form reasoning emitted alongside the action
    thoughts?: string;
    // Additional action-specific parameters
    [key: string]: unknown;
  };
}

/**
 * Client for FARA (Function-based Autonomous Research Agent) by Microsoft
 * This implementation uses OpenAI-compatible API with XML-based tool calling
 */
export class MicrosoftCUAClient extends AgentClient {
  private apiKey: string;
  private baseURL: string;
  private client: OpenAI;
  private currentViewport = { width: 1288, height: 711 };
  private currentUrl?: string;
  private screenshotProvider?: () => Promise<string>;
  private actionHandler?: (action: AgentAction) => Promise<void>;

  // Dual history system
  private conversationHistory: FaraMessage[] = []; // Conceptual flow
  private actionHistory: FaraMessage[] = []; // Raw model responses

  private maxImages: number = 3;
  private temperature: number = 0;
  private facts: string[] = [];

  // FARA-specific MLM processor config
  private readonly MLM_PROCESSOR_IM_CFG = {
    min_pixels: 3136,
    max_pixels: 12845056,
    patch_size: 14,
    merge_size: 2,
  };

  // Resized dimensions for model input
  private resizedViewport = { width: 1288, height: 711 };

  /**
   * Create a FARA client that talks to an OpenAI-compatible endpoint.
   *
   * The API key and base URL are each resolved in this order: the value in
   * `clientOptions`, then the `AZURE_*` environment variable, then the
   * `FIREWORKS_*` environment variable, then the empty string.
   *
   * @param type - Agent type forwarded to the `AgentClient` base constructor.
   * @param modelName - Model identifier; "fara-7b" is used when it is falsy.
   * @param userProvidedInstructions - Optional text forwarded to the base constructor.
   * @param clientOptions - Optional overrides: `apiKey`, `baseURL`, `maxImages`, `temperature`.
   * @throws Error when no API key could be resolved.
   */
  constructor(
    type: AgentType,
    modelName: string,
    userProvidedInstructions?: string,
    clientOptions?: ClientOptions,
  ) {
    super(type, modelName || "fara-7b", userProvidedInstructions);

    // Resolve credentials: explicit option first, environment second.
    const envApiKey =
      process.env.AZURE_API_KEY || process.env.FIREWORKS_API_KEY;
    const envBaseURL =
      process.env.AZURE_ENDPOINT || process.env.FIREWORKS_ENDPOINT;
    this.apiKey = (clientOptions?.apiKey as string) || envApiKey || "";
    this.baseURL = (clientOptions?.baseURL as string) || envBaseURL || "";

    // Keep the resolved options around for reference.
    this.clientOptions = { apiKey: this.apiKey, baseURL: this.baseURL };

    // An empty string is falsy, so this single check covers "missing" and "".
    if (!this.apiKey) {
      throw new Error(
        "API key is required. Please provide it via clientOptions.apiKey or AZURE_API_KEY or FIREWORKS_API_KEY environment variables.",
      );
    }

    // FARA is served behind an OpenAI-compatible API, so the OpenAI SDK is reused.
    this.client = new OpenAI({ apiKey: this.apiKey, baseURL: this.baseURL });

    // Optional tuning knobs; the field defaults stay in place when omitted.
    const imageLimit = clientOptions?.maxImages;
    if (imageLimit !== undefined) {
      this.maxImages = imageLimit as number;
    }

    const samplingTemperature = clientOptions?.temperature;
    if (samplingTemperature !== undefined) {
      this.temperature = samplingTemperature as number;
    }
  }

  /**
   * Record the actual viewport size and derive the model-input size from it.
   *
   * @param width - Viewport width in pixels.
   * @param height - Viewport height in pixels.
   */
  setViewport(width: number, height: number): void {
    const viewport = { width, height };
    this.currentViewport = viewport;

    // The resized viewport is what the system prompt reports as the screen
    // resolution and what model coordinates are scaled back from.
    const resized = this.smartResize(width, height);
    this.resizedViewport = resized;
  }

  /**
   * Remember the page URL; later steps include it in the text prompt that
   * accompanies each new screenshot.
   *
   * @param url - The URL to record.
   */
  setCurrentUrl(url: string): void {
    this.currentUrl = url;
  }

  /**
   * Register the callback used to obtain screenshots.
   *
   * @param provider - Async function resolving to the image as a base64
   *   string (without the `data:` URL prefix, which `captureScreenshot` adds).
   */
  setScreenshotProvider(provider: () => Promise<string>): void {
    this.screenshotProvider = provider;
  }

  /**
   * Register the callback that carries out each action produced by a step.
   *
   * @param handler - Async function invoked once per `AgentAction`.
   */
  setActionHandler(handler: (action: AgentAction) => Promise<void>): void {
    this.actionHandler = handler;
  }

  /**
   * FARA's smart-resize: snap both dimensions to a multiple of
   * `patch_size * merge_size` and keep the total pixel count inside
   * `[min_pixels, max_pixels]` from `MLM_PROCESSOR_IM_CFG`.
   *
   * @param width - Source width in pixels.
   * @param height - Source height in pixels.
   * @returns The adjusted `{ width, height }`.
   */
  private smartResize(
    width: number,
    height: number,
  ): { width: number; height: number } {
    const cfg = this.MLM_PROCESSOR_IM_CFG;
    const unit = cfg.patch_size * cfg.merge_size;
    const sourceArea = height * width;

    // Snap `value` to a multiple of `unit` using the given rounding function.
    const snap = (value: number, rounding: (v: number) => number): number =>
      rounding(value / unit) * unit;

    // Start from the nearest multiple, never smaller than one unit.
    let snappedHeight = Math.max(unit, snap(height, Math.round));
    let snappedWidth = Math.max(unit, snap(width, Math.round));
    const snappedArea = snappedHeight * snappedWidth;

    if (snappedArea > cfg.max_pixels) {
      // Too large: scale both sides down uniformly, rounding towards zero.
      const shrink = Math.sqrt(sourceArea / cfg.max_pixels);
      snappedHeight = snap(height / shrink, Math.floor);
      snappedWidth = snap(width / shrink, Math.floor);
    } else if (snappedArea < cfg.min_pixels) {
      // Too small: scale both sides up uniformly, rounding upwards.
      const grow = Math.sqrt(cfg.min_pixels / sourceArea);
      snappedHeight = snap(height * grow, Math.ceil);
      snappedWidth = snap(width * grow, Math.ceil);
    }

    return { width: snappedWidth, height: snappedHeight };
  }

  /**
   * Build the system prompt sent with every model call.
   *
   * The prompt consists of a minimal base instruction, the optional
   * user-provided instructions, and the `computer_use` tool schema embedded
   * in the `<tools>` / `<tool_call>` function-calling template. The screen
   * resolution reported to the model is the resized viewport, not the real
   * one.
   *
   * @returns The complete system prompt text.
   */
  private generateSystemPrompt(): string {
    const { width, height } = this.resizedViewport;

    // Base prompt - Minimalist like Python
    let basePrompt = "You are a helpful assistant.";

    // Add user-provided instructions if available
    if (this.userProvidedInstructions) {
      basePrompt = `${basePrompt}\n\n${this.userProvidedInstructions}`;
    }

    // Tool description from FaraComputerUse
    const toolDescription = `Use a mouse and keyboard to interact with a computer, and take screenshots.
* This is an interface to a desktop GUI. You do not have access to a terminal or applications menu. You must click on desktop icons to start applications.
* Some applications may take time to start or process actions, so you may need to wait and take successive screenshots to see the results of your actions. E.g. if you click on Firefox and a window doesn't open, try wait and taking another screenshot.
* The screen's resolution is ${width}x${height}.
* Whenever you intend to move the cursor to click on an element like an icon, you should consult a screenshot to determine the coordinates of the element before moving the cursor.
* If you tried clicking on a program or link but it failed to load, even after waiting, try adjusting your cursor position so that the tip of the cursor visually falls on the element that you want to click.
* Make sure to click any buttons, links, icons, etc with the cursor tip in the center of the element. Don't click boxes on their edges unless asked.
* When a separate scrollable container prominently overlays the webpage, if you want to scroll within it, you typically need to mouse_move() over it first and then scroll().
* If a popup window appears that you want to close, if left_click() on the 'X' or close button doesn't work, try key(keys=['Escape']) to close it.
* On some search bars, when you type(), you may need to press_enter=False and instead separately call left_click() on the search button to submit the search query. This is especially true of search bars that have auto-suggest popups for e.g. locations
* For calendar widgets, you usually need to left_click() on arrows to move between months and left_click() on dates to select them; type() is not typically used to input dates there.`;

    // Tool parameters description
    const actionsDescription = `The action to perform. The available actions are:
* \`key\`: Performs key down presses on the arguments passed in order, then performs key releases in reverse order. Includes "Enter", "Alt", "Shift", "Tab", "Control", "Backspace", "Delete", "Escape", "ArrowUp", "ArrowDown", "ArrowLeft", "ArrowRight", "PageDown", "PageUp", "Shift", etc.
* \`type\`: Type a string of text on the keyboard.
* \`mouse_move\`: Move the cursor to a specified (x, y) pixel coordinate on the screen.
* \`left_click\`: Click the left mouse button.
* \`scroll\`: Performs a scroll of the mouse scroll wheel.
* \`history_back\`: Go back to the previous page in the browser history.
* \`pause_and_memorize_fact\`: Pause and memorize a fact for future reference.
* \`visit_url\`: Visit a specified URL.
* \`web_search\`: Perform a web search with a specified query.
* \`wait\`: Wait specified seconds for the change to happen.
* \`terminate\`: Terminate the current task and report its completion status.`;

    // Tool JSON schema
    const toolSchema = {
      name: "computer_use",
      description: toolDescription,
      parameters: {
        type: "object",
        required: ["action"],
        properties: {
          action: {
            type: "string",
            description: actionsDescription,
            enum: [
              "key",
              "type",
              "mouse_move",
              "left_click",
              "scroll",
              "visit_url",
              "web_search",
              "history_back",
              "pause_and_memorize_fact",
              "wait",
              "terminate",
            ],
          },
          keys: {
            type: "array",
            description: "Required only by `action=key`.",
          },
          text: {
            type: "string",
            description: "Required only by `action=type`.",
          },
          press_enter: {
            type: "boolean",
            description:
              "Whether to press the Enter key after typing. Required only by `action=type`.",
          },
          delete_existing_text: {
            type: "boolean",
            description:
              "Whether to delete existing text before typing. Required only by `action=type`.",
          },
          coordinate: {
            type: "array",
            description:
              "(x, y): The x (pixels from the left edge) and y (pixels from the top edge) coordinates to move the mouse to. Required only by `action=left_click`, `action=mouse_move`, and `action=type`.",
          },
          pixels: {
            type: "number",
            description:
              "The amount of scrolling to perform. Positive values scroll up, negative values scroll down. Required only by `action=scroll`.",
          },
          fact: {
            type: "string",
            description:
              "The fact to remember for the future. Required only by `action=pause_and_memorize_fact`.",
          },
          time: {
            type: "number",
            description: "The seconds to wait. Required only by `action=wait`.",
          },
          status: {
            type: "string",
            description:
              "The status of the task. Required only by `action=terminate`.",
            enum: ["success", "failure"],
          },
        },
      },
    };

    // Format as FARA function calling template (FN_CALL_TEMPLATE format).
    // The example call uses SINGLE braces: the doubled `{{ ... }}` form is a
    // Python `str.format` escape that renders as `{ ... }`. A JS template
    // literal does not collapse it, so copying it verbatim would show the
    // model invalid JSON and invite it to echo the extra braces back.
    const toolDescs = JSON.stringify(toolSchema, null, 2);
    const functionCallTemplate = `
You are provided with function signatures within <tools></tools> XML tags:
<tools>
${toolDescs}
</tools>

For each function call, return a json object with function name and arguments within <tool_call></tool_call> XML tags:
<tool_call>
{"name": <function-name>, "arguments": <args-json-object>}
</tool_call>`;

    return `${basePrompt}\n\n${functionCallTemplate}`;
  }

  /**
   * Split a raw model response into free-text thoughts and the tool call.
   *
   * FARA uses XML-based tool calling: everything before the first
   * `<tool_call>` tag is treated as the model's thoughts, and the text
   * between `<tool_call>` and `</tool_call>` is parsed as JSON.
   *
   * Parsing is deliberately tolerant:
   * - whitespace around the tags is optional (no newline is required);
   * - a missing closing tag is accepted (the rest of the response is used);
   * - payloads wrapped in doubled braces (`{{...}` or `{{...}}`) are repaired.
   *
   * @param response - Raw assistant message content.
   * @returns The thoughts plus a function call whose arguments also carry
   *   the thoughts under `thoughts`.
   * @throws Error (with the underlying failure as `cause`) when no tool call
   *   can be extracted or its payload is not a JSON object.
   */
  private parseThoughtsAndAction(response: string): {
    thoughts: string;
    functionCall: FaraFunctionCall;
  } {
    const openTag = "<tool_call>";
    const closeTag = "</tool_call>";

    try {
      const openIndex = response.indexOf(openTag);
      if (openIndex === -1) {
        throw new Error("No <tool_call> tag found in model response");
      }

      const thoughts = response.slice(0, openIndex).trim();
      const afterOpen = response.slice(openIndex + openTag.length);
      const closeIndex = afterOpen.indexOf(closeTag);
      const actionText = (
        closeIndex === -1 ? afterOpen : afterOpen.slice(0, closeIndex)
      ).trim();

      // Candidate payloads, tried in order. The repairs cover the model
      // echoing a doubled opening brace, with or without a doubled closing one.
      const candidates = [actionText];
      if (actionText.startsWith("{{")) {
        candidates.push(actionText.slice(1));
        if (actionText.endsWith("}}")) {
          candidates.push(actionText.slice(1, -1));
        }
      }

      let parsedAction;
      let parsedOk = false;
      let lastJsonError: unknown;
      for (const candidate of candidates) {
        try {
          parsedAction = JSON.parse(candidate);
          parsedOk = true;
          break;
        } catch (jsonError) {
          lastJsonError = jsonError;
        }
      }

      if (!parsedOk) {
        throw new Error(
          `Failed to parse action text as JSON: ${actionText}. Error: ${lastJsonError}`,
          { cause: lastJsonError },
        );
      }

      // JSON scalars / null parse fine but cannot describe a tool call.
      if (parsedAction === null || typeof parsedAction !== "object") {
        throw new Error(
          `Tool call payload is not a JSON object: ${actionText}`,
        );
      }

      return {
        thoughts,
        functionCall: {
          name: parsedAction.name || "computer_use",
          arguments: {
            ...parsedAction.arguments,
            thoughts,
          },
        },
      };
    } catch (error) {
      throw new Error(
        `Failed to parse FARA tool call from response: ${response}. Error: ${error}`,
        { cause: error },
      );
    }
  }

  /**
   * Convert a FARA function call into a Stagehand `AgentAction`.
   *
   * Coordinates supplied by the model are expressed in the resized viewport
   * and are scaled back to the real viewport here. Actions whose required
   * argument is missing (`coordinate` for `left_click` / `mouse_move`, `url`
   * for `visit_url`, `query` for `web_search`) are rejected with a
   * descriptive error instead of failing with an opaque `TypeError` or
   * navigating to a search for the literal text "undefined".
   *
   * Side effect: `pause_and_memorize_fact` appends the fact to `this.facts`.
   *
   * @param functionCall - Parsed tool call from the model.
   * @returns The equivalent action; unrecognised actions are passed through
   *   with all their arguments.
   * @throws Error when a required argument is missing or malformed.
   */
  private convertFunctionCallToAction(
    functionCall: FaraFunctionCall,
  ): AgentAction {
    const args = functionCall.arguments;
    const action = args.action as string;

    // Transform coordinates from resized to original viewport
    const transformCoordinate = (coord: number[]): number[] => {
      if (!coord || coord.length !== 2) return coord;
      const [x, y] = coord;
      const scaleX = this.currentViewport.width / this.resizedViewport.width;
      const scaleY = this.currentViewport.height / this.resizedViewport.height;
      return [Math.round(x * scaleX), Math.round(y * scaleY)];
    };

    // Fetch and scale a mandatory coordinate, failing loudly when absent.
    const requireCoordinate = (): number[] => {
      const coord = args.coordinate;
      if (!Array.isArray(coord) || coord.length < 2) {
        throw new Error(
          `FARA action "${action}" requires a \`coordinate\` of the form [x, y], received: ${JSON.stringify(coord)}`,
        );
      }
      return transformCoordinate(coord as number[]);
    };

    // Fetch a mandatory non-empty string argument, failing loudly when absent.
    const requireString = (key: string): string => {
      const value = args[key];
      if (typeof value !== "string" || value.trim() === "") {
        throw new Error(
          `FARA action "${action}" requires a non-empty string \`${key}\`, received: ${JSON.stringify(value)}`,
        );
      }
      return value;
    };

    const baseAction = {
      type: action,
      reasoning: args.thoughts as string,
    };

    switch (action) {
      case "left_click": {
        const clickCoord = requireCoordinate();
        return {
          ...baseAction,
          type: "click",
          x: clickCoord[0],
          y: clickCoord[1],
          button: "left" as const,
        };
      }

      case "mouse_move": {
        const moveCoord = requireCoordinate();
        return {
          ...baseAction,
          type: "move",
          coordinate: moveCoord,
        };
      }

      case "type": {
        // Coordinates are optional here: without them the text is typed
        // into whatever currently has focus.
        const typeCoord = args.coordinate
          ? transformCoordinate(args.coordinate as number[])
          : undefined;
        return {
          ...baseAction,
          text: args.text as string,
          ...(typeCoord && { x: typeCoord[0], y: typeCoord[1] }),
          press_enter:
            args.press_enter !== undefined
              ? (args.press_enter as boolean)
              : true,
          ...(args.delete_existing_text !== undefined && {
            delete_existing_text: args.delete_existing_text as boolean,
          }),
        };
      }

      case "key":
      case "keypress": {
        const keys = (args.keys as string[]) || [];
        // Normalize keys to Playwright format
        const normalizedKeys = keys.map((k) => mapKeyToPlaywright(k));
        return {
          ...baseAction,
          type: "keypress",
          keys: normalizedKeys,
        };
      }

      case "scroll": {
        const pixels = (args.pixels as number) || 0;
        // FARA: positive = scroll up, negative = scroll down
        // Convert to scroll_x/scroll_y
        return {
          ...baseAction,
          scroll_x: 0,
          scroll_y: -pixels, // Invert: negative pixels = scroll down
        };
      }

      case "visit_url": {
        let url = requireString("url");
        // Enhanced URL processing like Python
        if (
          !url.startsWith("https://") &&
          !url.startsWith("http://") &&
          !url.startsWith("file://") &&
          !url.startsWith("about:")
        ) {
          // If URL contains space, treat as search query
          if (url.includes(" ")) {
            url = `https://www.bing.com/search?q=${encodeURIComponent(url)}&FORM=QBLH`;
          } else {
            // Otherwise prefix with https://
            url = "https://" + url;
          }
        }
        return {
          ...baseAction,
          type: "goto",
          url,
        };
      }

      case "web_search": {
        // Convert web search to visit_url with Bing search
        const query = requireString("query");
        const searchUrl = `https://www.bing.com/search?q=${encodeURIComponent(query)}&FORM=QBLH`;
        return {
          ...baseAction,
          type: "goto",
          url: searchUrl,
        };
      }

      case "history_back":
        return {
          ...baseAction,
          type: "back",
        };

      case "wait": {
        // Support both 'time' and 'duration' parameters with default (matches Python)
        const durationSeconds =
          (args.time as number) || (args.duration as number) || 3.0;
        return {
          ...baseAction,
          timeMs: durationSeconds * 1000, // Convert seconds to ms
        };
      }

      case "pause_and_memorize_fact": {
        // Store the fact for future reference (matches Python)
        const fact = args.fact as string;
        this.facts.push(fact);
        return {
          ...baseAction,
          fact,
        };
      }

      case "terminate":
        return {
          ...baseAction,
          status: args.status as string,
        };

      default:
        // Unknown action: forward every argument untouched.
        return {
          ...baseAction,
          ...args,
        };
    }
  }

  /**
   * Take a screenshot through the registered provider.
   *
   * @returns The image as a `data:image/png;base64,...` URL.
   * @throws AgentScreenshotProviderError when no provider has been registered.
   */
  async captureScreenshot(): Promise<string> {
    if (this.screenshotProvider) {
      const encodedImage = await this.screenshotProvider();
      return `data:image/png;base64,${encodedImage}`;
    }

    throw new AgentScreenshotProviderError("Screenshot provider not set");
  }

  /**
   * Drop screenshots from older messages so that only the most recent ones
   * are sent to the model (port of Python's `maybe_remove_old_screenshots`).
   *
   * Messages are scanned newest-first. Images are retained until the budget
   * is used up; after that, image parts are stripped and a message is
   * dropped entirely if nothing but images was in it. Messages without
   * images are always kept. The input array and its messages are not mutated.
   *
   * @param history - Messages in chronological order.
   * @param includesCurrent - When false (default) one slot of `maxImages` is
   *   held back, so at most `maxImages - 1` images are retained.
   * @returns The filtered history in chronological order, or `history`
   *   itself when `maxImages` is zero or negative.
   */
  private maybeRemoveOldScreenshots(
    history: FaraMessage[],
    includesCurrent: boolean = false,
  ): FaraMessage[] {
    if (this.maxImages <= 0) {
      return history;
    }

    const imageBudget = this.maxImages - (includesCurrent ? 0 : 1);
    const isImagePart = (part: FaraMessageContent): boolean =>
      part.type === "image_url";

    // Collected newest-first; flipped back to chronological order on return.
    const keptNewestFirst: FaraMessage[] = [];
    let imagesKept = 0;

    for (let index = history.length - 1; index >= 0; index--) {
      const message = history[index];
      const parts = Array.isArray(message.content)
        ? message.content
        : undefined;

      // The very first message holds the task: once the budget is spent its
      // text is preserved but any image is removed.
      if (index === 0 && imagesKept >= imageBudget) {
        if (!parts) {
          keptNewestFirst.push(message);
          continue;
        }
        const textOnly = parts.filter((part) => !isImagePart(part));
        if (textOnly.length > 0) {
          keptNewestFirst.push({ ...message, content: textOnly });
        }
        continue;
      }

      // Messages without an image are always kept untouched.
      if (!parts || !parts.some((part) => isImagePart(part))) {
        keptNewestFirst.push(message);
        continue;
      }

      // Image-bearing message within budget: keep it whole.
      if (imagesKept < imageBudget) {
        keptNewestFirst.push(message);
        imagesKept++;
        continue;
      }

      // Budget exhausted: keep whatever non-image parts remain, if any.
      const textOnly = parts.filter((part) => !isImagePart(part));
      if (textOnly.length > 0) {
        keptNewestFirst.push({ ...message, content: textOnly });
      }
    }

    return keptNewestFirst.reverse();
  }

  /**
   * Build the message list for the next API call.
   *
   * Walks the conceptual conversation history and substitutes each assistant
   * turn with the corresponding raw model response from `actionHistory`
   * (matched by order). The result is then trimmed so that at most
   * `maxImages` screenshots are sent.
   *
   * The conversation history already contains the screenshot for the
   * current step when this runs, so the trimmer is told the current image is
   * included. Without that, one slot would be reserved for an image that is
   * already counted: only `maxImages - 1` screenshots would survive and, with
   * `maxImages = 1`, the model would receive no screenshot at all.
   *
   * @returns Messages in chronological order, without the system prompt.
   */
  private reconstructHistory(): FaraMessage[] {
    const history: FaraMessage[] = [];
    let actionTurn = 0;

    for (const m of this.conversationHistory) {
      if (m.role !== "assistant") {
        history.push(m);
        continue;
      }

      if (actionTurn >= this.actionHistory.length) {
        // Should not happen if synced correctly
        console.warn("OUT OF SYNC: Action history shorter than chat history");
        history.push(m);
      } else {
        history.push(this.actionHistory[actionTurn]);
        actionTurn++;
      }
    }

    return this.maybeRemoveOldScreenshots(history, true);
  }

  /**
   * Execute a single agent step: capture a screenshot, query the model,
   * parse its tool call and run the resulting action(s).
   *
   * Order matters here: the screenshot is added to `conversationHistory`
   * before the history is reconstructed, and the assistant reply is appended
   * to both histories before it is parsed, so a parse failure leaves the raw
   * reply recorded.
   *
   * @param logger - Sink for progress and error log lines.
   * @param isFirstRound - When true the screenshot is merged into the initial
   *   user message instead of being appended as a new user message.
   * @returns The action(s) produced by this step, whether the model asked to
   *   terminate, and token / latency usage for the API call.
   * @throws AgentScreenshotProviderError when no screenshot provider is set.
   * @throws Whatever the API call, response parsing, or action handler throws.
   */
  private async executeStep(
    logger: (message: LogLine) => void,
    isFirstRound: boolean = false,
  ): Promise<{
    actions: AgentAction[];
    completed: boolean;
    usage: {
      input_tokens: number;
      output_tokens: number;
      inference_time_ms: number;
    };
  }> {
    // Capture screenshot
    const screenshotDataUrl = await this.captureScreenshot();

    // Update conversation history with new screenshot/message
    if (isFirstRound) {
      // First round: modify the last message (initial user instruction) to include screenshot
      const lastMessage =
        this.conversationHistory[this.conversationHistory.length - 1];
      if (lastMessage && lastMessage.role === "user") {
        // Recover the instruction text whether the content is still a plain
        // string or has already been converted to a parts array.
        const originalContent =
          typeof lastMessage.content === "string"
            ? lastMessage.content
            : (lastMessage.content.find((c) => c.type === "text")?.text ??
              "Start task");

        // Image first, then the instruction text.
        lastMessage.content = [
          {
            type: "image_url",
            image_url: { url: screenshotDataUrl },
          },
          {
            type: "text",
            text: originalContent,
          },
        ];
      }
    } else {
      // Subsequent rounds: add new user message with screenshot
      const userContent: FaraMessageContent[] = [
        {
          type: "image_url",
          image_url: { url: screenshotDataUrl },
        },
      ];

      // Add current URL if available
      let textPrompt =
        "Here is the next screenshot. Think about what to do next.";
      if (this.currentUrl) {
        // Long URLs are cut to 100 characters plus an ellipsis.
        const trimmedUrl =
          this.currentUrl.length > 100
            ? this.currentUrl.slice(0, 100) + "..."
            : this.currentUrl;
        textPrompt = `Current URL: ${trimmedUrl}\n${textPrompt}`;
      }

      userContent.push({
        type: "text",
        text: textPrompt,
      });

      this.conversationHistory.push({
        role: "user",
        content: userContent,
      });
    }

    // Reconstruct history for model call
    let history = this.reconstructHistory();

    // Prepend system prompt (generated fresh)
    const systemMessage: FaraMessage = {
      role: "system",
      content: this.generateSystemPrompt(),
    };
    history = [systemMessage, ...history];

    // Make API call
    logger({
      category: "agent",
      message: `Making API call to FARA model with ${history.length} messages`,
      level: 2,
    });

    const startTime = Date.now();
    let response;
    try {
      response = await this.client.chat.completions.create({
        model: this.modelName,
        messages: history as unknown as ChatCompletionMessageParam[],
        temperature: this.temperature,
      });
    } catch (apiError) {
      // Log the failure, then let the caller decide how to handle it.
      logger({
        category: "agent",
        message: `API call failed: ${apiError instanceof Error ? apiError.message : String(apiError)}`,
        level: 0,
      });
      throw apiError;
    }
    const inferenceTime = Date.now() - startTime;

    logger({
      category: "agent",
      message: `API call completed in ${inferenceTime}ms`,
      level: 2,
    });

    // NOTE(review): assumes the response carries at least one choice; an
    // empty `choices` array would raise a TypeError here — confirm whether
    // the endpoint can return one.
    const content = response.choices[0].message.content || "";
    // Fall back to zeroed counters when the endpoint omits usage data.
    const usage = response.usage || {
      prompt_tokens: 0,
      completion_tokens: 0,
      total_tokens: 0,
    };

    // Add assistant response to both histories
    const assistantMsg: FaraMessage = {
      role: "assistant",
      content,
    };
    this.conversationHistory.push(assistantMsg);
    this.actionHistory.push(assistantMsg);

    logger({
      category: "agent",
      message: `Model response: ${content}`,
      level: 2,
    });

    // Parse tool call
    const { thoughts, functionCall } = this.parseThoughtsAndAction(content);

    logger({
      category: "agent",
      message: `Thoughts: ${thoughts}`,
      level: 2,
    });

    logger({
      category: "agent",
      message: `Action: ${JSON.stringify(functionCall.arguments)}`,
      level: 2,
    });

    // Convert to AgentAction
    const agentAction = this.convertFunctionCallToAction(functionCall);

    // Expand type action into multiple actions if it has coordinates
    // NOTE(review): the expanded actions do not carry `reasoning`, so the
    // model's thoughts for such a step are not present on any returned action.
    const actions: AgentAction[] = [];
    if (
      agentAction.type === "type" &&
      typeof agentAction.x === "number" &&
      typeof agentAction.y === "number"
    ) {
      // First, click at the coordinates to focus the field
      actions.push({
        type: "click",
        x: agentAction.x,
        y: agentAction.y,
        button: "left",
      });

      // If delete_existing_text is true, clear the field first
      // NOTE(review): "Command+A" looks like the macOS select-all chord —
      // confirm the action handler maps it correctly on other platforms.
      if (agentAction.delete_existing_text) {
        actions.push({
          type: "keypress",
          keys: ["Command+A"],
        });
        actions.push({
          type: "keypress",
          keys: ["Backspace"],
        });
      }

      // Add the type action (without coordinates since we already clicked)
      actions.push({
        type: "type",
        text: agentAction.text,
      });

      // If press_enter is true (default), press Enter after typing
      if (agentAction.press_enter !== false) {
        actions.push({
          type: "keypress",
          keys: ["Enter"],
        });
      }
    } else {
      // For all other actions, just add as-is
      actions.push(agentAction);
    }

    // Execute all actions if handler is available
    // (`terminate` is reported to the caller but never sent to the handler.)
    if (this.actionHandler && agentAction.type !== "terminate") {
      for (const action of actions) {
        await this.actionHandler(action);
      }
    }

    // Check if completed
    const completed = functionCall.arguments.action === "terminate";

    return {
      actions,
      completed,
      usage: {
        input_tokens: usage.prompt_tokens,
        output_tokens: usage.completion_tokens,
        inference_time_ms: inferenceTime,
      },
    };
  }

  /**
   * Execute a task with the FARA CUA. This is the main entry point for the
   * agent.
   *
   * Both histories are reset, then steps run until the model issues
   * `terminate` or `maxSteps` (default 10) is reached. Token counts and
   * inference time are summed across steps.
   *
   * In the result, `completed` reports whether the model terminated the task
   * and `success` reports whether it did so with status "success". A run
   * that terminates with any other status is completed but not successful,
   * matching the "Task completed with failures." message.
   *
   * @implements AgentClient.execute
   * @param executionOptions - Carries the instruction, optional `maxSteps`,
   *   and the logger.
   * @returns The collected actions, a summary message built from each step's
   *   reasoning, completion / success flags, and aggregate usage.
   * @throws Any error raised while running a step, after logging it.
   */
  async execute(executionOptions: AgentExecutionOptions): Promise<AgentResult> {
    const { options, logger } = executionOptions;
    const { instruction } = options;
    const maxSteps = options.maxSteps || 10;

    let currentStep = 0;
    let completed = false;
    // True only when the model terminated with status "success".
    let succeeded = false;
    const actions: AgentAction[] = [];
    const messageList: string[] = [];
    let finalMessage: string;
    let totalInputTokens = 0;
    let totalOutputTokens = 0;
    let totalInferenceTime = 0;

    // Initialize conversation with user instruction
    // System prompt is NOT added here, it's added dynamically in executeStep
    this.conversationHistory = [
      {
        role: "user",
        content: instruction,
      },
    ];
    this.actionHistory = [];

    try {
      // Execute steps until completion or max steps reached
      while (!completed && currentStep < maxSteps) {
        await this.preStepHook?.();

        logger({
          category: "agent",
          message: `Executing step ${currentStep + 1}/${maxSteps}`,
          level: 1,
        });

        const isFirstRound = currentStep === 0;
        const result = await this.executeStep(logger, isFirstRound);
        totalInputTokens += result.usage.input_tokens;
        totalOutputTokens += result.usage.output_tokens;
        totalInferenceTime += result.usage.inference_time_ms;

        // Add actions to the list
        actions.push(...result.actions);

        // Update completion status
        completed = result.completed;

        currentStep++;

        // Record message for this step
        const lastAction = result.actions[result.actions.length - 1];
        if (lastAction?.reasoning) {
          messageList.push(lastAction.reasoning);
        }
      }

      // Generate final message
      if (completed) {
        // The terminating action is the last one recorded and carries the
        // model's self-reported status.
        const lastAction = actions[actions.length - 1];
        succeeded = (lastAction as { status?: string })?.status === "success";
        finalMessage = succeeded
          ? "Task completed successfully."
          : "Task completed with failures.";
      } else {
        finalMessage = `Reached maximum steps (${maxSteps}) without completion.`;
      }

      if (messageList.length > 0) {
        finalMessage = `${messageList.join("\n\n")}\n\n${finalMessage}`;
      }

      return {
        success: succeeded,
        completed,
        message: finalMessage,
        actions,
        usage: {
          input_tokens: totalInputTokens,
          output_tokens: totalOutputTokens,
          inference_time_ms: totalInferenceTime,
        },
      };
    } catch (error) {
      logger({
        category: "agent",
        message: `Error during execution: ${error}`,
        level: 0,
      });

      // Rethrow to allow eval runner's retry logic to handle transient errors
      throw error;
    }
  }
}


================================================
FILE: packages/core/lib/v3/agent/OpenAICUAClient.ts
================================================
import OpenAI from "openai";
import { LogLine } from "../types/public/logs.js";
import {
  AgentAction,
  AgentResult,
  AgentType,
  AgentExecutionOptions,
  ResponseInputItem,
  ResponseItem,
  ComputerCallItem,
  FunctionCallItem,
  SafetyCheck,
  SafetyConfirmationHandler,
} from "../types/public/agent.js";
import { ClientOptions } from "../types/public/model.js";
import { AgentClient } from "./AgentClient.js";
import {
  AgentScreenshotProviderError,
  StagehandClosedError,
} from "../types/public/sdkErrors.js";
import { ToolSet } from "ai";
import {
  FlowLogger,
  extractLlmCuaPromptSummary,
  extractLlmCuaResponseSummary,
} from "../flowlogger/FlowLogger.js";
import { v7 as uuidv7 } from "uuid";

/**
 * Client for OpenAI's Computer Use Assistant API
 * This implementation uses the official OpenAI Responses API for Computer Use
 */
const CAPTCHA_PROCEED_TOOL = "captchaSolvedProceed";

export class OpenAICUAClient extends AgentClient {
  // Notes queued by addContextNote(); execute() drains them after a step and
  // appends each one to the next request as a user message.
  private pendingContextNotes: string[] = [];
  // True while the captcha-proceed function tool should be advertised to the
  // model; set by addContextNote(), cleared in takeAction() once it is called.
  private captchaSolvedToolActive = false;
  // API key resolved from clientOptions.apiKey or OPENAI_API_KEY ("" if neither).
  private apiKey: string;
  // Organization id resolved from clientOptions.organization or OPENAI_ORG.
  private organization?: string;
  // Optional API base URL override taken from clientOptions.baseURL.
  private baseURL: string;
  // OpenAI SDK instance used for responses.create().
  private client: OpenAI;
  // Id of the most recent response returned by getAction().
  public lastResponseId?: string;
  // Display size reported to the computer-use tool (display_width/height).
  private currentViewport = { width: 1288, height: 711 };
  // When set, attached as current_url to every computer_call_output.
  private currentUrl?: string;
  // Supplies a base64-encoded image; captureScreenshot() wraps it in a PNG data URL.
  private screenshotProvider?: () => Promise<string>;
  // Callback invoked in takeAction() for each converted model action.
  private actionHandler?: (action: AgentAction) => Promise<void>;
  // Reasoning items seen during the current execute() run, keyed by item id.
  private reasoningItems: Map<string, ResponseItem> = new Map();
  private environment: string = "browser"; // "browser", "mac", "windows", or "ubuntu"
  // Custom tools exposed to the model as function tools and run in takeAction().
  private tools?: ToolSet;
  // Optional callback consulted for pending safety checks; when absent the
  // checks are acknowledged automatically.
  private safetyConfirmationHandler?: SafetyConfirmationHandler;

  /**
   * Builds a client bound to one OpenAI computer-use model.
   *
   * @param type - Agent type forwarded to the AgentClient base class
   * @param modelName - Model identifier sent with every request
   * @param userProvidedInstructions - Optional system instructions
   * @param clientOptions - Optional overrides: `apiKey`, `baseURL`,
   *   `organization` and `environment`. Missing values fall back to the
   *   OPENAI_API_KEY / OPENAI_ORG environment variables where applicable.
   * @param tools - Optional custom tools exposed to the model as function tools
   */
  constructor(
    type: AgentType,
    modelName: string,
    userProvidedInstructions?: string,
    clientOptions?: ClientOptions,
    tools?: ToolSet,
  ) {
    super(type, modelName, userProvidedInstructions);

    // Process client options
    this.apiKey =
      (clientOptions?.apiKey as string) || process.env.OPENAI_API_KEY || "";
    this.baseURL = (clientOptions?.baseURL as string) || undefined;
    this.organization =
      (clientOptions?.organization as string) || process.env.OPENAI_ORG;

    // Get environment if specified
    if (
      clientOptions?.environment &&
      typeof clientOptions.environment === "string"
    ) {
      this.environment = clientOptions.environment;
    }

    // Store client options for reference
    this.clientOptions = {
      apiKey: this.apiKey,
    };

    if (this.baseURL) {
      this.clientOptions.baseURL = this.baseURL;
    }

    // Forward the organization as well; previously it was resolved above but
    // never handed to the SDK, so the setting had no effect.
    if (this.organization) {
      this.clientOptions.organization = this.organization;
    }

    // Initialize the OpenAI client
    this.client = new OpenAI(this.clientOptions);

    this.tools = tools;
  }

  /**
   * Sets the display size reported to the computer-use tool on later requests.
   */
  setViewport(width: number, height: number): void {
    this.currentViewport = { width, height };
  }

  /**
   * Records the current page URL; it is attached as `current_url` to
   * subsequent computer_call_output items.
   */
  setCurrentUrl(url: string): void {
    this.currentUrl = url;
  }

  /**
   * Registers the callback used by captureScreenshot(). Its resolved string is
   * embedded after a `data:image/png;base64,` prefix.
   */
  setScreenshotProvider(provider: () => Promise<string>): void {
    this.screenshotProvider = provider;
  }

  /**
   * Registers the callback that takeAction() invokes for each model action.
   */
  setActionHandler(handler: (action: AgentAction) => Promise<void>): void {
    this.actionHandler = handler;
  }

  /**
   * Replaces the set of custom tools offered to the model.
   */
  setTools(tools: ToolSet): void {
    this.tools = tools;
  }

  /**
   * Sets (or clears, when omitted) the callback consulted for pending safety
   * checks. Without a handler the checks are acknowledged automatically.
   */
  setSafetyConfirmationHandler(handler?: SafetyConfirmationHandler): void {
    this.safetyConfirmationHandler = handler;
  }

  /**
   * Queues a note that will be sent to the model as a user message on a
   * later step.
   *
   * Any note mentioning "captcha" (case-insensitive) also switches on the
   * captcha-proceed tool, giving the model a structured way to continue
   * rather than relying on parsing its English phrasing.
   */
  addContextNote(note: string): void {
    this.pendingContextNotes.push(note);

    const mentionsCaptcha = note.toLowerCase().includes("captcha");
    // Only ever flips the flag on; takeAction() is responsible for resetting it.
    this.captchaSolvedToolActive =
      this.captchaSolvedToolActive || mentionsCaptcha;
  }

  /**
   * Runs a task against the OpenAI CUA until the model stops requesting
   * actions or the step budget (`options.maxSteps`, default 10) is spent.
   *
   * Failures are logged and reported through the returned result
   * (`success: false`) rather than thrown.
   *
   * @param executionOptions - Carries the instruction, step limit and logger
   * @returns Actions taken, the last model message, completion flag and the
   *   accumulated token/latency usage
   * @implements AgentClient.execute
   */
  async execute(executionOptions: AgentExecutionOptions): Promise<AgentResult> {
    const { options, logger } = executionOptions;
    const stepLimit = options.maxSteps || 10;

    const actions: AgentAction[] = [];
    // Every step message is collected here; only the most recent one is
    // surfaced in the result.
    const messageList: string[] = [];
    const usageTotals = {
      input_tokens: 0,
      output_tokens: 0,
      inference_time_ms: 0,
    };
    let completed = false;
    let finalMessage = "";

    // Reasoning items from an earlier run must not leak into this one.
    this.reasoningItems.clear();

    // The conversation opens with the system and user instruction items.
    let inputItems = this.createInitialInputItems(options.instruction);
    let previousResponseId: string | undefined = undefined;

    try {
      for (let step = 0; step < stepLimit && !completed; step++) {
        await this.preStepHook?.();

        logger({
          category: "agent",
          message: `Executing step ${step + 1}/${stepLimit}`,
          level: 1,
        });

        const stepResult = await this.executeStep(
          inputItems,
          previousResponseId,
          logger,
        );

        usageTotals.input_tokens += stepResult.usage.input_tokens;
        usageTotals.output_tokens += stepResult.usage.output_tokens;
        usageTotals.inference_time_ms += stepResult.usage.inference_time_ms;

        actions.push(...stepResult.actions);
        completed = stepResult.completed;

        // Chain the next request onto this response.
        previousResponseId = stepResult.responseId;

        if (!completed) {
          // Feed the action outputs back, followed by any queued notes.
          const notes = this.drainContextNotes();
          inputItems =
            notes.length > 0
              ? [
                  ...stepResult.nextInputItems,
                  ...notes.map((note) => ({
                    role: "user" as const,
                    content: note,
                  })),
                ]
              : stepResult.nextInputItems;
        }

        if (stepResult.message) {
          messageList.push(stepResult.message);
          finalMessage = stepResult.message;
        }
      }

      return {
        success: completed,
        actions,
        message: finalMessage,
        completed,
        usage: usageTotals,
      };
    } catch (error) {
      const errorMessage =
        error instanceof Error ? error.message : String(error);
      logger({
        category: "agent",
        message: `Error executing agent task: ${errorMessage}`,
        level: 0,
      });

      // Report the failure together with whatever was accomplished so far.
      return {
        success: false,
        actions,
        message: `Failed to execute task: ${errorMessage}`,
        completed: false,
        usage: usageTotals,
      };
    }
  }

  /**
   * Performs one request/act cycle: ask the model what to do, record what
   * it said, carry out the requested actions and prepare the follow-up input.
   *
   * The step counts as completed when the model's output contains nothing
   * but message and reasoning items (including an empty output).
   *
   * @param inputItems - Items to send with this request
   * @param previousResponseId - Id of the prior response, if any
   * @param logger - Sink for log lines
   * @returns Actions found, concatenated message text, completion flag,
   *   input items for the next request, the response id and usage figures
   * @throws Re-throws any error after logging it
   */
  async executeStep(
    inputItems: ResponseInputItem[],
    previousResponseId: string | undefined,
    logger: (message: LogLine) => void,
  ): Promise<{
    actions: AgentAction[];
    message: string;
    completed: boolean;
    nextInputItems: ResponseInputItem[];
    responseId: string;
    usage: {
      input_tokens: number;
      output_tokens: number;
      inference_time_ms: number;
    };
  }> {
    try {
      const modelResult = await this.getAction(inputItems, previousResponseId);
      const { output, responseId } = modelResult;
      const usage = {
        input_tokens: modelResult.usage.input_tokens,
        output_tokens: modelResult.usage.output_tokens,
        inference_time_ms: modelResult.usage.inference_time_ms,
      };

      // Pass 1: remember and log reasoning items.
      for (const item of output) {
        if (item.type !== "reasoning") {
          continue;
        }
        this.reasoningItems.set(item.id, item);
        logger({
          category: "agent",
          message: `Reasoning: ${String(item.content || "")}`,
          level: 1,
        });
      }

      // Pass 2: translate computer/function calls into agent actions.
      const stepActions: AgentAction[] = [];
      const collect = (action: AgentAction | null, origin: string): void => {
        if (!action) {
          return;
        }
        stepActions.push(action);
        logger({
          category: "agent",
          message: `Converted ${origin} to action: ${action.type}`,
          level: 2,
        });
      };

      for (const item of output) {
        if (item.type === "computer_call" && this.isComputerCallItem(item)) {
          logger({
            category: "agent",
            message: `Found computer_call: ${item.action.type}, payload: ${JSON.stringify(item.action)}, call_id: ${item.call_id}`,
            level: 2,
          });
          collect(this.convertComputerCallToAction(item), "computer_call");
        } else if (
          item.type === "function_call" &&
          this.isFunctionCallItem(item)
        ) {
          logger({
            category: "agent",
            message: `Found function_call: ${item.name}, call_id: ${item.call_id}`,
            level: 2,
          });
          collect(this.convertFunctionCallToAction(item), "function_call");
        }
      }

      // Pass 3: gather the text of every message block.
      let messageText = "";
      for (const item of output) {
        if (item.type !== "message") {
          continue;
        }
        logger({
          category: "agent",
          message: `Found message block`,
          level: 2,
        });
        if (item.content && Array.isArray(item.content)) {
          for (const part of item.content) {
            if (part.type === "output_text" && part.text) {
              messageText += part.text + "\n";
              logger({
                category: "agent",
                message: `Message text: ${String(part.text || "")}`,
                level: 1,
              });
            }
          }
        }
      }

      // Carry out the requested actions and collect their outputs.
      const nextInputItems = await this.takeAction(output, logger);

      // Done when nothing other than messages/reasoning was produced.
      const completed = !output.some(
        (item) => item.type !== "message" && item.type !== "reasoning",
      );

      return {
        actions: stepActions,
        message: messageText.trim(),
        completed,
        nextInputItems,
        responseId,
        usage,
      };
    } catch (error) {
      const errorMessage =
        error instanceof Error ? error.message : String(error);
      logger({
        category: "agent",
        message: `Error executing step: ${errorMessage}`,
        level: 0,
      });

      throw error;
    }
  }

  /**
   * Type guard for computer_call items: requires a `call_id` and a non-null
   * object `action`.
   *
   * The explicit null check matters because `typeof null === "object"`;
   * without it a null action would pass the guard and callers would then
   * fail when reading `action.type`.
   */
  private isComputerCallItem(item: ResponseItem): item is ComputerCallItem {
    return (
      item.type === "computer_call" &&
      "call_id" in item &&
      "action" in item &&
      typeof item.action === "object" &&
      item.action !== null
    );
  }

  /**
   * Decides which pending safety checks get acknowledged.
   *
   * With no confirmation handler registered, every check is acknowledged
   * automatically. Otherwise the handler is asked, and its `acknowledged`
   * flag determines the outcome.
   *
   * @param pendingSafetyChecks - Checks attached to the computer call
   * @param logger - Sink for log lines
   * @returns The checks to acknowledge, or `undefined` if the handler declined
   */
  private async handleSafetyConfirmation(
    pendingSafetyChecks: SafetyCheck[],
    logger: (message: LogLine) => void,
  ): Promise<SafetyCheck[] | undefined> {
    if (!this.safetyConfirmationHandler) {
      logger({
        category: "agent",
        message: `Auto-acknowledging ${pendingSafetyChecks.length} safety check(s)`,
        level: 2,
      });
      return pendingSafetyChecks;
    }

    logger({
      category: "agent",
      message: `Requesting safety confirmation for ${pendingSafetyChecks.length} check(s): ${pendingSafetyChecks.map((c) => c.code).join(", ")}`,
      level: 1,
    });

    const response = await this.safetyConfirmationHandler(pendingSafetyChecks);
    const accepted = Boolean(response.acknowledged);

    logger({
      category: "agent",
      message: accepted
        ? `Safety checks acknowledged by user`
        : `Safety checks rejected by user`,
      level: 1,
    });

    return accepted ? pendingSafetyChecks : undefined;
  }

  /**
   * Type guard for function_call items: the item must carry `call_id`,
   * `name` and `arguments`.
   */
  private isFunctionCallItem(item: ResponseItem): item is FunctionCallItem {
    if (item.type !== "function_call") {
      return false;
    }
    const requiredKeys = ["call_id", "name", "arguments"];
    return requiredKeys.every((key) => key in item);
  }

  /**
   * Builds the input for the first request: the system instructions (when
   * provided) followed by the user's instruction.
   *
   * `userProvidedInstructions` is optional on the constructor, so the system
   * item is only emitted when there is content for it; otherwise the request
   * would carry a system message without any content.
   *
   * @param instruction - The task the user wants performed
   */
  private createInitialInputItems(instruction: string): ResponseInputItem[] {
    const items: ResponseInputItem[] = [];

    if (this.userProvidedInstructions) {
      items.push({
        role: "system",
        content: this.userProvidedInstructions,
      });
    }

    items.push({
      role: "user",
      content: instruction,
    });

    return items;
  }

  /**
   * Sends one request to the OpenAI Responses API and returns the model's
   * output items.
   *
   * The request always includes the computer-use tool sized to the current
   * viewport, plus any custom tools and, while active, the captcha-proceed
   * tool. The request and response are also reported to FlowLogger.
   *
   * @param inputItems - Items to send as the request input
   * @param previousResponseId - When given, sent as `previous_response_id`
   * @returns The output items, the response id, and usage figures
   *   (`input_tokens`, `output_tokens`, `inference_time_ms`). Token counts are
   *   0 when the response carries no usage block.
   * @throws Re-throws any error from the API call after printing it
   */
  async getAction(
    inputItems: ResponseInputItem[],
    previousResponseId?: string,
  ): Promise<{
    output: ResponseItem[];
    responseId: string;
    usage: Record<string, number>;
  }> {
    try {
      // Create the request parameters
      const requestParams: Record<string, unknown> = {
        model: this.modelName,
        tools: [
          {
            type: "computer_use_preview",
            display_width: this.currentViewport.width,
            display_height: this.currentViewport.height,
            environment: this.environment,
          },
        ],
        input: inputItems,
        truncation: "auto",
      };

      // Add custom tools if available
      if (this.tools && Object.keys(this.tools).length > 0) {
        const customTools = Object.entries(this.tools).map(([name, tool]) => ({
          type: "function" as const,
          name,
          function: {
            name,
            description: tool.description,
            parameters: tool.inputSchema,
          },
        }));

        requestParams.tools = [
          ...(requestParams.tools as Record<string, unknown>[]),
          ...customTools,
        ];
      }

      // When a captcha was just solved, expose a tool the model can call
      // to confirm it should proceed.  This avoids fragile English-phrase
      // parsing and works regardless of the model's output language.
      if (this.captchaSolvedToolActive) {
        requestParams.tools = [
          ...(requestParams.tools as Record<string, unknown>[]),
          {
            type: "function" as const,
            name: CAPTCHA_PROCEED_TOOL,
            function: {
              name: CAPTCHA_PROCEED_TOOL,
              description:
                "The captcha on this page was solved automatically. " +
                "Call this tool to confirm and continue with your task " +
                "instead of asking the user for permission.",
              parameters: { type: "object", properties: {}, required: [] },
            },
          },
        ];
      }

      // Add previous_response_id if available
      if (previousResponseId) {
        requestParams.previous_response_id = previousResponseId;
      }

      // Log LLM request
      const llmRequestId = uuidv7();
      FlowLogger.logLlmRequest({
        requestId: llmRequestId,
        model: this.modelName,
        prompt: extractLlmCuaPromptSummary(inputItems),
      });

      const startTime = Date.now();
      // Create the response using the OpenAI Responses API
      // @ts-expect-error - Force type to match what the OpenAI SDK expects
      const response = await this.client.responses.create(requestParams);
      const endTime = Date.now();
      const elapsedMs = endTime - startTime;

      // Extract only the input_tokens and output_tokens. `usage` is optional
      // on the response object, so fall back to 0 instead of throwing away an
      // otherwise valid response.
      const usage = {
        input_tokens: response.usage?.input_tokens ?? 0,
        output_tokens: response.usage?.output_tokens ?? 0,
        inference_time_ms: elapsedMs,
      };

      // Log LLM response
      FlowLogger.logLlmResponse({
        requestId: llmRequestId,
        model: this.modelName,
        output: extractLlmCuaResponseSummary(response.output),
        inputTokens: usage.input_tokens,
        outputTokens: usage.output_tokens,
      });

      // Store the response ID for future use
      this.lastResponseId = response.id;

      // Return the output and response ID
      return {
        output: response.output as unknown as ResponseItem[],
        responseId: response.id,
        usage,
      };
    } catch (error) {
      console.error("Error getting action from OpenAI:", error);
      throw error;
    }
  }

  /**
   * Carries out every computer_call and function_call in the model output and
   * builds the matching `*_call_output` items for the next request.
   *
   * - computer_call: the action handler is invoked, then a screenshot is
   *   captured and returned as the call output (with `current_url` and any
   *   acknowledged safety checks attached). If that fails, the error is
   *   reported back to the model, with a fresh screenshot when possible.
   * - function_call: the captcha-proceed tool is answered directly; any other
   *   call is forwarded to the action handler and, when a matching custom
   *   tool exists, executed with the parsed arguments.
   *
   * Items of any other type are ignored.
   *
   * @param output - Output items returned by the model
   * @param logger - Sink for log lines
   * @returns One output item per handled call, in the order encountered
   * @throws StagehandClosedError is always re-thrown; other errors are
   *   converted into error outputs for the model
   */
  async takeAction(
    output: ResponseItem[],
    logger: (message: LogLine) => void,
  ): Promise<ResponseInputItem[]> {
    const nextInputItems: ResponseInputItem[] = [];

    // Process each output item
    for (const item of output) {
      if (item.type === "computer_call" && this.isComputerCallItem(item)) {
        // Handle computer calls
        try {
          const action = this.convertComputerCallToAction(item);

          if (action && this.actionHandler) {
            logger({
              category: "agent",
              message: `Executing computer action: ${action.type}`,
              level: 1,
            });
            await this.actionHandler(action);
          }

          // Capture a screenshot
          const screenshot = await this.captureScreenshot();

          // Create a computer_call_output for the next request
          const outputItem = {
            type: "computer_call_output" as const,
            call_id: item.call_id,
            output: {
              type: "input_image" as const,
              image_url: screenshot,
            },
          } as ResponseInputItem;

          logger({
            category: "agent",
            message: `Added computer_call_output for call_id: ${item.call_id}`,
            level: 2,
          });

          // Add current URL if available
          if (this.currentUrl) {
            const computerCallOutput = outputItem as {
              type: "computer_call_output";
              call_id: string;
              output: {
                type: "input_image";
                image_url: string;
                current_url?: string;
              };
              acknowledged_safety_checks?: SafetyCheck[];
            };
            computerCallOutput.output.current_url = this.currentUrl;
          }

          // NOTE: confirmation is requested after the action has already been
          // executed above; a rejection only leaves the acknowledgement off
          // the output item.
          if (
            item.pending_safety_checks &&
            item.pending_safety_checks.length > 0
          ) {
            const acknowledgedChecks = await this.handleSafetyConfirmation(
              item.pending_safety_checks,
              logger,
            );

            if (acknowledgedChecks) {
              const computerCallOutput = outputItem as {
                type: "computer_call_output";
                call_id: string;
                output: {
                  type: "input_image";
                  image_url: string;
                };
                acknowledged_safety_checks?: SafetyCheck[];
              };
              computerCallOutput.acknowledged_safety_checks =
                acknowledgedChecks;
            }
          }

          nextInputItems.push(outputItem);
        } catch (error) {
          // A closed session cannot be recovered from; let it propagate.
          if (error instanceof StagehandClosedError) {
            throw error;
          }
          const errorMessage =
            error instanceof Error ? error.message : String(error);

          logger({
            category: "agent",
            message: `Error executing computer call: ${errorMessage}`,
            level: 0,
          });

          try {
            // Capture a screenshot even on error
            const screenshot = await this.captureScreenshot();

            const errorOutputItem = {
              type: "computer_call_output" as const,
              call_id: item.call_id,
              output: {
                type: "input_image" as const,
                image_url: screenshot,
                error: errorMessage,
              },
            } as ResponseInputItem;

            // Add current URL if available
            if (this.currentUrl) {
              const computerCallOutput = errorOutputItem as {
                type: "computer_call_output";
                call_id: string;
                output: {
                  type: "input_image";
                  image_url: string;
                  current_url?: string;
                };
                acknowledged_safety_checks?: SafetyCheck[];
              };
              computerCallOutput.output.current_url = this.currentUrl;
            }

            if (
              item.pending_safety_checks &&
              item.pending_safety_checks.length > 0
            ) {
              const acknowledgedChecks = await this.handleSafetyConfirmation(
                item.pending_safety_checks,
                logger,
              );

              if (acknowledgedChecks) {
                const computerCallOutput = errorOutputItem as {
                  type: "computer_call_output";
                  call_id: string;
                  output: {
                    type: "input_image";
                    image_url: string;
                  };
                  acknowledged_safety_checks?: SafetyCheck[];
                };
                computerCallOutput.acknowledged_safety_checks =
                  acknowledgedChecks;
              }
            }

            nextInputItems.push(errorOutputItem);
          } catch (screenshotError) {
            if (screenshotError instanceof StagehandClosedError) {
              throw screenshotError;
            }
            // If we can't capture a screenshot, just send the error
            logger({
              category: "agent",
              message: `Error capturing screenshot: ${String(screenshotError)}`,
              level: 0,
            });

            // For error cases without a screenshot, we need to use a string output
            nextInputItems.push({
              type: "computer_call_output",
              call_id: item.call_id,
              output: `Error: ${errorMessage}`,
            } as ResponseInputItem);
          }
        }
      } else if (
        item.type === "function_call" &&
        this.isFunctionCallItem(item)
      ) {
        // Handle the captcha-proceed tool — just return a confirmation and
        // deactivate the tool so it doesn't appear on subsequent steps.
        if (item.name === CAPTCHA_PROCEED_TOOL) {
          this.captchaSolvedToolActive = false;
          nextInputItems.push({
            type: "function_call_output",
            call_id: item.call_id,
            output:
              "Confirmed. The captcha is solved. Continue completing the original task autonomously without asking for further confirmation.",
          } as ResponseInputItem);
          continue;
        }

        // Handle function calls (tool calls)
        try {
          const action = this.convertFunctionCallToAction(item);

          if (action && this.actionHandler) {
            await this.actionHandler(action);
          }

          // Execute the tool if available
          let toolResult = "Tool executed successfully";
          if (this.tools && item.name in this.tools) {
            try {
              const tool = this.tools[item.name];
              const args = JSON.parse(item.arguments);

              logger({
                category: "agent",
                message: `Executing tool call: ${item.name} with args: ${item.arguments}`,
                level: 1,
              });

              const result = await tool.execute(args, {
                toolCallId: item.call_id,
                messages: [],
              });
              // JSON.stringify yields undefined for results such as
              // `undefined` (a tool that returns nothing). Keep the default
              // success text in that case so the output sent back to the
              // model is always a string.
              toolResult = JSON.stringify(result) ?? toolResult;

              logger({
                category: "agent",
                message: `Tool ${item.name} completed successfully. Result: ${toolResult}`,
                level: 1,
              });
            } catch (toolError) {
              const errorMessage =
                toolError instanceof Error
                  ? toolError.message
                  : String(toolError);
              toolResult = `Error executing tool: ${errorMessage}`;

              logger({
                category: "agent",
                message: `Error executing tool ${item.name}: ${errorMessage}`,
                level: 0,
              });
            }
          }

          // Create a function_call_output for the next request
          const outputItem: ResponseInputItem = {
            type: "function_call_output",
            call_id: item.call_id,
            output: toolResult,
          };

          nextInputItems.push(outputItem);
        } catch (error) {
          if (error instanceof StagehandClosedError) {
            throw error;
          }
          const errorMessage =
            error instanceof Error ? error.message : String(error);

          logger({
            category: "agent",
            message: `Error executing function call: ${errorMessage}`,
            level: 0,
          });

          // Send error result back
          const errorOutputItem: ResponseInputItem = {
            type: "function_call_output",
            call_id: item.call_id,
            output: `Error: ${errorMessage}`,
          };

          nextInputItems.push(errorOutputItem);
        }
      }
    }

    return nextInputItems;
  }

  /**
   * Flattens a computer_call into an AgentAction.
   *
   * The action's own fields (x, y, button, ...) are copied onto the result
   * directly rather than nested under a params object, so consumers can read
   * them straight off the AgentAction.
   */
  private convertComputerCallToAction(
    call: ComputerCallItem,
  ): AgentAction | null {
    const computerAction = call.action;

    return {
      type: computerAction.type as string,
      ...computerAction,
    };
  }

  /**
   * Removes and returns all queued context notes, leaving the queue empty.
   * Returns an empty array when nothing is queued.
   */
  private drainContextNotes(): string[] {
    // splice() empties the queue in place and hands back the removed notes
    // as a new array.
    return this.pendingContextNotes.splice(0, this.pendingContextNotes.length);
  }

  /**
   * Turns a function_call into an AgentAction whose `params` are the parsed
   * JSON arguments.
   *
   * @returns The action, or `null` when the arguments are not valid JSON
   *   (the parse error is printed to the console)
   */
  private convertFunctionCallToAction(
    call: FunctionCallItem,
  ): AgentAction | null {
    let parsedArgs: ReturnType<typeof JSON.parse>;

    try {
      parsedArgs = JSON.parse(call.arguments);
    } catch (error) {
      console.error("Error parsing function call arguments:", error);
      return null;
    }

    return { type: call.name, params: parsedArgs };
  }

  /**
   * Produces a PNG data URL for the current screen.
   *
   * A caller-supplied `options.base64Image` takes precedence; otherwise the
   * registered screenshot provider is asked for one.
   *
   * @param options - Optional pre-captured image (`currentUrl` is accepted
   *   but not read by this method)
   * @returns A `data:image/png;base64,...` URL
   * @throws AgentScreenshotProviderError when no image was supplied and no
   *   provider is registered; provider errors are printed and re-thrown
   */
  async captureScreenshot(options?: {
    base64Image?: string;
    currentUrl?: string;
  }): Promise<string> {
    const toDataUrl = (encoded: string): string =>
      `data:image/png;base64,${encoded}`;

    if (options?.base64Image) {
      return toDataUrl(options.base64Image);
    }

    if (!this.screenshotProvider) {
      throw new AgentScreenshotProviderError(
        "`screenshotProvider` has not been set. " +
          "Please call `setScreenshotProvider()` with a valid function that returns a base64-encoded image",
      );
    }

    try {
      return toDataUrl(await this.screenshotProvider());
    } catch (error) {
      console.error("Error capturing screenshot:", error);
      throw error;
    }
  }
}


================================================
FILE: packages/core/lib/v3/agent/prompts/agentSystemPrompt.ts
================================================
import type { AgentToolMode, Variables } from "../../types/public/agent.js";
import { CAPTCHA_SYSTEM_PROMPT_NOTE } from "../utils/captchaSolver.js";

/** Options accepted by `buildAgentSystemPrompt`. */
export interface AgentSystemPromptOptions {
  /** NOTE(review): presumably the URL of the page the agent is operating on — confirm against the caller. */
  url: string;
  /** NOTE(review): presumably the task the agent is asked to carry out — confirm against the caller. */
  executionInstruction: string;
  /** Tool mode; `"hybrid"` selects the hybrid tool list and strategy, any other value the DOM-based ones. */
  mode: AgentToolMode;
  /** NOTE(review): presumably extra user-supplied system instructions — confirm against the caller. */
  systemInstructions?: string;
  /** Whether captchas are automatically solved by the browser environment */
  captchasAutoSolve?: boolean;
  /** Tools to exclude from the system prompt */
  excludeTools?: string[];
  /** Variables available to the agent for use in act/type tools */
  variables?: Variables;
  /** Whether the search tool is enabled for this execution */
  useSearch?: boolean;
}

/** A tool as advertised in the system prompt: its name and a one-line summary. */
interface ToolDefinition {
  name: string;
  description: string;
}

/**
 * Renders the `<tools>` block of the system prompt.
 *
 * @param isHybridMode - Advertise the hybrid (coordinate-capable) tool list
 *   rather than the DOM-based one
 * @param hasSearch - Append the `search` tool to the list
 * @param excludeTools - Names of tools to leave out of the output
 * @returns The `<tools>` element with one `<tool>` line per remaining tool
 */
function buildToolsSection(
  isHybridMode: boolean,
  hasSearch: boolean,
  excludeTools?: string[],
): string {
  const define = (name: string, description: string): ToolDefinition => ({
    name,
    description,
  });

  // Page-inspection tools open the list in both modes.
  const inspectionTools = [
    define(
      "screenshot",
      "Take a compressed JPEG screenshot for quick visual context",
    ),
    define(
      "ariaTree",
      "Get an accessibility (ARIA) hybrid tree for full page context",
    ),
  ];

  // Interaction tools are the only part that depends on the mode.
  const interactionTools = isHybridMode
    ? [
        define(
          "click",
          "Click on an element (PREFERRED - more reliable when element is visible in viewport)",
        ),
        define(
          "type",
          "Type text into an element (PREFERRED - more reliable when element is visible in viewport)",
        ),
        define(
          "act",
          "Perform a specific atomic action (click, type, etc.) - ONLY use when element is in ariaTree but NOT visible in screenshot. Less reliable but can interact with out-of-viewport elements.",
        ),
        define("dragAndDrop", "Drag and drop an element"),
        define("clickAndHold", "Click and hold on an element"),
        define("keys", "Press a keyboard key"),
        define("fillFormVision", "Fill out a form using coordinates"),
      ]
    : [
        define("act", "Perform a specific atomic action (click, type)"),
        define("keys", "Press a keyboard key"),
        define("fillForm", "Fill out a form"),
      ];

  // General-purpose tools close the list in both modes.
  const generalTools = [
    define("think", "Think about the task"),
    define("extract", "Extract structured data"),
    define("goto", "Navigate to a URL"),
    define("wait", "Wait for a specified time"),
    define("navback", "Navigate back in browser history"),
    define("scroll", "Scroll the page x pixels up or down"),
  ];

  const searchTools = hasSearch
    ? [
        define(
          "search",
          "Perform a web search and return results. Prefer this over navigating to Google and searching within the page for reliability and efficiency.",
        ),
      ]
    : [];

  const excluded = new Set(excludeTools ?? []);
  const renderedLines: string[] = [];
  for (const { name, description } of [
    ...inspectionTools,
    ...interactionTools,
    ...generalTools,
    ...searchTools,
  ]) {
    if (excluded.has(name)) {
      continue;
    }
    renderedLines.push(`    <tool name="${name}">${description}</tool>`);
  }

  return `<tools>\n${renderedLines.join("\n")}\n  </tools>`;
}

/**
 * Builds the system prompt for the agent based on the tool mode.
 *
 * @param options - The prompt configuration options
 * @returns The formatted system prompt string
 */

/**
 * Assembles the XML-style system prompt handed to the agent model.
 *
 * The prompt is a single `<system>` document made of fixed sections (identity,
 * task, page, mindset, guidelines, navigation, completion) plus sections that
 * depend on the options:
 * - `mode === "hybrid"` switches the tool list, the strategy items, the
 *   primary/secondary order of screenshot vs. ariaTree in the page
 *   understanding protocol, and the variable usage note.
 * - `systemInstructions` adds a `<customInstructions>` block (CDATA-wrapped).
 * - `captchasAutoSolve` adds a `<roadblocks>` block.
 * - a non-empty `variables` map adds a `<variables>` block.
 * - `useSearch` (or a set `BRAVE_API_KEY` environment variable) adds the
 *   search tool and the matching navigation rule.
 *
 * @param options - Prompt inputs: starting `url`, `executionInstruction`
 *   (the goal), `mode`, optional `systemInstructions`, `captchasAutoSolve`
 *   (defaults to `false`), `excludeTools`, `variables`, and `useSearch`
 *   (defaults to `false`).
 * @returns The complete system prompt as one string.
 */
export function buildAgentSystemPrompt(
  options: AgentSystemPromptOptions,
): string {
  const {
    url,
    executionInstruction,
    mode,
    systemInstructions,
    captchasAutoSolve = false,
    excludeTools,
    variables,
    useSearch = false,
  } = options;
  // Two separate Date instances: one rendered in the host locale for display,
  // one as an ISO-8601 timestamp for the `iso` attribute.
  const localeDate = new Date().toLocaleDateString();
  const isoDate = new Date().toISOString();
  // Wraps free-form text in a CDATA section.
  // NOTE(review): the text is inserted verbatim, so an embedded "]]>" would
  // close the section early - confirm callers never pass such text.
  const cdata = (text: string) => `<![CDATA[${text}]]>`;

  const isHybridMode = mode === "hybrid";
  // Search is advertised when requested explicitly or whenever BRAVE_API_KEY
  // is present in the environment.
  const hasSearch = useSearch || Boolean(process.env.BRAVE_API_KEY);

  // Tools section differs based on mode and excluded tools
  const toolsSection = buildToolsSection(isHybridMode, hasSearch, excludeTools);

  // Strategy differs based on mode
  const strategyItems = isHybridMode
    ? [
        `<item>Tool selection priority: Use specific tools (click, type) when elements are visible in viewport for maximum reliability.</item>`,
        `<item>Always use screenshot to get proper grounding of the coordinates you want to type/click into.</item>`,
        `<item>When interacting with an input, always use the type tool to type into the input, over clicking and then typing into it.</item>`,
        `<item>Use ariaTree as a secondary tool when elements aren't visible in screenshot or to get full page context.</item>`,
        `<item>Only use act when element is in ariaTree but NOT visible in screenshot.</item>`,
      ]
    : [
        `<item>Tool selection priority: Use act tool for all clicking and typing on a page.</item>`,
        `<item>Always check ariaTree first to understand full page content without scrolling - it shows all elements including those below the fold.</item>`,
        `<item>When interacting with an input, always use the act tool to type into the input, over clicking and then typing.</item>`,
        `<item>If an element is present in the ariaTree, use act to interact with it directly - this eliminates the need to scroll.</item>`,
        `<item>Use screenshot for visual confirmation when needed, but rely primarily on ariaTree for element detection.</item>`,
      ];

  const strategySection = strategyItems.join("\n    ");

  // Strategy items shared by both modes; only the suggested page-reading
  // tools in the first item depend on the mode.
  const commonStrategyItems = `
    <item>CRITICAL: Use extract ONLY when the task explicitly requires structured data output (e.g., "get job listings", "extract product details"). For reading page content or understanding elements, always use ${isHybridMode ? "screenshot or ariaTree" : "ariaTree"} instead - it's faster and more reliable.</item>
    <item>Keep actions atomic and verify outcomes before proceeding.</item>
    <item>For each action, provide clear reasoning about why you're taking that step.</item>
    <item>When you need to input text that could be entered character-by-character or through multiple separate inputs, prefer using the keys tool to type the entire sequence at once. This is more efficient for scenarios like verification codes split across multiple fields, or when virtual keyboards are present but direct typing would be faster.</item>
    `;

  // Page understanding protocol differs based on mode
  const pageUnderstandingProtocol = isHybridMode
    ? `<page_understanding_protocol>
    <step_1>
      <title>UNDERSTAND THE PAGE</title>
      <primary_tool>
        <name>screenshot</name>
        <usage>Visual confirmation when needed. Ideally after navigating to a new page.</usage>
        </primary_tool>
      <secondary_tool>
        <name>ariaTree</name>
        <usage>Get complete page context before taking actions</usage>
        <benefit>Eliminates the need to scroll and provides full accessible content</benefit>
      </secondary_tool>
    </step_1>
  </page_understanding_protocol>`
    : `<page_understanding_protocol>
    <step_1>
      <title>UNDERSTAND THE PAGE</title>
      <primary_tool>
        <name>ariaTree</name>
        <usage>Get complete page context before taking actions</usage>
        <benefit>Eliminates the need to scroll and provides full accessible content</benefit>
        </primary_tool>
      <secondary_tool>
        <name>screenshot</name>
        <usage>Visual confirmation when needed. Ideally after navigating to a new page.</usage>
      </secondary_tool>
    </step_1>
  </page_understanding_protocol>`;

  // Roadblocks section only shown when captchas are auto-solved
  const roadblocksSection = captchasAutoSolve
    ? `<roadblocks>
    <note>${CAPTCHA_SYSTEM_PROMPT_NOTE}</note>
  </roadblocks>`
    : "";

  // Build customInstructions block only if provided
  const customInstructionsBlock = systemInstructions
    ? `<customInstructions>${cdata(systemInstructions)}</customInstructions>\n  `
    : "";

  // Build variables section only if variables are provided.
  // Only each variable's name and optional description are emitted; the
  // variable values themselves are never written into the prompt.
  const hasVariables = variables && Object.keys(variables).length > 0;
  const variableToolsNote = isHybridMode
    ? "Use %variableName% syntax in the type, fillFormVision, or act tool's value/text/action fields."
    : "Use %variableName% syntax in the act or fillForm tool's action fields.";
  const variablesSection = hasVariables
    ? `<variables>
    <note>You have access to the following variables. Use %variableName% syntax to substitute variable values. This is especially important for sensitive data like passwords.</note>
    <usage>${variableToolsNote}</usage>
    <example>To type a password, use: type %password% into the password field</example>
    ${Object.entries(variables)
      .map(([name, v]) => {
        const description =
          typeof v === "object" && v !== null && "value" in v
            ? v.description
            : undefined;
        return description
          ? `<variable name="${name}">${description}</variable>`
          : `<variable name="${name}" />`;
      })
      .join("\n    ")}
  </variables>`
    : "";

  // Final assembly. Optional sections that are disabled contribute an empty
  // string, so their line in the template is left blank.
  return `<system>
  <identity>You are a web automation assistant using browser automation tools to accomplish the user's goal.</identity>
  ${customInstructionsBlock}<task>
    <goal>${cdata(executionInstruction)}</goal>
    <date display="local" iso="${isoDate}">${localeDate}</date>
    <note>You may think the date is different due to knowledge cutoff, but this is the actual date.</note>
  </task>
  <page>
    <startingUrl>you are starting your task on this url: ${url}</startingUrl>
  </page>
  <mindset>
    <note>Be very intentional about your action. The initial instruction is very important, and slight variations of the actual goal can lead to failures.</note>
    <importantNote>If something fails to meet a single condition of the task, move on from it rather than seeing if it meets other criteria. We only care that it meets all of it</importantNote>
    <note>When the task is complete, do not seek more information; you have completed the task.</note>
  </mindset>
  <guidelines>
    <item>Always start by understanding the current page state</item>
    <item>Use the screenshot tool to verify page state when needed</item>
    <item>Use appropriate tools for each action</item>
  </guidelines>
  ${pageUnderstandingProtocol}
  <navigation>
    <rule>If you are confident in the URL, navigate directly to it.</rule>
    ${hasSearch ? `<rule>If you are not confident in the URL, use the search tool to find it.</rule>` : ``}
  </navigation>
  ${toolsSection}
  <strategy>
    ${strategySection}
    ${commonStrategyItems}
  </strategy>
  ${roadblocksSection}
  ${variablesSection}
  <completion>
    <note>When you complete the task, explain any information that was found that was relevant to the original task.</note>
    <examples>
      <example>If you were asked for specific flights, list the flights you found.</example>
      <example>If you were asked for information about a product, list the product information you were asked for.</example>
    </examples>
  </completion>
</system>`;
}


================================================
FILE: packages/core/lib/v3/agent/tools/README.md
================================================
This folder provides v3-native agent tools for the AISDK-based agent flow.
They mirror the v2 tools but operate on the V3 CDP-native APIs.

Files are placed under lib/v3/agent/tools and consumed by V3AgentHandler.


================================================
FILE: packages/core/lib/v3/agent/tools/act.ts
================================================
import { tool } from "ai";
import { z } from "zod";
import type { V3 } from "../../v3.js";
import type { Action } from "../../types/public/methods.js";
import type { AgentModelConfig, Variables } from "../../types/public/agent.js";
import { TimeoutError } from "../../types/public/sdkErrors.js";

/**
 * Creates the agent-facing `act` tool.
 *
 * The tool forwards a natural-language action to `v3.act`, records the outcome
 * as an "act" replay step, and reports a compact result to the model.
 *
 * @param v3 - Instance used for logging, executing the action and recording
 *   the replay step.
 * @param executionModel - Optional model override; when set it is passed to
 *   `v3.act` as `model`.
 * @param variables - Optional variables. Their names are listed in the
 *   `action` parameter description and the map is forwarded to `v3.act`.
 * @param toolTimeout - Optional timeout forwarded to `v3.act`.
 * @returns The configured tool. `TimeoutError`s propagate to the caller; every
 *   other failure is reported as `{ success: false, error }`.
 */
export const actTool = (
  v3: V3,
  executionModel?: string | AgentModelConfig,
  variables?: Variables,
  toolTimeout?: number,
) => {
  const variableNames = variables ? Object.keys(variables) : [];
  const actionDescription =
    variableNames.length > 0
      ? `Describe what to click or type, e.g. "click the Login button" or "type %variableName% into the input". Available variables: ${variableNames.join(", ")}`
      : 'Describe what to click or type, e.g. "click the Login button" or "type "John" into the first name input"';

  const inputSchema = z.object({
    action: z.string().describe(actionDescription),
  });

  return tool({
    description:
      "Perform an action on the page (click, type). Provide a short, specific phrase that mentions the element type.",
    inputSchema,
    execute: async ({ action }) => {
      try {
        v3.logger({
          category: "agent",
          message: `Agent calling tool: act`,
          level: 1,
          auxiliary: {
            arguments: { value: action, type: "string" },
          },
        });

        // The model override is only included when one was configured.
        const sharedOptions = { variables, timeout: toolTimeout };
        const actOptions = executionModel
          ? { model: executionModel, ...sharedOptions }
          : sharedOptions;

        const outcome = await v3.act(action, actOptions);
        const performed = (outcome.actions as Action[] | undefined) ?? [];

        v3.recordAgentReplayStep({
          type: "act",
          instruction: action,
          actions: performed,
          actionDescription: outcome.actionDescription,
          message: outcome.message,
        });

        // playwrightArguments is attached only when at least one action was
        // produced: an explicit `undefined` is not valid JSON and breaks
        // AI SDK validation.
        const response: {
          success: boolean;
          action: string;
          playwrightArguments?: Action;
        } = {
          success: outcome.success ?? true,
          action: outcome?.actionDescription ?? action,
        };
        if (performed.length > 0) {
          response.playwrightArguments = performed[0];
        }
        return response;
      } catch (error) {
        // Timeouts are surfaced to the caller instead of being reported
        // to the model as an ordinary tool failure.
        if (error instanceof TimeoutError) throw error;

        return {
          success: false,
          error: error?.message ?? String(error),
        };
      }
    },
  });
};


================================================
FILE: packages/core/lib/v3/agent/tools/ariaTree.ts
================================================
import { tool } from "ai";
import { z } from "zod";
import type { V3 } from "../../v3.js";
import { TimeoutError } from "../../types/public/sdkErrors.js";

/**
 * Creates the agent-facing `ariaTree` tool.
 *
 * The tool calls `v3.extract` without an instruction and returns its
 * `pageText` together with the active page's URL. Output longer than the
 * rough 70,000-token budget (estimated at 4 characters per token) is cut and
 * marked as truncated.
 *
 * @param v3 - Instance used for logging, page lookup and extraction.
 * @param toolTimeout - Optional timeout; when truthy it is passed to
 *   `v3.extract` as `{ timeout }`.
 * @returns The configured tool. `TimeoutError`s propagate; other failures are
 *   reported as an unsuccessful result with empty content.
 */
export const ariaTreeTool = (v3: V3, toolTimeout?: number) => {
  const MAX_TOKENS = 70000; // rough cap, assume ~4 chars per token for conservative truncation
  const CHARS_PER_TOKEN = 4;
  const maxChars = MAX_TOKENS * CHARS_PER_TOKEN;

  return tool({
    description:
      "gets the accessibility (ARIA) hybrid tree text for the current page. use this to understand structure and content.",
    inputSchema: z.object({}),
    execute: async () => {
      try {
        v3.logger({
          category: "agent",
          message: `Agent calling tool: ariaTree`,
          level: 1,
        });

        const activePage = await v3.context.awaitActivePage();
        const extracted = (await v3.extract(
          toolTimeout ? { timeout: toolTimeout } : undefined,
        )) as { pageText: string };
        const pageUrl = activePage.url();

        // ceil(length / 4) > MAX_TOKENS holds exactly when length > maxChars.
        const overBudget = extracted.pageText.length > maxChars;
        const content = overBudget
          ? extracted.pageText.substring(0, maxChars) +
            "\n\n[CONTENT TRUNCATED: Exceeded 70,000 token limit]"
          : extracted.pageText;

        return { success: true, content, pageUrl };
      } catch (error) {
        // Timeouts are surfaced to the caller rather than reported to the model.
        if (error instanceof TimeoutError) throw error;

        return {
          content: "",
          error: error?.message ?? String(error),
          success: false,
          pageUrl: "",
        };
      }
    },
    toModelOutput: (result) => {
      const failed = result.success === false || result.error !== undefined;
      // Failures are passed to the model as the raw JSON result; successes as
      // the tree text under a short heading.
      const text = failed
        ? JSON.stringify(result)
        : `Accessibility Tree:\n${result.content}`;

      return {
        type: "content",
        value: [{ type: "text", text }],
      };
    },
  });
};


================================================
FILE: packages/core/lib/v3/agent/tools/braveSearch.ts
================================================
import { tool } from "ai";
import { z } from "zod";
import type { V3 } from "../../v3.js";

/** A single normalized search hit returned to the agent by the Brave search tool. */
export interface BraveSearchResult {
  title: string;
  url: string;
  description?: string;
}

/**
 * Result envelope produced by `performBraveSearch`.
 * On failure `error` is set and `data.results` is an empty array.
 */
interface SearchResponse {
  data?: {
    results: BraveSearchResult[];
  };
  error?: string;
}

/**
 * Shape assumed for one entry of the Brave API `web.results` array.
 * Every field is optional because the response is not validated at runtime.
 */
interface BraveWebResult {
  title?: string;
  url?: string;
  description?: string;
  age?: string;
  meta_url?: {
    favicon?: string;
  };
}

/** Subset of the Brave web-search response body that this module reads. */
interface BraveApiResponse {
  web?: {
    results?: BraveWebResult[];
  };
}

/**
 * Runs a web search against the Brave Search API and normalizes the response.
 *
 * The API key is read from the `BRAVE_API_KEY` environment variable. At most
 * the first five web results are considered, and entries without a title or
 * URL are dropped.
 *
 * This function never throws: every failure (missing key, non-2xx response,
 * network or parsing error) is reported through the `error` field together
 * with an empty result list.
 *
 * @param query - Free-text search query; it is URL-encoded before sending.
 * @returns The normalized results, or an `error` message with no results.
 */
async function performBraveSearch(query: string): Promise<SearchResponse> {
  const apiKey = process.env.BRAVE_API_KEY;
  if (!apiKey) {
    // Without this guard the header value would be the literal string
    // "undefined", producing a confusing authentication failure upstream.
    return {
      error: "Error performing search: BRAVE_API_KEY is not set",
      data: { results: [] },
    };
  }

  try {
    const encodedQuery = encodeURIComponent(query);
    const response = await fetch(
      `https://api.search.brave.com/res/v1/web/search?q=${encodedQuery}`,
      {
        method: "GET",
        headers: {
          Accept: "application/json",
          "Accept-Encoding": "gzip",
          "X-Subscription-Token": apiKey,
        },
      },
    );

    if (!response.ok) {
      return {
        error: `Brave API error: ${response.status} ${response.statusText}`,
        data: { results: [] },
      };
    }

    const data = (await response.json()) as BraveApiResponse;
    const results: BraveSearchResult[] = [];

    const webResults = data?.web?.results;
    if (Array.isArray(webResults)) {
      for (const item of webResults.slice(0, 5)) {
        // Skip entries the agent could not use (no title or no target URL).
        if (item.title && item.url) {
          results.push({
            title: item.title,
            url: item.url,
            description: item.description,
          });
        }
      }
    }

    return { data: { results } };
  } catch (error) {
    console.error("Search error", error);
    // The thrown value is not guaranteed to be an Error instance.
    const reason = error instanceof Error ? error.message : String(error);
    return {
      error: `Error performing search: ${reason}`,
      data: { results: [] },
    };
  }
}

/**
 * Creates the agent-facing `search` tool backed by the Brave Search API.
 *
 * Each call is logged, executed through `performBraveSearch`, and recorded as
 * a "search" replay step whose message is either the error text or the number
 * of results found.
 *
 * @param v3 - Instance used for logging and replay recording.
 * @returns The configured tool; its result is the search response plus a
 *   `timestamp` taken from `Date.now()`.
 */
export const searchTool = (v3: V3) => {
  const inputSchema = z.object({
    query: z.string().describe("The search query to look for on the web"),
  });

  return tool({
    description:
      "Perform a web search and returns results. Use this tool when you need information from the web or when you are unsure of the exact URL you want to navigate to. This can be used to find the ideal entry point, resulting in a task that is easier to complete due to starting further in the process.",
    inputSchema,
    execute: async ({ query }) => {
      v3.logger({
        category: "agent",
        message: `Agent calling tool: search`,
        level: 1,
        auxiliary: {
          arguments: { value: JSON.stringify({ query }), type: "object" },
        },
      });

      const searchResponse = await performBraveSearch(query);

      const resultCount = searchResponse.data?.results.length ?? 0;
      const replayMessage =
        searchResponse.error ?? `Found ${resultCount} results`;
      v3.recordAgentReplayStep({
        type: "search",
        instruction: query,
        playwrightArguments: { query },
        message: replayMessage,
      });

      return {
        ...searchResponse,
        timestamp: Date.now(),
      };
    },
  });
};


================================================
FILE: packages/core/lib/v3/agent/tools/browserbaseSearch.ts
================================================
import { tool } from "ai";
import { z } from "zod";
import type { V3 } from "../../v3.js";

/** A single normalized search hit returned to the agent by the Browserbase search tool. */
export interface SearchResult {
  title: string;
  url: string;
  publishedDate?: string;
}

/**
 * Shape assumed for one entry of the Browserbase search response.
 * Every field is optional because the response is not validated at runtime.
 */
interface BrowserbaseRawResult {
  title?: string;
  url?: string;
  publishedDate?: string;
}

/** Subset of the Browserbase search response body that this module reads. */
interface BrowserbaseApiResponse {
  results?: BrowserbaseRawResult[];
}

/**
 * Runs a web search through the Browserbase search endpoint and normalizes
 * the response.
 *
 * Entries without a title or URL are dropped so that every returned item
 * satisfies `SearchResult`. `publishedDate` is included only when the API
 * supplied a non-empty value.
 *
 * This function never throws: a non-2xx response, network failure or parsing
 * error is reported through the `error` field with an empty result list.
 * Thrown errors are additionally logged through `v3.logger` at level 0.
 *
 * @param v3 - Instance whose `logger` receives the failure log entry.
 * @param query - Free-text search query.
 * @param apiKey - Browserbase API key sent in the `x-bb-api-key` header.
 * @param numResults - Number of results requested from the API (default 5).
 * @returns The normalized results, plus `error` when the search failed.
 */
async function performBrowserbaseSearch(
  v3: V3,
  query: string,
  apiKey: string,
  numResults: number = 5,
): Promise<{ results: SearchResult[]; error?: string }> {
  try {
    const response = await fetch("https://api.browserbase.com/v1/search", {
      method: "POST",
      headers: {
        "Content-Type": "application/json",
        "x-bb-api-key": apiKey,
      },
      body: JSON.stringify({ query, numResults }),
    });

    if (!response.ok) {
      return {
        results: [],
        error: `Browserbase Search API error: ${response.status} ${response.statusText}`,
      };
    }

    const data = (await response.json()) as BrowserbaseApiResponse;
    const rawResults = Array.isArray(data?.results) ? data.results : [];

    const results: SearchResult[] = [];
    for (const { title, url, publishedDate } of rawResults) {
      // The raw fields are optional; an entry without a title or URL cannot
      // be represented as a SearchResult and is of no use to the agent.
      if (!title || !url) continue;
      results.push({
        title,
        url,
        ...(publishedDate ? { publishedDate } : {}),
      });
    }

    return { results };
  } catch (error) {
    // The thrown value is not guaranteed to be an Error instance.
    const reason = error instanceof Error ? error.message : String(error);
    v3.logger({
      category: "agent",
      message: `Search error: ${reason}`,
      level: 0,
    });
    return {
      results: [],
      error: `Error performing search: ${reason}`,
    };
  }
}

/**
 * Creates the agent-facing `search` tool backed by the Browserbase search
 * endpoint.
 *
 * Each call is logged, executed through `performBrowserbaseSearch`, and
 * recorded as a "search" replay step whose message is either the error text
 * or the number of results found.
 *
 * @param v3 - Instance used for logging and replay recording.
 * @param apiKey - Browserbase API key forwarded to the search request.
 * @returns The configured tool; its result is the search outcome plus a
 *   `timestamp` taken from `Date.now()`.
 */
export const searchTool = (v3: V3, apiKey: string) => {
  const inputSchema = z.object({
    query: z.string().describe("The search query to look for on the web"),
  });

  return tool({
    description:
      "Perform a web search and returns results. Use this tool when you need information from the web or when you are unsure of the exact URL you want to navigate to. This can be used to find the ideal entry point, resulting in a task that is easier to complete due to starting further in the process.",
    inputSchema,
    execute: async ({ query }) => {
      v3.logger({
        category: "agent",
        message: `Agent calling tool: search`,
        level: 1,
        auxiliary: {
          arguments: { value: JSON.stringify({ query }), type: "object" },
        },
      });

      const searchOutcome = await performBrowserbaseSearch(v3, query, apiKey);

      const replayMessage =
        searchOutcome.error ?? `Found ${searchOutcome.results.length} results`;
      v3.recordAgentReplayStep({
        type: "search",
        instruction: query,
        playwrightArguments: { query },
        message: replayMessage,
      });

      return { ...searchOutcome, timestamp: Date.now() };
    },
  });
};


================================================
FILE: packages/core/lib/v3/agent/tools/click.ts
================================================
import { tool } from "ai";
import { z } from "zod";
import type { V3 } from "../../v3.js";
import type { Action } from "../../types/public/methods.js";
import type {
  ClickToolResult,
  ModelOutputContentItem,
} from "../../types/public/agent.js";
import { processCoordinates } from "../utils/coordinateNormalization.js";
import { ensureXPath } from "../utils/xpath.js";
import { waitAndCaptureScreenshot } from "../utils/screenshotHandler.js";

/**
 * Creates the agent-facing coordinate-based `click` tool.
 *
 * The tool normalizes the model-supplied coordinates via `processCoordinates`,
 * clicks the active page at that point, captures a follow-up screenshot and,
 * when agent replay is active, records the click as an "act" replay step
 * keyed by the clicked element's XPath.
 *
 * @param v3 - Instance used for page access, logging and replay recording.
 * @param provider - Optional provider name forwarded to `processCoordinates`.
 * @returns The configured tool. Failures are reported as
 *   `{ success: false, error }` rather than thrown.
 */
export const clickTool = (v3: V3, provider?: string) => {
  const inputSchema = z.object({
    describe: z
      .string()
      .describe(
        "Describe the element to click on in a short, specific phrase that mentions the element type and a good visual description",
      ),
    coordinates: z
      .array(z.number())
      .describe("The (x, y) coordinates to click on"),
  });

  return tool({
    description:
      "Click on an element using its coordinates (this is the most reliable way to click on an element, always use this over act, unless the element is not visible in the screenshot, but shown in ariaTree)",
    inputSchema,
    execute: async ({ describe, coordinates }): Promise<ClickToolResult> => {
      try {
        const activePage = await v3.context.awaitActivePage();
        const [rawX, rawY] = coordinates;
        const point = processCoordinates(rawX, rawY, provider, v3);

        v3.logger({
          category: "agent",
          message: `Agent calling tool: click`,
          level: 1,
          auxiliary: {
            arguments: { value: JSON.stringify({ describe }), type: "object" },
          },
        });

        // The XPath is only requested while replay recording is active, to
        // avoid computing it needlessly.
        const recordingReplay = v3.isAgentReplayActive();
        const clickedXpath = await activePage.click(point.x, point.y, {
          returnXpath: recordingReplay,
        });

        const screenshotBase64 = await waitAndCaptureScreenshot(activePage);

        // Stored as an "act" step with a concrete Action so the click can be
        // replayed deterministically.
        const selector = recordingReplay ? ensureXPath(clickedXpath) : null;
        if (recordingReplay && selector) {
          const replayAction: Action = {
            selector,
            description: describe,
            method: "click",
            arguments: [],
          };
          v3.recordAgentReplayStep({
            type: "act",
            instruction: describe,
            actions: [replayAction],
            actionDescription: describe,
          });
        }

        return {
          success: true,
          describe,
          coordinates: [point.x, point.y],
          screenshotBase64,
        };
      } catch (error) {
        return {
          success: false,
          error: `Error clicking: ${error.message}`,
        };
      }
    },
    toModelOutput: (result) => {
      const failed = result.success === false || result.error !== undefined;
      if (failed) {
        return {
          type: "content",
          value: [{ type: "text", text: JSON.stringify(result) }],
        };
      }

      // The screenshot is sent as a separate media item, not inside the JSON.
      const summary = JSON.stringify({
        success: result.success,
        describe: result.describe,
        coordinates: result.coordinates,
      });
      const items: ModelOutputContentItem[] = [{ type: "text", text: summary }];
      if (result.screenshotBase64) {
        items.push({
          type: "media",
          mediaType: "image/png",
          data: result.screenshotBase64,
        });
      }
      return { type: "content", value: items };
    },
  });
};


================================================
FILE: packages/core/lib/v3/agent/tools/clickAndHold.ts
================================================
import { tool } from "ai";
import { z } from "zod";
import type { V3 } from "../../v3.js";
import type { Action } from "../../types/public/methods.js";
import { processCoordinates } from "../utils/coordinateNormalization.js";
import { ensureXPath } from "../utils/xpath.js";

/**
 * Creates the agent-facing `clickAndHold` tool.
 *
 * The hold is simulated with `page.dragAndDrop` from a point to the same
 * point, using the requested duration as the `delay`. When agent replay is
 * active the interaction is recorded as an "act" replay step keyed by the
 * element's XPath.
 *
 * @param v3 - Instance used for page access, logging and replay recording.
 * @param provider - Optional provider name forwarded to `processCoordinates`.
 * @returns The configured tool. Failures are reported as
 *   `{ success: false, error }` rather than thrown.
 */
export const clickAndHoldTool = (v3: V3, provider?: string) => {
  const inputSchema = z.object({
    describe: z
      .string()
      .describe(
        "Describe the element to click on in a short, specific phrase that mentions the element type and a good visual description",
      ),
    duration: z
      .number()
      .describe("The duration to hold the element in milliseconds"),
    coordinates: z
      .array(z.number())
      .describe("The (x, y) coordinates to click on"),
  });

  return tool({
    description: "Click and hold on an element using its coordinates",
    inputSchema,
    execute: async ({ describe, coordinates, duration }) => {
      try {
        const activePage = await v3.context.awaitActivePage();
        const [rawX, rawY] = coordinates;
        const point = processCoordinates(rawX, rawY, provider, v3);

        v3.logger({
          category: "agent",
          message: `Agent calling tool: clickAndHold`,
          level: 1,
          auxiliary: {
            arguments: {
              value: JSON.stringify({ describe, duration }),
              type: "object",
            },
          },
        });

        // The XPath is only requested while replay recording is active, to
        // avoid computing it needlessly.
        const recordingReplay = v3.isAgentReplayActive();

        // Dragging from a point onto itself with a delay acts as press-and-hold.
        const [heldXpath] = await activePage.dragAndDrop(
          point.x,
          point.y,
          point.x,
          point.y,
          { delay: duration, returnXpath: recordingReplay },
        );

        // Stored as an "act" step with a concrete Action so the hold can be
        // replayed deterministically.
        const selector = recordingReplay ? ensureXPath(heldXpath) : null;
        if (recordingReplay && selector) {
          const replayAction: Action = {
            selector,
            description: describe,
            method: "clickAndHold",
            arguments: [String(duration)],
          };
          v3.recordAgentReplayStep({
            type: "act",
            instruction: describe,
            actions: [replayAction],
            actionDescription: describe,
          });
        }

        return { success: true, describe };
      } catch (error) {
        return {
          success: false,
          error: `Error clicking and holding: ${error.message}`,
        };
      }
    },
  });
};


================================================
FILE: packages/core/lib/v3/agent/tools/dragAndDrop.ts
================================================
import { tool } from "ai";
import { z } from "zod";
import type { V3 } from "../../v3.js";
import type { Action } from "../../types/public/methods.js";
import type {
  DragAndDropToolResult,
  ModelOutputContentItem,
} from "../../types/public/agent.js";
import { processCoordinates } from "../utils/coordinateNormalization.js";
import { ensureXPath } from "../utils/xpath.js";
import { waitAndCaptureScreenshot } from "../utils/screenshotHandler.js";

/**
 * Creates the agent-facing coordinate-based `dragAndDrop` tool.
 *
 * Both endpoints are normalized via `processCoordinates`, the drag is
 * performed on the active page, and a follow-up screenshot is captured. When
 * agent replay is active and both endpoints resolve to an XPath, the drag is
 * recorded as an "act" replay step.
 *
 * @param v3 - Instance used for page access, logging and replay recording.
 * @param provider - Optional provider name forwarded to `processCoordinates`.
 * @returns The configured tool. Failures are reported as
 *   `{ success: false, error }` rather than thrown.
 */
export const dragAndDropTool = (v3: V3, provider?: string) => {
  const inputSchema = z.object({
    describe: z.string().describe("Describe the element to drag and drop"),
    startCoordinates: z
      .array(z.number())
      .describe("The (x, y) coordinates to start the drag and drop from"),
    endCoordinates: z
      .array(z.number())
      .describe("The (x, y) coordinates to end the drag and drop at"),
  });

  return tool({
    description:
      "Drag and drop an element using its coordinates (this is the most reliable way to drag and drop an element, always use this over act, unless the element is not visible in the screenshot, but shown in ariaTree)",
    inputSchema,
    execute: async ({
      describe,
      startCoordinates,
      endCoordinates,
    }): Promise<DragAndDropToolResult> => {
      try {
        const activePage = await v3.context.awaitActivePage();
        const [startX, startY] = startCoordinates;
        const from = processCoordinates(startX, startY, provider, v3);
        const [endX, endY] = endCoordinates;
        const to = processCoordinates(endX, endY, provider, v3);

        v3.logger({
          category: "agent",
          message: `Agent calling tool: dragAndDrop`,
          level: 1,
          auxiliary: {
            arguments: { value: JSON.stringify({ describe }), type: "object" },
          },
        });

        // XPaths are only requested while replay recording is active, to
        // avoid computing them needlessly.
        const recordingReplay = v3.isAgentReplayActive();
        const [sourceXpath, targetXpath] = await activePage.dragAndDrop(
          from.x,
          from.y,
          to.x,
          to.y,
          { returnXpath: recordingReplay },
        );

        const screenshotBase64 = await waitAndCaptureScreenshot(activePage);

        // Stored as an "act" step with a concrete Action so the drag can be
        // replayed deterministically; both endpoints must resolve.
        if (recordingReplay) {
          const sourceSelector = ensureXPath(sourceXpath);
          const targetSelector = ensureXPath(targetXpath);
          if (sourceSelector && targetSelector) {
            const replayAction: Action = {
              selector: sourceSelector,
              description: describe,
              method: "dragAndDrop",
              arguments: [targetSelector],
            };
            v3.recordAgentReplayStep({
              type: "act",
              instruction: describe,
              actions: [replayAction],
              actionDescription: describe,
            });
          }
        }

        return { success: true, describe, screenshotBase64 };
      } catch (error) {
        return {
          success: false,
          error: `Error dragging: ${error.message}`,
        };
      }
    },
    toModelOutput: (result) => {
      const failed = result.success === false || result.error !== undefined;
      if (failed) {
        return {
          type: "content",
          value: [{ type: "text", text: JSON.stringify(result) }],
        };
      }

      // The screenshot is sent as a separate media item, not inside the JSON.
      const summary = JSON.stringify({
        success: result.success,
        describe: result.describe,
      });
      const items: ModelOutputContentItem[] = [{ type: "text", text: summary }];
      if (result.screenshotBase64) {
        items.push({
          type: "media",
          mediaType: "image/png",
          data: result.screenshotBase64,
        });
      }
      return { type: "content", value: items };
    },
  });
};


================================================
FILE: packages/core/lib/v3/agent/tools/extract.ts
================================================
import { tool } from "ai";
import { z, ZodTypeAny } from "zod";
import type { V3 } from "../../v3.js";
import type { AgentModelConfig } from "../../types/public/agent.js";
import { TimeoutError } from "../../types/public/sdkErrors.js";

/**
 * Minimal JSON Schema subset understood by `jsonSchemaToZod`.
 * Only these keywords are read; any other keyword on the input is ignored.
 */
interface JsonSchema {
  type?: string;
  properties?: Record<string, JsonSchema>;
  items?: JsonSchema;
  enum?: string[];
  format?: "url" | "email" | "uuid";
}

/**
 * Recursively converts the supported JSON Schema subset into a Zod schema.
 *
 * - `object`: every entry of `properties` becomes a key of a `z.object`.
 * - `array`: `z.array` of the converted `items`, or of `z.any()` when absent.
 * - `string`: `z.enum` when a non-empty `enum` is given (the `format` is then
 *   irrelevant); otherwise `z.string()` refined by `format` if present.
 * - `number` / `integer`: `z.number()`.
 * - `boolean`: `z.boolean()`; `null`: `z.null()`.
 * - anything else, including a missing `type`: `z.any()`.
 *
 * @param schema - JSON Schema fragment to convert.
 * @returns The equivalent Zod schema.
 */
function jsonSchemaToZod(schema: JsonSchema): ZodTypeAny {
  const kind = schema.type;

  if (kind === "object") {
    const shape: Record<string, ZodTypeAny> = {};
    if (schema.properties) {
      Object.entries(schema.properties).forEach(([key, child]) => {
        shape[key] = jsonSchemaToZod(child);
      });
    }
    return z.object(shape);
  }

  if (kind === "array") {
    const element = schema.items ? jsonSchemaToZod(schema.items) : z.any();
    return z.array(element);
  }

  if (kind === "string") {
    // A non-empty enum takes precedence over any format refinement.
    const allowed = schema.enum;
    if (allowed && allowed.length > 0) {
      return z.enum(allowed as [string, ...string[]]);
    }
    if (schema.format === "url") return z.string().url();
    if (schema.format === "email") return z.string().email();
    if (schema.format === "uuid") return z.string().uuid();
    return z.string();
  }

  if (kind === "number" || kind === "integer") return z.number();
  if (kind === "boolean") return z.boolean();
  if (kind === "null") return z.null();

  return z.any();
}

/**
 * Builds the agent's `extract` tool, which pulls structured data from the
 * current page via `v3.extract`.
 *
 * @param v3 Stagehand instance used to run the extraction.
 * @param executionModel Optional model override forwarded to `v3.extract`.
 * @param toolTimeout Optional timeout (ms) forwarded to `v3.extract`.
 * @returns An AI SDK tool. Its `execute` resolves to `{ success: true, result }`
 *   or `{ success: false, error }`; a `TimeoutError` is rethrown to the caller.
 */
export const extractTool = (
  v3: V3,
  executionModel?: string | AgentModelConfig,
  toolTimeout?: number,
) =>
  tool({
    description: `Extract structured data from the current page based on a provided schema.
    
    USAGE GUIDELINES:
    - Keep schemas MINIMAL - only include fields essential for the task
    - IMPORTANT: only use this if explicitly asked for structured output. In most scenarios, you should use the aria tree tool over this.
    - For URL fields, use format: "url"
    
    EXAMPLES:
    1. Extract a single value:
       instruction: "extract the product price"
       schema: { type: "object", properties: { price: { type: "number" } } }
    
    2. Extract multiple fields:
       instruction: "extract product name and price"
       schema: { type: "object", properties: { name: { type: "string" }, price: { type: "number" } } }
    
    3. Extract arrays:
       instruction: "extract all product names and prices"
       schema: { type: "object", properties: { products: { type: "array", items: { type: "object", properties: { name: { type: "string" }, price: { type: "number" } } } } } }
    
    4. Extract a URL:
       instruction: "extract the link"
       schema: { type: "object", properties: { url: { type: "string", format: "url" } } }`,
    inputSchema: z.object({
      instruction: z.string(),
      schema: z
        .object({
          type: z.string().optional(),
          properties: z.record(z.string(), z.unknown()).optional(),
          items: z.unknown().optional(),
          enum: z.array(z.string()).optional(),
          format: z.enum(["url", "email", "uuid"]).optional(),
        })
        .passthrough()
        .optional()
        .describe("JSON Schema object describing the structure to extract"),
    }),
    execute: async ({ instruction, schema }) => {
      try {
        // Only build a Zod schema when the model actually supplied one.
        let zodSchema: ZodTypeAny | undefined;
        if (schema) {
          zodSchema = jsonSchemaToZod(schema as JsonSchema);
        }

        const extractOptions = {
          ...(executionModel ? { model: executionModel } : {}),
          timeout: toolTimeout,
        };
        const result = await v3.extract(instruction, zodSchema, extractOptions);
        return { success: true, result };
      } catch (error) {
        // Anything except a timeout is reported back as a failed result;
        // timeouts propagate to the caller.
        if (!(error instanceof TimeoutError)) {
          return { success: false, error: error?.message ?? String(error) };
        }
        throw error;
      }
    },
  });


================================================
FILE: packages/core/lib/v3/agent/tools/fillFormVision.ts
================================================
import { tool } from "ai";
import { z } from "zod";
import type { V3 } from "../../v3.js";
import type { Action } from "../../types/public/methods.js";
import type {
  FillFormVisionToolResult,
  ModelOutputContentItem,
  Variables,
} from "../../types/public/agent.js";
import { processCoordinates } from "../utils/coordinateNormalization.js";
import { ensureXPath } from "../utils/xpath.js";
import { waitAndCaptureScreenshot } from "../utils/screenshotHandler.js";
import { substituteVariables } from "../utils/variables.js";

/**
 * Builds the coordinate-based `fillFormVision` tool: for each field it clicks
 * the given coordinates and types the value, then captures a screenshot.
 *
 * @param v3 Stagehand instance providing the active page, logger and replay recorder.
 * @param provider Optional model provider, forwarded to `processCoordinates`.
 * @param variables Optional variables; `%name%` tokens in field values are
 *   substituted before typing, while logs and replay steps keep the raw tokens.
 * @returns An AI SDK tool whose `execute` resolves to a `FillFormVisionToolResult`.
 *   Failures are reported as `{ success: false, error }` rather than thrown.
 */
export const fillFormVisionTool = (
  v3: V3,
  provider?: string,
  variables?: Variables,
) => {
  const hasVariables = variables && Object.keys(variables).length > 0;
  const valueDescription = hasVariables
    ? `Text to type into the target field. Use %variableName% to substitute a variable value. Available: ${Object.keys(variables).join(", ")}`
    : "Text to type into the target field";

  return tool({
    description: `FORM FILL - SPECIALIZED MULTI-FIELD INPUT TOOL

CRITICAL: Use this for ANY form with 2+ input fields (text inputs, textareas, etc.)
IMPORTANT: Ensure the fields are visible within the current viewport

WHY THIS TOOL EXISTS:
- Forms are the #1 use case for multi-field input
- Optimized specifically for input/textarea elements
- 4-6x faster than individual typing actions

Use fillFormVision: Pure form filling (inputs, textareas only)
MANDATORY USE CASES (always use fillFormVision for these):
- Registration forms: name, email, password fields
- Contact forms: name, email, message fields
- Checkout forms: address, payment info fields
- Profile updates: multiple user data fields
- Search filters: multiple criteria inputs`,
    inputSchema: z.object({
      fields: z
        .array(
          z.object({
            action: z
              .string()
              .describe(
                "Description of the typing action, e.g. 'type foo into the bar field'",
              ),
            value: z.string().describe(valueDescription),
            coordinates: z
              .object({
                x: z.number(),
                y: z.number(),
              })
              .describe("Coordinates of the target field"),
          }),
        )
        .min(2, "Provide at least two fields to fill"),
    }),
    execute: async ({ fields }): Promise<FillFormVisionToolResult> => {
      try {
        const page = await v3.context.awaitActivePage();

        // Process coordinates and substitute variables for each field
        // Keep original values (with %tokens%) for logging/caching, substituted values for typing
        const processedFields = fields.map((field) => {
          const processed = processCoordinates(
            field.coordinates.x,
            field.coordinates.y,
            provider,
            v3,
          );
          return {
            ...field,
            originalValue: field.value, // Keep original with %tokens% for cache
            value: substituteVariables(field.value, variables),
            coordinates: { x: processed.x, y: processed.y },
          };
        });

        v3.logger({
          category: "agent",
          message: `Agent calling tool: fillFormVision`,
          level: 1,
          auxiliary: {
            arguments: {
              value: JSON.stringify({ fields }), // Don't log substituted values
              type: "object",
            },
          },
        });

        // Only request XPath when caching is enabled to avoid unnecessary computation
        const shouldCollectXpath = v3.isAgentReplayActive();
        const actions: Action[] = [];

        for (const field of processedFields) {
          // Click the field, only requesting XPath when caching is enabled
          const xpath = await page.click(
            field.coordinates.x,
            field.coordinates.y,
            {
              returnXpath: shouldCollectXpath,
            },
          );
          await page.type(field.value);

          // Build Action with XPath for deterministic replay (only when caching)
          // Use originalValue (with %tokens%) so cache stores references, not sensitive values
          if (shouldCollectXpath) {
            const normalizedXpath = ensureXPath(xpath);
            if (normalizedXpath) {
              actions.push({
                selector: normalizedXpath,
                description: field.action,
                method: "type",
                arguments: [field.originalValue],
              });
            }
          }

          // Small delay between fields
          await new Promise((resolve) => setTimeout(resolve, 100));
        }

        const screenshotBase64 = await waitAndCaptureScreenshot(page, 100);

        // Record as "act" step with proper Actions for deterministic replay (only when caching)
        if (shouldCollectXpath && actions.length > 0) {
          v3.recordAgentReplayStep({
            type: "act",
            instruction: `Fill ${fields.length} form fields`,
            actions,
            actionDescription: `Fill ${fields.length} form fields`,
          });
        }

        return {
          success: true,
          playwrightArguments: processedFields,
          screenshotBase64,
        };
      } catch (error) {
        // A thrown value is not guaranteed to be an Error: guard the property
        // access (null/undefined would otherwise throw inside this handler) and
        // fall back to String(error) so the message never reads "undefined".
        const reason = error?.message ?? String(error);
        return {
          success: false,
          error: `Error filling form: ${reason}`,
        };
      }
    },
    // Failures are sent to the model as text only; successes send a short JSON
    // summary plus the post-fill screenshot when one was captured.
    toModelOutput: (result) => {
      if (result.success === false || result.error !== undefined) {
        return {
          type: "content",
          value: [
            {
              type: "text",
              text: JSON.stringify({
                success: result.success,
                error: result.error,
              }),
            },
          ],
        };
      }

      const content: ModelOutputContentItem[] = [
        {
          type: "text",
          text: JSON.stringify({
            success: result.success,
            fieldsCount: result.playwrightArguments?.length ?? 0,
          }),
        },
      ];
      if (result.screenshotBase64) {
        content.push({
          type: "media",
          mediaType: "image/png",
          data: result.screenshotBase64,
        });
      }
      return { type: "content", value: content };
    },
  });
};


================================================
FILE: packages/core/lib/v3/agent/tools/fillform.ts
================================================
import { tool } from "ai";
import { z } from "zod";
import type { V3 } from "../../v3.js";
import type { Action } from "../../types/public/methods.js";
import type { AgentModelConfig, Variables } from "../../types/public/agent.js";
import { TimeoutError } from "../../types/public/sdkErrors.js";

/**
 * Builds the DOM-based `fillForm` tool. It runs a single `v3.observe` for all
 * requested field actions, then executes each observed result with `v3.act`.
 *
 * @param v3 Stagehand instance used for observe/act, logging and replay recording.
 * @param executionModel Optional model override forwarded to `v3.observe`.
 * @param variables Optional variables forwarded to `v3.act` and advertised to
 *   the model as `%variableName%` tokens in the field description.
 * @param toolTimeout Optional timeout (ms) forwarded to both observe and act.
 * @returns An AI SDK tool. Its `execute` resolves to a success result carrying
 *   the act results and replayable actions, or `{ success: false, error }`;
 *   a `TimeoutError` is rethrown to the caller.
 */
export const fillFormTool = (
  v3: V3,
  executionModel?: string | AgentModelConfig,
  variables?: Variables,
  toolTimeout?: number,
) => {
  const hasVariables = variables && Object.keys(variables).length > 0;
  const actionDescription = hasVariables
    ? `Must follow the pattern: "type <exact value> into the <field name> <fieldType>". Use %variableName% to substitute a variable value. Available: ${Object.keys(variables).join(", ")}. Examples: "type %email% into the email input", "type %password% into the password input"`
    : 'Must follow the pattern: "type <exact value> into the <field name> <fieldType>". Examples: "type john@example.com into the email input", "type John into the first name input"';

  return tool({
    description:
      'FORM FILL - MULTI-FIELD INPUT TOOL\nFill 2+ form inputs/textareas at once. Each action MUST include the exact text to type and the target field, e.g. "type john@example.com into the email field".',
    inputSchema: z.object({
      fields: z
        .array(
          z.object({
            action: z.string().describe(actionDescription),
          }),
        )
        .min(1, "Provide at least one field to fill"),
    }),
    execute: async ({ fields }) => {
      try {
        v3.logger({
          category: "agent",
          message: `Agent calling tool: fillForm`,
          level: 1,
          auxiliary: {
            arguments: {
              value: JSON.stringify(fields),
              type: "object",
            },
          },
        });

        // One observe call covers every requested field action.
        const requestedActions = fields.map((f) => f.action).join(", ");
        const instruction = `Return observation results for the following actions: ${requestedActions}`;
        const observeOptions = {
          ...(executionModel ? { model: executionModel } : {}),
          timeout: toolTimeout,
        };
        const observeResults = await v3.observe(instruction, observeOptions);

        const completed: unknown[] = [];
        const replayableActions: Action[] = [];
        for (const observed of observeResults) {
          const actOptions = {
            ...(variables ? { variables } : {}),
            timeout: toolTimeout,
          };
          const actResult = await v3.act(observed, actOptions);
          completed.push(actResult);

          // Collect whatever actions the act call reports so the step can be replayed.
          if (Array.isArray(actResult.actions)) {
            for (const action of actResult.actions as Action[]) {
              replayableActions.push(action);
            }
          }
        }

        v3.recordAgentReplayStep({
          type: "fillForm",
          fields,
          observeResults,
          actions: replayableActions,
        });

        return {
          success: true,
          actions: completed,
          playwrightArguments: replayableActions,
        };
      } catch (error) {
        // Timeouts propagate; every other failure becomes a failed result.
        if (!(error instanceof TimeoutError)) {
          return {
            success: false,
            error: error?.message ?? String(error),
          };
        }
        throw error;
      }
    },
  });
};


================================================
FILE: packages/core/lib/v3/agent/tools/goto.ts
================================================
import { tool } from "ai";
import { z } from "zod";
import type { V3 } from "../../v3.js";

/**
 * Builds the `goto` tool, which navigates the active page to a URL and waits
 * for the "load" event.
 *
 * @param v3 Stagehand instance providing the active page, logger and replay recorder.
 * @returns An AI SDK tool whose `execute` resolves to `{ success: true, url }`
 *   or `{ success: false, error }`.
 */
export const gotoTool = (v3: V3) =>
  tool({
    description: "Navigate to a specific URL",
    inputSchema: z.object({
      url: z.string().describe("The URL to navigate to"),
    }),
    execute: async ({ url }) => {
      try {
        v3.logger({
          category: "agent",
          message: `Agent calling tool: goto`,
          level: 1,
          auxiliary: {
            arguments: { value: url, type: "string" },
          },
        });

        const activePage = await v3.context.awaitActivePage();
        await activePage.goto(url, { waitUntil: "load" });

        // Only recorded once navigation has succeeded.
        v3.recordAgentReplayStep({ type: "goto", url, waitUntil: "load" });
        return { success: true, url };
      } catch (error) {
        const reason = error?.message ?? String(error);
        return { success: false, error: reason };
      }
    },
  });


================================================
FILE: packages/core/lib/v3/agent/tools/index.ts
================================================
import { gotoTool } from "./goto.js";
import { actTool } from "./act.js";
import { screenshotTool } from "./screenshot.js";
import { waitTool } from "./wait.js";
import { navBackTool } from "./navback.js";
import { ariaTreeTool } from "./ariaTree.js";
import { fillFormTool } from "./fillform.js";
import { scrollTool, scrollVisionTool } from "./scroll.js";
import { extractTool } from "./extract.js";
import { clickTool } from "./click.js";
import { typeTool } from "./type.js";
import { dragAndDropTool } from "./dragAndDrop.js";
import { clickAndHoldTool } from "./clickAndHold.js";
import { keysTool } from "./keys.js";
import { fillFormVisionTool } from "./fillFormVision.js";
import { thinkTool } from "./think.js";
import { searchTool as browserbaseSearchTool } from "./browserbaseSearch.js";
import { searchTool as braveSearchTool } from "./braveSearch.js";

import type { ToolSet, InferUITools } from "ai";
import type { V3 } from "../../v3.js";
import type { LogLine } from "../../types/public/logs.js";
import type {
  AgentToolMode,
  AgentModelConfig,
  Variables,
} from "../../types/public/agent.js";
import { withTimeout } from "../../timeoutConfig.js";
import { TimeoutError } from "../../types/public/sdkErrors.js";

/** Options accepted by `createAgentTools` to configure the agent toolset. */
export interface V3AgentToolOptions {
  /** Model override forwarded to the act, extract and fillForm tools. */
  executionModel?: string | AgentModelConfig;
  /** Optional log sink. */
  logger?: (message: LogLine) => void;
  /**
   * Tool mode determines which set of tools are available.
   * - 'dom' (default): Uses DOM-based tools (act, fillForm) - removes coordinate-based tools
   * - 'hybrid': Uses coordinate-based tools (click, type, dragAndDrop, etc.) - removes fillForm
   */
  mode?: AgentToolMode;
  /**
   * The model provider. Used for model-specific coordinate handling
   */
  provider?: string;
  /**
   * Tools to exclude from the available toolset.
   * These tools will be filtered out after mode-based filtering.
   */
  excludeTools?: string[];
  /**
   * Variables available to the agent. They are passed to the act, fillForm,
   * fillFormVision and type tools; the form and type tools advertise them to
   * the model as %variableName% tokens in their input descriptions.
   */
  variables?: Variables;
  /**
   * Timeout in milliseconds for async tool calls.
   * Applied to every tool except wait and think.
   */
  toolTimeout?: number;
  /**
   * Whether to enable the Browserbase-powered web search tool.
   * Requires a valid Browserbase API key.
   */
  useSearch?: boolean;
  /**
   * The Browserbase API key used for the search tool.
   * Resolved from BROWSERBASE_API_KEY env var or the Stagehand constructor.
   */
  browserbaseApiKey?: string;
}

/**
 * Returns a shallow copy of `tools` with mode-specific and explicitly excluded
 * entries removed. The input object is never mutated.
 *
 * - 'hybrid' mode drops the DOM-based form tool (fillForm), leaving
 *   fillFormVision in its place.
 * - Any other mode (i.e. 'dom', the default) drops the coordinate-based tools:
 *   click, type, dragAndDrop, clickAndHold and fillFormVision.
 * - Names listed in `excludeTools` are dropped afterwards.
 */
function filterTools(
  tools: ToolSet,
  mode: AgentToolMode,
  excludeTools?: string[],
): ToolSet {
  const hiddenByMode: string[] =
    mode === "hybrid"
      ? ["fillForm"]
      : ["click", "type", "dragAndDrop", "clickAndHold", "fillFormVision"];

  const remaining: ToolSet = { ...tools };
  for (const name of hiddenByMode) {
    delete remaining[name];
  }

  // Caller-requested exclusions apply on top of the mode-based ones.
  if (excludeTools) {
    for (const name of excludeTools) {
      delete remaining[name];
    }
  }

  return remaining;
}

/**
 * Returns a copy of an AI SDK tool whose `execute` is raced against a timeout
 * via `withTimeout`.
 *
 * When no timeout is configured, or the tool has no `execute`, the tool is
 * returned unchanged. If the call times out, the error is logged at level 0
 * and `{ success: false, error: "TimeoutError: ..." }` (plus the optional
 * hint) is returned to the LLM instead of throwing. Any other error is
 * rethrown unchanged.
 */
// eslint-disable-next-line @typescript-eslint/no-explicit-any
function wrapToolWithTimeout<T extends Record<string, any>>(
  agentTool: T,
  toolName: string,
  v3: V3,
  timeoutMs?: number,
  timeoutHint?: string,
): T {
  if (!timeoutMs) return agentTool;

  const innerExecute = agentTool.execute;
  if (!innerExecute) return agentTool;

  const guardedExecute = async (...args: unknown[]) => {
    try {
      return await withTimeout(innerExecute(...args), timeoutMs, toolName);
    } catch (error) {
      if (!(error instanceof TimeoutError)) {
        throw error;
      }

      const hintSuffix = timeoutHint ? ` ${timeoutHint}` : "";
      const message = `TimeoutError: ${error.message}${hintSuffix}`;
      v3.logger({
        category: "agent",
        message,
        level: 0,
      });
      return {
        success: false,
        error: message,
      };
    }
  };

  return { ...agentTool, execute: guardedExecute } as T;
}

/**
 * Assembles the agent toolset for a Stagehand instance.
 *
 * Every tool except `think` and `wait` is wrapped with the configured tool
 * timeout. An optional `search` tool is added when Browserbase search is
 * enabled with an API key, or otherwise when `BRAVE_API_KEY` is set. The final
 * set is filtered by mode and by `excludeTools`.
 *
 * @param v3 Stagehand instance the tools operate on.
 * @param options Optional toolset configuration; mode defaults to "dom".
 * @returns The filtered `ToolSet`.
 */
export function createAgentTools(v3: V3, options?: V3AgentToolOptions) {
  const opts: V3AgentToolOptions = options ?? {};
  const { executionModel, provider, excludeTools, variables, toolTimeout } =
    opts;
  const mode = opts.mode ?? "dom";

  // Extra guidance appended to the timeout message for selected tools.
  const timeoutHints: Record<string, string> = {
    act: "(it may continue executing in the background) — try using a different description for the action",
    ariaTree: "— the page may be too large",
    extract: "— try using a smaller or simpler schema",
    fillForm:
      "(it may continue executing in the background) — try filling fewer fields at once or use a different tool",
  };

  const unwrappedTools: ToolSet = {
    act: actTool(v3, executionModel, variables, toolTimeout),
    ariaTree: ariaTreeTool(v3, toolTimeout),
    click: clickTool(v3, provider),
    clickAndHold: clickAndHoldTool(v3, provider),
    dragAndDrop: dragAndDropTool(v3, provider),
    extract: extractTool(v3, executionModel, toolTimeout),
    fillForm: fillFormTool(v3, executionModel, variables, toolTimeout),
    fillFormVision: fillFormVisionTool(v3, provider, variables),
    goto: gotoTool(v3),
    keys: keysTool(v3),
    navback: navBackTool(v3),
    screenshot: screenshotTool(v3),
    scroll: mode === "hybrid" ? scrollVisionTool(v3, provider) : scrollTool(v3),
    type: typeTool(v3, provider, variables),
  };

  // Browserbase search takes precedence; Brave is the env-var fallback.
  if (opts.useSearch && opts.browserbaseApiKey) {
    unwrappedTools.search = browserbaseSearchTool(v3, opts.browserbaseApiKey);
  } else if (process.env.BRAVE_API_KEY) {
    unwrappedTools.search = braveSearchTool(v3);
  }

  const allTools: ToolSet = {};
  for (const [name, agentTool] of Object.entries(unwrappedTools)) {
    allTools[name] = wrapToolWithTimeout(
      agentTool,
      `${name}()`,
      v3,
      toolTimeout,
      timeoutHints[name],
    );
  }
  // think and wait are added after wrapping, so they carry no timeout guard.
  allTools.think = thinkTool();
  allTools.wait = waitTool(v3, mode);

  return filterTools(allTools, mode, excludeTools);
}

/** The toolset type produced by `createAgentTools`. */
export type AgentTools = ReturnType<typeof createAgentTools>;

/**
 * Type map of all agent tools for strong typing of tool calls and results.
 * Each key is a tool name and each value is the return type of that tool's factory.
 * Note: `scroll` is a union because two factories (scrollTool / scrollVisionTool) can back it.
 * Note: `search` is optional — enabled via useSearch: true (Browserbase) or BRAVE_API_KEY env var (legacy).
 */
export type AgentToolTypesMap = {
  act: ReturnType<typeof actTool>;
  ariaTree: ReturnType<typeof ariaTreeTool>;
  click: ReturnType<typeof clickTool>;
  clickAndHold: ReturnType<typeof clickAndHoldTool>;
  dragAndDrop: ReturnType<typeof dragAndDropTool>;
  extract: ReturnType<typeof extractTool>;
  fillForm: ReturnType<typeof fillFormTool>;
  fillFormVision: ReturnType<typeof fillFormVisionTool>;
  goto: ReturnType<typeof gotoTool>;
  keys: ReturnType<typeof keysTool>;
  navback: ReturnType<typeof navBackTool>;
  screenshot: ReturnType<typeof screenshotTool>;
  scroll: ReturnType<typeof scrollTool> | ReturnType<typeof scrollVisionTool>;
  search?:
    | ReturnType<typeof browserbaseSearchTool>
    | ReturnType<typeof braveSearchTool>;
  think: ReturnType<typeof thinkTool>;
  type: ReturnType<typeof typeTool>;
  wait: ReturnType<typeof waitTool>;
};

/**
 * Inferred UI tools type for type-safe tool inputs and outputs.
 * Derived from `AgentToolTypesMap` via the AI SDK's `InferUITools` helper.
 * Use with UIMessage for full type safety in UI contexts.
 */
export type AgentUITools = InferUITools<AgentToolTypesMap>;

/**
 * Union type for all possible agent tool calls.
 * Provides type-safe access to tool call arguments: each member pairs a
 * literal `toolName` with that tool's input type as `args`.
 */
export type AgentToolCall = {
  [K in keyof AgentToolTypesMap]: {
    toolName: K;
    toolCallId: string;
    args: AgentUITools[K]["input"];
  };
}[keyof AgentToolTypesMap];

/**
 * Union type for all possible agent tool results.
 * Provides type-safe access to tool result values: each member pairs a
 * literal `toolName` with that tool's output type as `result`.
 */
export type AgentToolResult = {
  [K in keyof AgentToolTypesMap]: {
    toolName: K;
    toolCallId: string;
    result: AgentUITools[K]["output"];
  };
}[keyof AgentToolTypesMap];


================================================
FILE: packages/core/lib/v3/agent/tools/keys.ts
================================================
import { tool } from "ai";
import { z } from "zod";
import type { V3 } from "../../v3.js";

/**
 * Builds the `keys` tool, which sends keyboard input to the active page
 * without targeting an element.
 *
 * - method "type" calls `page.type(value)`; method "press" calls `page.keyPress(value)`.
 * - `repeat` controls how many times the input is sent (at least once).
 *
 * @param v3 Stagehand instance providing the active page, logger and replay recorder.
 * @returns An AI SDK tool whose `execute` resolves to
 *   `{ success: true, method, value, times }` or `{ success: false, error }`.
 */
export const keysTool = (v3: V3) =>
  tool({
    description: `Send keyboard input to the page without targeting a specific element. Unlike the type tool which clicks then types into coordinates, this sends keystrokes directly to wherever focus currently is.

Use method="type" to enter text into the currently focused element. Preferred when: input is already focused, text needs to flow across multiple fields (e.g., verification codes)

Use method="press" for navigation keys (Enter, Tab, Escape, Backspace, arrows) and keyboard shortcuts (Cmd+A, Ctrl+C, Shift+Tab).`,
    inputSchema: z.object({
      method: z.enum(["press", "type"]),
      value: z
        .string()
        .describe(
          "The text to type, or the key/combo to press (Enter, Tab, Cmd+A)",
        ),
      repeat: z.number().optional(),
    }),
    execute: async ({ method, value, repeat }) => {
      try {
        const page = await v3.context.awaitActivePage();
        v3.logger({
          category: "agent",
          message: `Agent calling tool: keys`,
          level: 1,
          auxiliary: {
            arguments: {
              value: JSON.stringify({ method, value, repeat }),
              type: "object",
            },
          },
        });

        // Always send the input at least once, even for repeat <= 0 or omitted.
        const times = Math.max(1, repeat ?? 1);

        if (method === "type") {
          for (let i = 0; i < times; i++) {
            await page.type(value, { delay: 100 });
          }
          v3.recordAgentReplayStep({
            type: "keys",
            instruction: `type "${value}"`,
            playwrightArguments: { method, text: value, times },
          });
          return { success: true, method, value, times };
        }

        if (method === "press") {
          for (let i = 0; i < times; i++) {
            await page.keyPress(value, { delay: 100 });
          }
          v3.recordAgentReplayStep({
            type: "keys",
            instruction: `press ${value}`,
            playwrightArguments: { method, keys: value, times },
          });
          return { success: true, method, value, times };
        }

        return { success: false, error: `Unsupported method: ${method}` };
      } catch (error) {
        // A thrown value is not guaranteed to be an Error: guard the access so
        // null/undefined cannot throw here, and fall back to String(error) so
        // the reported error is never undefined.
        return { success: false, error: error?.message ?? String(error) };
      }
    },
  });


================================================
FILE: packages/core/lib/v3/agent/tools/navback.ts
================================================
import { tool } from "ai";
import { z } from "zod";
import type { V3 } from "../../v3.js";

/**
 * Builds the `navback` tool, which moves the active page one entry back in
 * history and waits for "domcontentloaded".
 *
 * The `reasoningText` input is required by the schema but not read by `execute`.
 * Errors from the page are not caught here and propagate to the caller.
 *
 * @param v3 Stagehand instance providing the active page, logger and replay recorder.
 * @returns An AI SDK tool whose `execute` resolves to `{ success: true }`.
 */
export const navBackTool = (v3: V3) =>
  tool({
    description: "Navigate back to the previous page",
    inputSchema: z.object({
      reasoningText: z.string().describe("Why you're going back"),
    }),
    execute: async () => {
      v3.logger({
        category: "agent",
        message: `Agent calling tool: navback`,
        level: 1,
      });

      const activePage = await v3.context.awaitActivePage();
      await activePage.goBack({ waitUntil: "domcontentloaded" });

      // Recorded only after the navigation call has resolved.
      v3.recordAgentReplayStep({
        type: "navback",
        waitUntil: "domcontentloaded",
      });

      return { success: true };
    },
  });


================================================
FILE: packages/core/lib/v3/agent/tools/screenshot.ts
================================================
import { tool } from "ai";
import { z } from "zod";
import type { V3 } from "../../v3.js";

/**
 * Builds the `screenshot` tool, which captures the current viewport (not the
 * full page) of the active page as a base64-encoded PNG.
 *
 * @param v3 Stagehand instance providing the active page and logger.
 * @returns An AI SDK tool. `execute` resolves to the base64 image, a timestamp
 *   and the page URL, or `{ success: false, error }`. `toModelOutput` sends
 *   the image as media on success and the JSON-serialised result on failure.
 */
export const screenshotTool = (v3: V3) =>
  tool({
    description:
      "Takes a screenshot (PNG) of the current page. Use this to quickly verify page state.",
    inputSchema: z.object({}),
    execute: async () => {
      try {
        v3.logger({
          category: "agent",
          message: `Agent calling tool: screenshot`,
          level: 1,
        });

        const activePage = await v3.context.awaitActivePage();
        const png = await activePage.screenshot({ fullPage: false });
        // URL is read after the capture, matching the page state of the image.
        const pageUrl = activePage.url();
        const base64 = png.toString("base64");

        return {
          success: true,
          base64,
          timestamp: Date.now(),
          pageUrl,
        };
      } catch (error) {
        const reason = (error as Error).message;
        return {
          success: false,
          error: `Error taking screenshot: ${reason}`,
        };
      }
    },
    toModelOutput: (result) => {
      // Failed captures are reported to the model as plain JSON text.
      if (result.success === false || result.error !== undefined) {
        const text = JSON.stringify(result);
        return {
          type: "content",
          value: [{ type: "text", text }],
        };
      }

      return {
        type: "content",
        value: [{ type: "media", mediaType: "image/png", data: result.base64 }],
      };
    },
  });


================================================
FILE: packages/core/lib/v3/agent/tools/scroll.ts
================================================
import { tool } from "ai";
import { z } from "zod";
import type { V3 } from "../../v3.js";
import type {
  ScrollToolResult,
  ScrollVisionToolResult,
  ModelOutputContentItem,
} from "../../types/public/agent.js";
import { processCoordinates } from "../utils/coordinateNormalization.js";
import { waitAndCaptureScreenshot } from "../utils/screenshotHandler.js";

/**
 * Scroll tool for DOM mode (non-grounding models).
 * Takes no coordinates: the scroll is always anchored at the viewport centre
 * and its distance is a percentage of the viewport height (80% by default).
 */
export const scrollTool = (v3: V3) =>
  tool({
    description:
      "Scroll the page up or down by a percentage of the viewport height. Default is 80%, and what should be typically used for general page scrolling",
    inputSchema: z.object({
      direction: z.enum(["up", "down"]),
      percentage: z.number().min(1).max(200).optional(),
    }),
    execute: async ({
      direction,
      percentage = 80,
    }): Promise<ScrollToolResult> => {
      v3.logger({
        category: "agent",
        message: `Agent calling tool: scroll`,
        level: 1,
        auxiliary: {
          arguments: {
            value: JSON.stringify({ direction, percentage }),
            type: "object",
          },
        },
      });

      const activePage = await v3.context.awaitActivePage();

      // Read the live viewport size from the page's main frame.
      const viewport = await activePage.mainFrame().evaluate<{
        w: number;
        h: number;
      }>("({ w: window.innerWidth, h: window.innerHeight })");

      const anchor = {
        x: Math.floor(viewport.w / 2),
        y: Math.floor(viewport.h / 2),
      };
      const scrollDistance = Math.round((viewport.h * percentage) / 100);
      // Negative delta scrolls up, positive scrolls down.
      const deltaY = direction === "up" ? -scrollDistance : scrollDistance;

      await activePage.scroll(anchor.x, anchor.y, 0, deltaY);

      v3.recordAgentReplayStep({
        type: "scroll",
        deltaX: 0,
        deltaY,
        anchor,
      });

      return {
        success: true,
        message: `Scrolled ${percentage}% ${direction} (${scrollDistance}px)`,
        scrolledPixels: scrollDistance,
      };
    },
    toModelOutput: (result) => {
      // Failures go to the model as JSON text; successes as a JSON value.
      if (result.success === false || result.error !== undefined) {
        const text = JSON.stringify(result);
        return {
          type: "content",
          value: [{ type: "text", text }],
        };
      }

      const { success, message, scrolledPixels } = result;
      return {
        type: "json",
        value: { success, message, scrolledPixels },
      };
    },
  });

/**
 * Scroll tool for hybrid mode (grounding models).
 * Supports optional coordinates for scrolling within nested scrollable elements.
 *
 * The scroll distance is a percentage of the viewport height (80% by default).
 * When `coordinates` holds at least an (x, y) pair, it is normalised through
 * `processCoordinates` and used as the scroll anchor. Otherwise — including a
 * malformed array with fewer than two entries — the viewport centre is used.
 * A screenshot is captured after scrolling and returned with the result.
 *
 * @param v3 Stagehand instance providing the active page, logger and replay recorder.
 * @param provider Optional model provider, forwarded to `processCoordinates`.
 */
export const scrollVisionTool = (v3: V3, provider?: string) =>
  tool({
    description: `Scroll the page up or down. For general page scrolling, no coordinates needed. Only provide coordinates when scrolling inside a nested scrollable element (e.g., a dropdown menu, modal with overflow, or scrollable sidebar). Default is 80%, and what should be typically used for general page scrolling`,
    inputSchema: z.object({
      direction: z.enum(["up", "down"]),
      coordinates: z
        .array(z.number())
        .optional()
        .describe(
          "Only use coordinates for scrolling inside a nested scrollable element - provide (x, y) within that element",
        ),
      percentage: z.number().min(1).max(200).optional(),
    }),
    execute: async ({
      direction,
      coordinates,
      percentage = 80,
    }): Promise<ScrollVisionToolResult> => {
      const page = await v3.context.awaitActivePage();

      const { w, h } = await page.mainFrame().evaluate<{
        w: number;
        h: number;
      }>("({ w: window.innerWidth, h: window.innerHeight })");

      // Process coordinates if a full (x, y) pair was provided, otherwise use
      // the viewport center. The schema does not constrain the array length,
      // so an empty or one-element array must not reach processCoordinates
      // with undefined components.
      let cx: number;
      let cy: number;
      let anchoredAtCoordinates = false;
      if (coordinates && coordinates.length >= 2) {
        const processed = processCoordinates(
          coordinates[0],
          coordinates[1],
          provider,
          v3,
        );
        cx = processed.x;
        cy = processed.y;
        anchoredAtCoordinates = true;
      } else {
        cx = Math.floor(w / 2);
        cy = Math.floor(h / 2);
      }

      v3.logger({
        category: "agent",
        message: `Agent calling tool: scroll`,
        level: 1,
        auxiliary: {
          arguments: {
            value: JSON.stringify({
              direction,
              coordinates,
              percentage,
              processed: { cx, cy },
            }),
            type: "object",
          },
        },
      });

      const scrollDistance = Math.round((h * percentage) / 100);
      // Negative delta scrolls up, positive scrolls down.
      const deltaY = direction === "up" ? -scrollDistance : scrollDistance;

      await page.scroll(cx, cy, 0, deltaY);

      const screenshotBase64 = await waitAndCaptureScreenshot(page, 100);

      v3.recordAgentReplayStep({
        type: "scroll",
        deltaX: 0,
        deltaY,
        anchor: { x: cx, y: cy },
      });

      return {
        success: true,
        // Only mention the anchor when the supplied coordinates were actually used.
        message: anchoredAtCoordinates
          ? `Scrolled ${percentage}% ${direction} at (${cx}, ${cy})`
          : `Scrolled ${percentage}% ${direction}`,
        scrolledPixels: scrollDistance,
        screenshotBase64,
      };
    },
    // Failures are sent to the model as JSON text; successes send a short JSON
    // summary plus the post-scroll screenshot when one was captured.
    toModelOutput: (result) => {
      if (result.success === false || result.error !== undefined) {
        return {
          type: "content",
          value: [{ type: "text", text: JSON.stringify(result) }],
        };
      }

      const content: ModelOutputContentItem[] = [
        {
          type: "text",
          text: JSON.stringify({
            success: result.success,
            message: result.message,
            scrolledPixels: result.scrolledPixels,
          }),
        },
      ];
      if (result.screenshotBase64) {
        content.push({
          type: "media",
          mediaType: "image/png",
          data: result.screenshotBase64,
        });
      }
      return { type: "content", value: content };
    },
  });


================================================
FILE: packages/core/lib/v3/agent/tools/think.ts
================================================
import { tool } from "ai";
import { z } from "zod";

/**
 * Builds the `think` agent tool: a scratchpad with no side effects whose
 * execute handler echoes the supplied reasoning back in its result.
 */
export const thinkTool = () => {
  const description = `Use this tool to think through complex problems or plan a sequence of steps. This is for internal reasoning only and doesn't perform any actions. Use this to:

1. Plan a multi-step approach before taking action
2. Break down complex tasks
3. Reason through edge cases
4. Evaluate options when you're unsure what to do next

The output is only visible to you; use it to track your own reasoning process.`;

  const inputSchema = z.object({
    reasoning: z
      .string()
      .describe(
        "Your step-by-step reasoning or planning process. Be as detailed as needed.",
      ),
  });

  return tool({
    description,
    inputSchema,
    // Nothing is executed; the reasoning is acknowledged and handed back.
    execute: async ({ reasoning }) => ({
      acknowledged: true,
      message: reasoning,
    }),
  });
};


================================================
FILE: packages/core/lib/v3/agent/tools/type.ts
================================================
import { tool } from "ai";
import { z } from "zod";
import type { V3 } from "../../v3.js";
import type { Action } from "../../types/public/methods.js";
import type {
  TypeToolResult,
  ModelOutputContentItem,
  Variables,
} from "../../types/public/agent.js";
import { processCoordinates } from "../utils/coordinateNormalization.js";
import { ensureXPath } from "../utils/xpath.js";
import { waitAndCaptureScreenshot } from "../utils/screenshotHandler.js";
import { substituteVariables } from "../utils/variables.js";

/**
 * Builds the coordinate-based `type` agent tool.
 *
 * The tool clicks at the supplied (x, y) position and then calls `page.type`
 * with the text. `%variableName%` tokens in the text are expanded through
 * `substituteVariables` right before typing; the log line, the recorded replay
 * step and the tool result all carry the original, unexpanded text.
 *
 * @param v3 - Stagehand instance supplying the active page, logger and replay recorder.
 * @param provider - Model provider name, forwarded to `processCoordinates`.
 * @param variables - Optional variables the model may reference as `%name%`.
 * @returns An AI SDK tool whose result is a `TypeToolResult`; failures are
 *   reported as `{ success: false, error }` rather than thrown.
 */
export const typeTool = (v3: V3, provider?: string, variables?: Variables) => {
  const hasVariables = variables && Object.keys(variables).length > 0;
  const textDescription = hasVariables
    ? `The text to type into the element. Use %variableName% to substitute a variable value. Available: ${Object.keys(variables).join(", ")}`
    : "The text to type into the element";

  return tool({
    description:
      "Type text into an element using its coordinates. This will click the element and then type the text into it (this is the most reliable way to type into an element, always use this over act, unless the element is not visible in the screenshot, but shown in ariaTree)",
    inputSchema: z.object({
      describe: z
        .string()
        .describe(
          "Describe the element to type into in a short, specific phrase that mentions the element type and a good visual description",
        ),
      text: z.string().describe(textDescription),
      coordinates: z
        .array(z.number())
        .describe("The (x, y) coordinates to type into the element"),
    }),
    execute: async ({
      describe,
      coordinates,
      text,
    }): Promise<TypeToolResult> => {
      try {
        // The schema accepts arrays of any length; fail with a readable message
        // instead of clicking at an undefined coordinate.
        if (coordinates.length < 2) {
          throw new Error(
            `expected [x, y] coordinates but received ${coordinates.length} value(s)`,
          );
        }

        const page = await v3.context.awaitActivePage();
        const processed = processCoordinates(
          coordinates[0],
          coordinates[1],
          provider,
          v3,
        );

        // Substitute any %variableName% tokens in the text
        const actualText = substituteVariables(text, variables);

        // Log the unexpanded text so substituted values stay out of the logs.
        v3.logger({
          category: "agent",
          message: `Agent calling tool: type`,
          level: 1,
          auxiliary: {
            arguments: {
              value: JSON.stringify({ describe, text }),
              type: "object",
            },
          },
        });

        // Only request XPath when caching is enabled to avoid unnecessary computation
        const shouldCollectXpath = v3.isAgentReplayActive();
        const xpath = await page.click(processed.x, processed.y, {
          returnXpath: shouldCollectXpath,
        });

        await page.type(actualText);

        const screenshotBase64 = await waitAndCaptureScreenshot(page);

        // Record as an "act" step with proper Action for deterministic replay (only when caching)
        if (shouldCollectXpath) {
          const normalizedXpath = ensureXPath(xpath);
          if (normalizedXpath) {
            const action: Action = {
              selector: normalizedXpath,
              description: describe,
              method: "type",
              arguments: [text],
            };
            v3.recordAgentReplayStep({
              type: "act",
              instruction: describe,
              actions: [action],
              actionDescription: describe,
            });
          }
        }

        return {
          success: true,
          describe,
          text, // Return original text (with %variableName% tokens) to avoid exposing sensitive values to LLM
          screenshotBase64,
        };
      } catch (error) {
        // Thrown values are not guaranteed to be Error instances; never let the
        // handler itself throw while building the failure message.
        const thrownMessage = (
          error as { message?: unknown } | null | undefined
        )?.message;
        const reason =
          thrownMessage !== undefined ? String(thrownMessage) : String(error);
        return {
          success: false,
          error: `Error typing: ${reason}`,
        };
      }
    },
    toModelOutput: (result) => {
      // Failures are forwarded verbatim as a single text item.
      if (result.success === false || result.error !== undefined) {
        return {
          type: "content",
          value: [{ type: "text", text: JSON.stringify(result) }],
        };
      }

      const content: ModelOutputContentItem[] = [
        {
          type: "text",
          text: JSON.stringify({
            success: result.success,
            describe: result.describe,
            text: result.text,
          }),
        },
      ];
      // The screenshot travels as a separate media item, not inside the JSON text.
      if (result.screenshotBase64) {
        content.push({
          type: "media",
          mediaType: "image/png",
          data: result.screenshotBase64,
        });
      }
      return { type: "content", value: content };
    },
  });
};


================================================
FILE: packages/core/lib/v3/agent/tools/wait.ts
================================================
import { tool } from "ai";
import { z } from "zod";
import type { V3 } from "../../v3.js";
import type {
  AgentToolMode,
  WaitToolResult,
  ModelOutputContentItem,
} from "../../types/public/agent.js";
import { waitAndCaptureScreenshot } from "../utils/screenshotHandler.js";

/**
 * Builds the `wait` agent tool, which pauses for the requested number of
 * milliseconds. Positive waits are recorded as replay steps, and in "hybrid"
 * mode a screenshot of the active page is attached to the result.
 */
export const waitTool = (v3: V3, mode?: AgentToolMode) =>
  tool({
    description: "Wait for a specified time",
    inputSchema: z.object({
      timeMs: z.number().describe("Time in milliseconds"),
    }),
    execute: async ({ timeMs }): Promise<WaitToolResult> => {
      v3.logger({
        category: "agent",
        message: `Agent calling tool: wait`,
        level: 1,
        auxiliary: {
          arguments: {
            value: `Waiting for ${timeMs} milliseconds`,
            type: "string",
          },
        },
      });

      await new Promise((wake) => {
        setTimeout(wake, timeMs);
      });

      // Zero or negative waits are not recorded for replay.
      if (timeMs > 0) {
        v3.recordAgentReplayStep({ type: "wait", timeMs });
      }

      if (mode !== "hybrid") {
        return { success: true, waited: timeMs };
      }

      // Hybrid mode: capture the page after the pause for visual feedback.
      const activePage = await v3.context.awaitActivePage();
      const screenshotBase64 = await waitAndCaptureScreenshot(activePage, 0);
      return { success: true, waited: timeMs, screenshotBase64 };
    },
    toModelOutput: (result) => {
      // Failures are forwarded verbatim as a single text item.
      if (result.success === false || result.error !== undefined) {
        return {
          type: "content",
          value: [{ type: "text", text: JSON.stringify(result) }],
        };
      }

      const summary = JSON.stringify({
        success: result.success,
        waited: result.waited,
      });
      const parts: ModelOutputContentItem[] = [{ type: "text", text: summary }];

      if (result.screenshotBase64) {
        parts.push({
          type: "media",
          mediaType: "image/png",
          data: result.screenshotBase64,
        });
      }

      return { type: "content", value: parts };
    },
  });


================================================
FILE: packages/core/lib/v3/agent/utils/actionMapping.ts
================================================
import { AgentAction } from "../../types/public/agent.js";
import { ActionMappingOptions } from "../../types/private/agent.js";

/**
 * Tool-output keys that are dropped when an output is mapped onto an action.
 * They hold large payloads that do not belong in the actions array; the data
 * remains reachable through result.messages.
 */
const EXCLUDED_OUTPUT_KEYS = ["screenshotBase64"] as const;

/**
 * Returns a shallow copy of `output` without the excluded keys
 * (such as screenshotBase64). The input object is left untouched.
 */
function stripExcludedKeys(
  output: Record<string, unknown>,
): Record<string, unknown> {
  const excluded: readonly string[] = EXCLUDED_OUTPUT_KEYS;

  return Object.keys(output).reduce<Record<string, unknown>>((kept, key) => {
    if (!excluded.includes(key)) {
      kept[key] = output[key];
    }
    return kept;
  }, {});
}

/**
 * Converts one tool call (name, result, arguments, reasoning) into the
 * AgentAction entries that describe it. "act" and "fillForm" have dedicated
 * mappers; every other tool yields a single standard action.
 */
export function mapToolResultToActions({
  toolCallName,
  toolResult,
  args,
  reasoning,
}: ActionMappingOptions): AgentAction[] {
  if (toolCallName === "act") {
    return mapActToolResult(toolResult, args, reasoning);
  }

  if (toolCallName === "fillForm") {
    return mapFillFormToolResult(toolResult, args, reasoning);
  }

  return [createStandardAction(toolCallName, toolResult, args, reasoning)];
}

/**
 * Maps an `act` tool result to a single "act" action built from the call
 * arguments, carrying over `playwrightArguments` from the result when present.
 * Non-object results fall back to the standard action mapping.
 */
function mapActToolResult(
  toolResult: unknown,
  args: Record<string, unknown>,
  reasoning?: string,
): AgentAction[] {
  if (toolResult === null || typeof toolResult !== "object") {
    return [createStandardAction("act", toolResult, args, reasoning)];
  }

  const wrapped = toolResult as Record<string, unknown>;

  // The AI SDK nests the tool's own return value under `output`;
  // use the result itself when that wrapper is absent.
  const payload = (wrapped.output as Record<string, unknown>) || wrapped;

  const mapped: AgentAction = {
    type: "act",
    reasoning,
    taskCompleted: false,
    ...args,
  };

  const { playwrightArguments } = payload;
  if (playwrightArguments) {
    mapped.playwrightArguments = playwrightArguments;
  }

  return [mapped];
}

/**
 * Maps a `fillForm` tool result to a leading "fillForm" action built from the
 * call arguments, followed by one "act" action per entry of the result's
 * `playwrightArguments` array. Non-object results fall back to the standard
 * action mapping.
 */
function mapFillFormToolResult(
  toolResult: unknown,
  args: Record<string, unknown>,
  reasoning?: string,
): AgentAction[] {
  if (toolResult === null || typeof toolResult !== "object") {
    return [createStandardAction("fillForm", toolResult, args, reasoning)];
  }

  const wrapped = toolResult as Record<string, unknown>;

  // The AI SDK nests the tool's own return value under `output`;
  // use the result itself when that wrapper is absent.
  const payload = (wrapped.output as Record<string, unknown>) || wrapped;

  // Anything other than an array contributes no follow-up actions.
  const observed = Array.isArray(payload.playwrightArguments)
    ? payload.playwrightArguments
    : [];

  const formAction: AgentAction = {
    type: "fillForm",
    reasoning,
    taskCompleted: false,
    ...args,
  };

  const fieldActions = Array.from(
    observed,
    (entry): AgentAction => ({
      type: "act",
      reasoning: "acting from fillform tool",
      taskCompleted: false,
      playwrightArguments: entry,
    }),
  );

  return [formAction, ...fieldActions];
}

/**
 * Builds the default AgentAction for a tool call: the tool name as `type`,
 * the call arguments spread on top, and (for most tools) the fields of the
 * tool output merged in after excluded keys are stripped.
 */
function createStandardAction(
  toolCallName: string,
  toolResult: unknown,
  args: Record<string, unknown>,
  reasoning?: string,
): AgentAction {
  // Only the "done" tool can mark the task as completed.
  const taskCompleted =
    toolCallName === "done" ? (args?.taskComplete as boolean) : false;

  const action: AgentAction = {
    type: toolCallName,
    reasoning,
    taskCompleted,
    ...args,
  };

  // Screenshots: note that one was taken instead of carrying the base64
  // payload; the data itself is still available through messages.
  if (toolCallName === "screenshot") {
    action.result = "screenshotTaken";
    return action;
  }

  // The ariaTree output is very large and unnecessary here, so it is skipped,
  // as is any call without a result.
  if (toolCallName === "ariaTree" || !toolResult) {
    return action;
  }

  const { output } = toolResult as { output?: unknown };
  const isPlainObject =
    typeof output === "object" && output !== null && !Array.isArray(output);

  if (isPlainObject) {
    Object.assign(
      action,
      stripExcludedKeys(output as Record<string, unknown>),
    );
  }

  return action;
}


================================================
FILE: packages/core/lib/v3/agent/utils/captchaSolver.ts
================================================
import type { Page } from "../../understudy/page.js";
import type { ConsoleMessage } from "../../understudy/consoleMessage.js";

// Console messages that signal captcha solver progress.
const SOLVING_STARTED = "browserbase-solving-started";
const SOLVING_FINISHED = "browserbase-solving-finished";
const SOLVING_ERRORED = "browserbase-solving-errored";

/** Upper bound (ms) on how long a waiter blocks on an in-progress solve. */
const SOLVE_TIMEOUT_MS = 90_000;

// ---------------------------------------------------------------------------
// Shared captcha notification strings
// ---------------------------------------------------------------------------

/** Message added to the agent message stream once a captcha has been solved. */
export const CAPTCHA_SOLVED_MSG =
  "A captcha was automatically detected and solved — no further interaction with the captcha is needed, even if it does not visually appear solved. Do not click the captcha checkbox, widget, or challenge again. Continue with your task.";

/** Message added to the agent message stream when the solver fails. */
export const CAPTCHA_ERRORED_MSG =
  "A captcha was detected but the automatic captcha solver failed to solve it. You may need to try a different approach or navigate around the captcha.";

/** System prompt addition for DOM/hybrid agents when captchas auto-solve. */
export const CAPTCHA_SYSTEM_PROMPT_NOTE =
  "Captchas on this page are automatically detected and solved by the browser environment. Do not interact with or attempt to solve any captchas yourself — they will be handled for you. Do not click the captcha checkbox, widget, or challenge again after it has been solved, even if it still looks unresolved. Continue with your task as if the captcha does not exist.";

/** System prompt addition for CUA agents when captchas auto-solve. */
export const CAPTCHA_CUA_SYSTEM_PROMPT_NOTE =
  "\n\nCaptchas on this page are automatically detected and solved by the browser environment. Do not interact with or attempt to solve any captchas yourself — they will be handled for you. Continue with your task as if the captcha does not exist.";

/**
 * Follows the Browserbase captcha solver through page console messages and
 * lets agents block on an in-progress solve via `waitIfSolving()`.
 *
 * The page is obtained from a provider callback, so the console listener
 * moves to the new page whenever the active page changes (popup / new tab).
 *
 * Every concurrent `waitIfSolving()` caller awaits one shared promise, so
 * all of them are released together.
 */
export class CaptchaSolver {
  private solving = false;
  private _solvedSinceLastConsume = false;
  private _erroredSinceLastConsume = false;
  private listener: ((msg: ConsoleMessage) => void) | null = null;
  private attachedPage: Page | null = null;
  private pageProvider: (() => Promise<Page>) | null = null;

  /** Promise shared by all callers currently blocked in waitIfSolving(). */
  private waitPromise: Promise<void> | null = null;
  /** Resolver for the shared waitPromise. */
  private resolveWait: (() => void) | null = null;
  /** Handle of the timer that enforces SOLVE_TIMEOUT_MS. */
  private waitTimer: ReturnType<typeof setTimeout> | null = null;

  /**
   * Stores the callback that yields the current active page. Nothing is
   * attached here; the listener is installed lazily by ensureAttached().
   */
  init(pageProvider: () => Promise<Page>): void {
    this.pageProvider = pageProvider;
  }

  /** True while a captcha solve is in progress. */
  isSolving(): boolean {
    return this.solving;
  }

  /**
   * Makes sure the console listener sits on the current active page. When
   * the active page differs from the one attached earlier, the old listener
   * is removed first and a fresh one is installed on the new page.
   */
  async ensureAttached(): Promise<void> {
    if (!this.pageProvider) return;

    const activePage = await this.pageProvider();
    if (this.attachedPage === activePage) return;

    // Drop the listener on the previous page before switching.
    this.detachListener();
    this.attachedPage = activePage;

    const onConsole = (msg: ConsoleMessage): void => {
      switch (msg.text()) {
        case SOLVING_STARTED:
          this.solving = true;
          break;
        case SOLVING_FINISHED:
          this.solving = false;
          this._solvedSinceLastConsume = true;
          this.settle();
          break;
        case SOLVING_ERRORED:
          this.solving = false;
          this._erroredSinceLastConsume = true;
          this.settle();
          break;
        default:
          break;
      }
    };

    this.listener = onConsole;
    activePage.on("console", onConsole);
  }

  /**
   * Resolves right away when no solve is in progress; otherwise blocks until
   * the solver finishes, errors, or SOLVE_TIMEOUT_MS elapses.
   *
   * The listener is first re-attached to the current active page if that
   * page has changed. Concurrent callers all receive the same promise.
   */
  async waitIfSolving(): Promise<void> {
    await this.ensureAttached();

    if (!this.solving) return;

    // Create the shared promise only if no waiter is pending yet.
    if (!this.waitPromise) {
      this.waitPromise = new Promise<void>((resolve) => {
        this.resolveWait = resolve;
        this.waitTimer = setTimeout(() => {
          // Deadline hit: treat the solve as failed and release the waiters.
          this.solving = false;
          this._erroredSinceLastConsume = true;
          this.settle();
        }, SOLVE_TIMEOUT_MS);
      });
    }

    return this.waitPromise;
  }

  /**
   * Reports whether a solve succeeded or errored since the previous call,
   * then clears both flags. Events that happened between two
   * `waitIfSolving()` calls are included.
   */
  consumeSolveResult(): { solved: boolean; errored: boolean } {
    const solved = this._solvedSinceLastConsume;
    const errored = this._erroredSinceLastConsume;

    this._solvedSinceLastConsume = false;
    this._erroredSinceLastConsume = false;

    return { solved, errored };
  }

  /**
   * Removes the console listener and resets every piece of state.
   */
  dispose(): void {
    this.detachListener();
    this.attachedPage = null;
    this.pageProvider = null;
    this.solving = false;
    this._solvedSinceLastConsume = false;
    this._erroredSinceLastConsume = false;
    this.settle();
  }

  // ------------------------------------------------------------------
  // Internal helpers
  // ------------------------------------------------------------------

  /** Unhooks the console listener from the page it is attached to. */
  private detachListener(): void {
    const { attachedPage, listener } = this;
    if (attachedPage && listener) {
      attachedPage.off("console", listener);
    }
    this.listener = null;

    // An interrupted solve is reported as errored (same as the timeout path),
    // and solving is cleared because the detached page can no longer deliver
    // the events that would end it.
    const interrupted = this.solving;
    this.solving = false;
    if (interrupted) {
      this._erroredSinceLastConsume = true;
    }

    this.settle();
  }

  /** Cancels the timeout and releases everyone awaiting the shared promise. */
  private settle(): void {
    if (this.waitTimer) {
      clearTimeout(this.waitTimer);
      this.waitTimer = null;
    }

    const release = this.resolveWait;
    if (!release) return;

    this.resolveWait = null;
    this.waitPromise = null;
    release();
  }
}


================================================
FILE: packages/core/lib/v3/agent/utils/coordinateNormalization.ts
================================================
import type { V3 } from "../../v3.js";

// Default viewport for advancedStealth mode: processCoordinates scales Google
// coordinates against this fixed size instead of v3.configuredViewport when
// v3.isAdvancedStealth is set.
const STEALTH_VIEWPORT = { width: 1288, height: 711 };

/**
 * Reports whether the provider name contains "google" (case-insensitive).
 * A missing or empty provider is never a Google provider.
 */
export function isGoogleProvider(provider?: string): boolean {
  return provider?.toLowerCase().includes("google") ?? false;
}

// Google reports coordinates on a 0-1000 scale. Each axis is clamped to
// 0..999 and then scaled to the matching viewport dimension, rounding down.
export function normalizeGoogleCoordinates(
  x: number,
  y: number,
  viewport: { width: number; height: number },
): { x: number; y: number } {
  const toPixels = (value: number, extent: number): number => {
    const clamped = Math.min(999, Math.max(0, value));
    return Math.floor((clamped / 1000) * extent);
  };

  return {
    x: toPixels(x, viewport.width),
    y: toPixels(y, viewport.height),
  };
}

/**
 * Returns the coordinates to act on for the given provider. Google
 * coordinates are rescaled to the viewport when a V3 instance is supplied;
 * in every other case the input is returned unchanged.
 */
export function processCoordinates(
  x: number,
  y: number,
  provider?: string,
  v3?: V3,
): { x: number; y: number } {
  if (!v3 || !isGoogleProvider(provider)) {
    return { x, y };
  }

  // advancedStealth runs with a fixed viewport; otherwise the configured one applies.
  const viewport = v3.isAdvancedStealth
    ? STEALTH_VIEWPORT
    : v3.configuredViewport;

  return normalizeGoogleCoordinates(x, y, viewport);
}


================================================
FILE: packages/core/lib/v3/agent/utils/cuaKeyMapping.ts
================================================
/**
 * Universal key mapping utility for converting various key representations
 * to Playwright-compatible key names. Used by all CUA clients and handlers.
 */

/**
 * Playwright key names paired with the upper-case spellings that resolve to
 * them. Covers key names used by both the Anthropic and OpenAI CUA APIs.
 */
const KEY_ALIASES: ReadonlyArray<readonly [string, readonly string[]]> = [
  ["Enter", ["ENTER", "RETURN"]],
  ["Escape", ["ESCAPE", "ESC"]],
  ["Backspace", ["BACKSPACE"]],
  ["Tab", ["TAB"]],
  [" ", ["SPACE"]],
  ["Delete", ["DELETE", "DEL"]],
  ["ArrowUp", ["ARROWUP", "ARROW_UP", "UP"]],
  ["ArrowDown", ["ARROWDOWN", "ARROW_DOWN", "DOWN"]],
  ["ArrowLeft", ["ARROWLEFT", "ARROW_LEFT", "LEFT"]],
  ["ArrowRight", ["ARROWRIGHT", "ARROW_RIGHT", "RIGHT"]],
  ["Shift", ["SHIFT"]],
  ["Control", ["CONTROL", "CTRL"]],
  // OPTION is the macOS name for Alt.
  ["Alt", ["ALT", "OPTION"]],
  // COMMAND/CMD: macOS, SUPER: Linux, WINDOWS/WIN: Windows.
  ["Meta", ["META", "COMMAND", "CMD", "SUPER", "WINDOWS", "WIN"]],
  ["Home", ["HOME"]],
  ["End", ["END"]],
  ["PageUp", ["PAGEUP", "PAGE_UP", "PGUP"]],
  ["PageDown", ["PAGEDOWN", "PAGE_DOWN", "PGDN"]],
];

/**
 * Flat lookup from upper-case key spelling to Playwright key name,
 * expanded from KEY_ALIASES.
 */
const KEY_MAP: Record<string, string> = {};
for (const [playwrightKey, aliases] of KEY_ALIASES) {
  for (const alias of aliases) {
    KEY_MAP[alias] = playwrightKey;
  }
}

/**
 * Translates a key name to its Playwright-compatible form.
 * Matching ignores case; names without a mapping are returned unchanged.
 * @param key The key name in any supported format
 * @returns The Playwright-compatible key name
 */
export function mapKeyToPlaywright(key: string): string {
  if (!key) return key;

  const mapped = KEY_MAP[key.toUpperCase()];
  return mapped ? mapped : key;
}


================================================
FILE: packages/core/lib/v3/agent/utils/googleCustomToolHandler.ts
================================================
import { Part, FunctionCall, FunctionDeclaration, Type } from "@google/genai";
import { ToolSet } from "ai";
import { LogLine } from "../../types/public/logs.js";
import { toJsonSchema } from "../../zodCompat.js";
import type { StagehandZodSchema } from "../../zodCompat.js";

/**
 * Result of executing a custom tool for Google CUA
 */
export interface CustomToolExecutionResult {
  /**
   * `functionResponse` part naming the tool. `executeGoogleCustomTool` puts the
   * JSON-stringified tool result under `response.result`, or the error message
   * under `response.error` when execution failed.
   */
  functionResponse: Part;
  /** `true` when the tool ran to completion, `false` when an error was caught. */
  success: boolean;
}

/**
 * Execute a custom tool and format the response for Google's API
 * This handles tool execution, result formatting, and error handling
 * specific to Google's function response format
 *
 * Never rejects: any failure (unknown tool, tool without an `execute`
 * function, or an error thrown during execution) is logged at level 0 and
 * returned as a `functionResponse` carrying `response.error`.
 *
 * @param toolName - Name of the tool to run; must be an own key of `tools`.
 * @param toolArgs - Arguments passed to the tool's `execute` function.
 * @param tools - The registered custom tools.
 * @param functionCall - The originating function call. Not read by this
 *   function; kept so existing callers keep working.
 * @param logger - Receives progress and error log lines.
 * @returns The function response part plus a success flag.
 */
export async function executeGoogleCustomTool(
  toolName: string,
  toolArgs: Record<string, unknown>,
  tools: ToolSet,
  functionCall: FunctionCall,
  logger: (message: LogLine) => void,
): Promise<CustomToolExecutionResult> {
  try {
    logger({
      category: "agent",
      message: `Executing custom tool: ${toolName} with args: ${JSON.stringify(toolArgs)}`,
      level: 1,
    });

    // Own-property lookup only: names such as "toString" must not resolve to
    // members inherited from Object.prototype.
    const tool = Object.prototype.hasOwnProperty.call(tools, toolName)
      ? tools[toolName]
      : undefined;
    if (!tool || typeof tool.execute !== "function") {
      throw new Error(
        `Custom tool "${toolName}" is not registered or has no execute function`,
      );
    }

    const toolResult = await tool.execute(toolArgs, {
      toolCallId: `tool_${Date.now()}`,
      messages: [],
    });

    logger({
      category: "agent",
      message: `Tool ${toolName} completed successfully. Result: ${JSON.stringify(toolResult)}`,
      level: 1,
    });

    // Create function response with the result
    const functionResponsePart: Part = {
      functionResponse: {
        name: toolName,
        response: {
          result: JSON.stringify(toolResult),
        },
      },
    };

    return {
      functionResponse: functionResponsePart,
      success: true,
    };
  } catch (toolError) {
    const errorMessage =
      toolError instanceof Error ? toolError.message : String(toolError);

    logger({
      category: "agent",
      message: `Error executing custom tool ${toolName}: ${errorMessage}`,
      level: 0,
    });

    // Create error function response
    const functionResponsePart: Part = {
      functionResponse: {
        name: toolName,
        response: {
          error: errorMessage,
        },
      },
    };

    return {
      functionResponse: functionResponsePart,
      success: false,
    };
  }
}

/**
 * Check if a function call is a custom tool
 *
 * A call counts as custom only when its name is an own key of `tools`.
 * Members inherited from Object.prototype (e.g. "toString", "constructor")
 * never match.
 *
 * @param functionCall - The function call returned by the model.
 * @param tools - The registered custom tools, if any.
 * @returns `true` when `tools` has an own entry for the call's name.
 */
export function isCustomTool(
  functionCall: FunctionCall,
  tools?: ToolSet,
): boolean {
  const name = functionCall.name;
  if (!tools || !name) return false;
  return Object.prototype.hasOwnProperty.call(tools, name);
}

/**
 * Builds Google FunctionDeclaration entries for every tool in a ToolSet.
 * Tools whose conversion yields null are left out of the returned array.
 */
export function convertToolSetToFunctionDeclarations(
  tools: ToolSet,
): FunctionDeclaration[] {
  return Object.entries(tools).reduce<FunctionDeclaration[]>(
    (declarations, [name, tool]) => {
      const declaration = convertToolToFunctionDeclaration(name, tool);
      if (declaration) {
        declarations.push(declaration);
      }
      return declarations;
    },
    [],
  );
}

/**
 * Turns one ToolSet entry into a Google FunctionDeclaration.
 * Returns null (after reporting through console.error) when the tool's
 * input schema cannot be converted.
 */
function convertToolToFunctionDeclaration(
  name: string,
  tool: { description?: string; inputSchema: unknown },
): FunctionDeclaration | null {
  try {
    // Zod schema -> JSON schema -> Google parameter format.
    const jsonSchema = toJsonSchema(
      tool.inputSchema as StagehandZodSchema,
    ) as {
      properties?: Record<string, unknown>;
      required?: string[];
      type?: string;
    };
    const parameters = convertJsonSchemaToGoogleParameters(jsonSchema);

    // Fall back to a generic description when the tool provides none.
    const description = tool.description || `Execute ${name}`;

    return { name, description, parameters };
  } catch (error) {
    console.error(
      `Error converting tool ${name} to function declaration:`,
      error,
    );
    return null;
  }
}

/**
 * Convert JSON schema to Google's parameter format
 *
 * Only the top-level properties are translated: each becomes a Google type
 * plus its description when present. Array properties also receive an
 * `items` schema derived from the JSON schema's `items.type` (STRING when
 * that type is absent), so the element type is not silently dropped.
 *
 * @param schema - JSON schema of the tool input (an object schema).
 * @returns An OBJECT parameter schema; `required` is included only when the
 *   source schema lists at least one required property.
 */
function convertJsonSchemaToGoogleParameters(schema: {
  properties?: Record<string, unknown>;
  required?: string[];
  type?: string;
}): {
  type: Type;
  properties: Record<
    string,
    { type: Type; description?: string; items?: { type: Type } }
  >;
  required?: string[];
} {
  const properties: Record<
    string,
    { type: Type; description?: string; items?: { type: Type } }
  > = {};

  if (schema.properties) {
    for (const [key, value] of Object.entries(schema.properties)) {
      const propSchema = value as {
        type?: string;
        description?: string;
        items?: { type?: string };
      };

      // Properties without a declared type are treated as strings.
      const googleType = mapJsonTypeToGoogleType(propSchema.type || "string");
      const property: {
        type: Type;
        description?: string;
        items?: { type: Type };
      } = { type: googleType };

      if (propSchema.description) {
        property.description = propSchema.description;
      }

      // Arrays need an element schema; default the element type to string
      // when the JSON schema does not state one.
      if (googleType === Type.ARRAY) {
        property.items = {
          type: mapJsonTypeToGoogleType(propSchema.items?.type || "string"),
        };
      }

      properties[key] = property;
    }
  }

  return {
    type: Type.OBJECT,
    properties,
    ...(schema.required && schema.required.length > 0
      ? { required: schema.required }
      : {}),
  };
}

/**
 * Translates a JSON schema type name (case-insensitive) into Google's Type
 * enum. "number" and "integer" both become NUMBER; unrecognised names fall
 * back to STRING.
 */
function mapJsonTypeToGoogleType(jsonType: string): Type {
  const normalized = jsonType.toLowerCase();

  if (normalized === "number" || normalized === "integer") {
    return Type.NUMBER;
  }
  if (normalized === "boolean") {
    return Type.BOOLEAN;
  }
  if (normalized === "array") {
    return Type.ARRAY;
  }
  if (normalized === "object") {
    return Type.OBJECT;
  }

  // Covers "string" itself as well as any unknown type name.
  return Type.STRING;
}


================================================
FILE: packages/core/lib/v3/agent/utils/handleDoneToolCall.ts
================================================
import { generateText, ModelMessage, LanguageModel, ToolSet } from "ai";
import { z } from "zod";
import { tool } from "ai";
import { LogLine } from "../../types/public/logs.js";
import { StagehandZodObject } from "../../zodCompat.js";
import { getZFactory } from "../../../utils.js";
import type { StagehandZodSchema } from "../../zodCompat.js";

/** Outcome of the forced final `done` call, as returned by `handleDoneToolCall`. */
interface DoneResult {
  /**
   * The `reasoning` argument of the done call. When the model produced no done
   * call, this is the model's plain text or a fixed fallback string.
   */
  reasoning: string;
  /** The `taskComplete` argument of the done call; `false` when no done call was produced. */
  taskComplete: boolean;
  /** The final-assessment user prompt followed by the model's response messages, if any. */
  messages: ModelMessage[];
  /** The `output` argument of the done call, when present. */
  output?: Record<string, unknown>;
}

/**
 * Creates the schema every `done` call shares (a reasoning summary and a
 * completion flag) using the supplied Zod factory.
 */
function buildBaseDoneSchema(factory: typeof z) {
  const reasoning = factory
    .string()
    .describe("Brief summary of what actions were taken and the outcome");

  const taskComplete = factory
    .boolean()
    .describe("true if the task was fully completed, false otherwise");

  return factory.object({ reasoning, taskComplete });
}

/**
 * Forces a final `done` tool call once an agent run is over, so the caller
 * always receives a structured closing response even when the main loop
 * stopped without calling done.
 *
 * When `outputSchema` is given, the done tool additionally requires an
 * `output` object matching it, and the prompts ask the model for that data.
 *
 * @returns The model's reasoning and completion flag, the messages produced
 *   by this exchange, and the requested output when available. If the model
 *   made no done call, the task is reported as not complete.
 */
export async function handleDoneToolCall(options: {
  model: LanguageModel;
  inputMessages: ModelMessage[];
  instruction: string;
  outputSchema?: StagehandZodObject;
  logger: (message: LogLine) => void;
}): Promise<DoneResult> {
  const { model, inputMessages, instruction, outputSchema, logger } = options;

  logger({
    category: "agent",
    message: "Agent calling tool: done",
    level: 1,
  });

  // Build with the Zod version the user's outputSchema came from, so v3 and
  // v4 schemas are never mixed.
  const zodFactory = outputSchema
    ? getZFactory(outputSchema as StagehandZodSchema)
    : z;
  const baseSchema = buildBaseDoneSchema(zodFactory);

  // With an output schema, the done tool also takes the requested data.
  const doneToolSchema = outputSchema
    ? baseSchema.extend({
        output: outputSchema.describe(
          "The specific data the user requested from this task",
        ),
      })
    : baseSchema;

  // Defaults apply when no output was requested.
  let outputInstructions = "";
  let outputStep = "";
  let toolDescription = "Complete the task with your final assessment.";
  let finalRequest = "Provide your final assessment.";

  if (outputSchema) {
    // Field name -> description, shown to the model as a JSON listing.
    const requestedFields = Object.fromEntries(
      Object.entries(outputSchema.shape).map(
        ([key, value]: [string, StagehandZodSchema]) => [
          key,
          value.description || "no description",
        ],
      ),
    );
    outputInstructions = `\n\nThe user also requested the following information from this task. Provide it in the "output" field:\n${JSON.stringify(
      requestedFields,
      null,
      2,
    )}`;
    outputStep = "\n3. The requested output data based on what you found";
    toolDescription =
      "Complete the task with your assessment and the requested output data.";
    finalRequest =
      "Provide your final assessment and the requested output data.";
  }

  const systemPrompt = `You are a web automation assistant that was tasked with completing a task.

The task was:
"${instruction}"

Review what was accomplished and provide your final assessment in whether the task was completed successfully. you have been provided with the history of the actions taken so far, use this to determine if the task was completed successfully.${outputInstructions}

Call the "done" tool with:
1. A brief summary of what was done
2. Whether the task was completed successfully${outputStep}`;

  const doneTool = tool({
    description: toolDescription,
    inputSchema: doneToolSchema,
    execute: async (params) => ({ success: true, ...params }),
  });

  const userPrompt: ModelMessage = {
    role: "user",
    content: finalRequest,
  };

  // toolChoice pins the model to the done tool for this call.
  const result = await generateText({
    model,
    system: systemPrompt,
    messages: [...inputMessages, userPrompt],
    tools: { done: doneTool } as ToolSet,
    toolChoice: { type: "tool", toolName: "done" },
    providerOptions: {
      google: { mediaResolution: "MEDIA_RESOLUTION_HIGH" },
      openai: { store: false },
    },
  });

  const doneCall = result.toolCalls.find((call) => call.toolName === "done");
  const outputMessages: ModelMessage[] = [
    userPrompt,
    ...(result.response?.messages || []),
  ];

  if (doneCall) {
    const input = doneCall.input as {
      reasoning: string;
      taskComplete: boolean;
      output?: Record<string, unknown>;
    };
    logger({
      category: "agent",
      message: "Task completed",
      level: 1,
    });

    return {
      reasoning: input.reasoning,
      taskComplete: input.taskComplete,
      messages: outputMessages,
      output: input.output,
    };
  }

  // No done call came back: report the run as not complete.
  return {
    reasoning: result.text || "Task execution completed",
    taskComplete: false,
    messages: outputMessages,
  };
}


================================================
FILE: packages/core/lib/v3/agent/utils/imageCompression.ts
================================================
import {
  AnthropicMessage,
  AnthropicContentBlock,
  AnthropicToolResult,
  ResponseInputItem as OpenAIResponseInputItem,
} from "../../types/public/agent.js";
import type {
  Content as GoogleContent,
  Part as GooglePart,
} from "@google/genai";

/**
 * Anthropic-format conversation entry: either a message or a tool result.
 * This is the same union as `AnthropicResponseInputItem` below.
 */
export type ResponseInputItem = AnthropicMessage | AnthropicToolResult;

/**
 * Shape assumed for entries of a Google function response's `response.data`
 * array. The helpers in this module only inspect `inlineData.mimeType`.
 */
interface FunctionResponseData {
  inlineData?: {
    mimeType?: string;
    data?: string;
  };
}
/** Anthropic-format conversation entry (same union as `ResponseInputItem`). */
export type AnthropicResponseInputItem = AnthropicMessage | AnthropicToolResult;
/** Union of the Anthropic, OpenAI and Google conversation entry formats. */
export type SupportedInputItem =
  | AnthropicResponseInputItem
  | OpenAIResponseInputItem
  | GoogleContent;

/**
 * Locates conversation entries whose tool results carry image blocks.
 *
 * An entry is reported only when its `content` is an array that holds a
 * `tool_result` block whose own `content` is an array with at least one
 * `image` block. Images located anywhere else are not reported.
 *
 * @param items - Conversation history to scan
 * @returns Indices into `items`, in ascending order, of entries with images
 */
export function findItemsWithImages(items: ResponseInputItem[]): number[] {
  // True for a tool_result block that wraps at least one image block.
  const isImageToolResult = (block: AnthropicContentBlock): boolean =>
    block.type === "tool_result" &&
    "content" in block &&
    Array.isArray(block.content) &&
    (block.content as AnthropicContentBlock[]).some(
      (inner: AnthropicContentBlock) => inner.type === "image",
    );

  return items.reduce<number[]>((found, entry, position) => {
    if (Array.isArray(entry.content) && entry.content.some(isImageToolResult)) {
      found.push(position);
    }
    return found;
  }, []);
}

/**
 * Strips images from older conversation entries, in place, so that only the
 * newest image-bearing entries keep their screenshots.
 *
 * Every `tool_result` block that wraps an image in an older entry has its
 * whole `content` replaced by the string "screenshot taken".
 *
 * @param items - Conversation history; entries are mutated in place
 * @param keepMostRecentCount - How many of the most recent image-bearing entries stay untouched (default: 2)
 * @returns Object wrapping the same `items` array that was passed in
 */
export function compressConversationImages(
  items: ResponseInputItem[],
  keepMostRecentCount: number = 2,
): { items: ResponseInputItem[] } {
  const imagePositions = findItemsWithImages(items);

  // Image-bearing entries ranked below this threshold are old enough to compress.
  const compressBelowRank = imagePositions.length - keepMostRecentCount;
  const stalePositions = new Set(
    imagePositions.filter((_position, rank) => rank < compressBelowRank),
  );

  const wrapsImage = (block: AnthropicContentBlock): boolean =>
    block.type === "tool_result" &&
    "content" in block &&
    Array.isArray(block.content) &&
    (block.content as AnthropicContentBlock[]).some(
      (inner: AnthropicContentBlock) => inner.type === "image",
    );

  items.forEach((entry, position) => {
    if (!stalePositions.has(position) || !Array.isArray(entry.content)) {
      return;
    }
    entry.content = entry.content.map((block: AnthropicContentBlock) =>
      wrapsImage(block)
        ? ({ ...block, content: "screenshot taken" } as AnthropicContentBlock)
        : block,
    );
  });

  return { items };
}

/**
 * Finds all items in the conversation history that contain images (Google format).
 *
 * A part counts as image-bearing when ANY of these holds an entry whose
 * `inlineData.mimeType` starts with "image/":
 * - `functionResponse.response.data` (only inspected when it is an array)
 * - `functionResponse.parts`
 * - the part's own `inlineData`
 *
 * All three locations are always checked; an image-free `response.data`
 * no longer hides images stored in `functionResponse.parts`.
 *
 * @param items - Array of conversation items to check
 * @returns Array of indices (ascending) where images were found
 */
export function findGoogleItemsWithImages(items: GoogleContent[]): number[] {
  // Accepts anything so that malformed entries (null, strings, ...) simply count as "no image".
  const isImage = (candidate: unknown): boolean => {
    const mimeType = (
      candidate as { inlineData?: { mimeType?: unknown } } | null | undefined
    )?.inlineData?.mimeType;
    return typeof mimeType === "string" && mimeType.startsWith("image/");
  };

  const partHasImage = (part: GooglePart): boolean => {
    // `response` is a free-form record, so `data` is not guaranteed to be an array.
    const responseData: unknown = part.functionResponse?.response?.data;
    if (Array.isArray(responseData) && responseData.some(isImage)) {
      return true;
    }
    if (part.functionResponse?.parts?.some(isImage)) {
      return true;
    }
    return isImage(part);
  };

  const itemsWithImages: number[] = [];
  items.forEach((item, index) => {
    if (Array.isArray(item.parts) && item.parts.some(partHasImage)) {
      itemsWithImages.push(index);
    }
  });
  return itemsWithImages;
}

/**
 * Locates OpenAI-format conversation entries that carry a screenshot.
 *
 * An entry is reported when it is a `computer_call_output` whose `output`
 * has `type === "input_image"` and a non-empty `image_url`.
 *
 * @param items - Conversation history to scan
 * @returns Indices into `items`, in ascending order, of entries with images
 */
export function findOpenAIItemsWithImages(
  items: OpenAIResponseInputItem[],
): number[] {
  const carriesScreenshot = (entry: OpenAIResponseInputItem): boolean => {
    if (
      !("type" in entry) ||
      entry.type !== "computer_call_output" ||
      !("output" in entry)
    ) {
      return false;
    }
    const payload = entry.output as unknown as {
      type: string;
      image_url: string;
    };
    return payload?.type === "input_image" && Boolean(payload?.image_url);
  };

  return items.reduce<number[]>((found, entry, position) => {
    if (carriesScreenshot(entry)) {
      found.push(position);
    }
    return found;
  }, []);
}

/**
 * Strips screenshots from older OpenAI-format entries, in place, keeping
 * only the newest image-bearing entries intact.
 *
 * For each older `computer_call_output` whose `output.type` is
 * "input_image", the whole `output` is replaced by the string
 * "screenshot taken".
 *
 * @param items - Conversation history; entries are mutated in place
 * @param keepMostRecentCount - How many of the most recent image-bearing entries stay untouched (default: 2)
 * @returns Object wrapping the same `items` array that was passed in
 */
export function compressOpenAIConversationImages(
  items: OpenAIResponseInputItem[],
  keepMostRecentCount: number = 2,
): { items: OpenAIResponseInputItem[] } {
  const imagePositions = findOpenAIItemsWithImages(items);

  // Image-bearing entries ranked below this threshold are old enough to compress.
  const compressBelowRank = imagePositions.length - keepMostRecentCount;
  const stalePositions = new Set(
    imagePositions.filter((_position, rank) => rank < compressBelowRank),
  );

  items.forEach((entry, position) => {
    if (!stalePositions.has(position)) {
      return;
    }
    if (
      !("type" in entry) ||
      entry.type !== "computer_call_output" ||
      !("output" in entry)
    ) {
      return;
    }
    const payload = entry.output as unknown as { type: string };
    if (payload?.type === "input_image") {
      // Swap the image payload for a short textual marker.
      (entry as unknown as { output: string }).output = "screenshot taken";
    }
  });

  return { items };
}

/**
 * Compresses Google conversation history by removing images from older items
 * while keeping the most recent images intact.
 *
 * For each older image-bearing item, every part is rewritten as follows:
 * - a `functionResponse` holding images in `response.data` and/or `parts`
 *   has those image entries removed from BOTH locations and gains
 *   `response.compressed = "screenshot taken"`;
 * - a direct inline image part becomes `{ text: "screenshot taken" }`;
 * - any other part is left untouched.
 *
 * The image payload is removed from `response.data` itself. Previously an
 * empty `data` array was attached to `functionResponse` while the original
 * `response.data` (with the images) was copied through unchanged.
 *
 * @param items - Array of conversation items to process (mutated in place)
 * @param keepMostRecentCount - Number of most recent image-containing items to preserve (default: 2)
 * @returns Object with processed items
 */
export function compressGoogleConversationImages(
  items: GoogleContent[],
  keepMostRecentCount: number = 2,
): { items: GoogleContent[] } {
  const itemsWithImages = findGoogleItemsWithImages(items);

  // Image-bearing items ranked below this threshold are old enough to compress.
  const compressBelowRank = itemsWithImages.length - keepMostRecentCount;
  const staleIndices = new Set(
    itemsWithImages.filter((_index, rank) => rank < compressBelowRank),
  );

  // Accepts anything so that malformed entries simply count as "no image".
  const isImage = (candidate: unknown): boolean => {
    const mimeType = (
      candidate as { inlineData?: { mimeType?: unknown } } | null | undefined
    )?.inlineData?.mimeType;
    return typeof mimeType === "string" && mimeType.startsWith("image/");
  };

  items.forEach((item, index) => {
    if (!staleIndices.has(index) || !Array.isArray(item.parts)) {
      return;
    }

    item.parts = item.parts.map((part: GooglePart) => {
      const functionResponse = part.functionResponse;

      if (functionResponse) {
        // `response` is a free-form record, so `data` may be absent or not an array.
        const rawData: unknown = functionResponse.response?.data;
        const dataEntries: unknown[] | undefined = Array.isArray(rawData)
          ? rawData
          : undefined;
        const responseParts = functionResponse.parts;

        const dataHasImage = dataEntries?.some(isImage) ?? false;
        const partsHaveImage = responseParts?.some(isImage) ?? false;

        if (dataHasImage || partsHaveImage) {
          return {
            ...part,
            functionResponse: {
              ...functionResponse,
              ...(partsHaveImage && responseParts
                ? {
                    parts: responseParts.filter(
                      (responsePart) => !isImage(responsePart),
                    ),
                  }
                : {}),
              response: {
                ...functionResponse.response,
                // Override the copied `data` so the image payload is actually dropped.
                ...(dataHasImage && dataEntries
                  ? { data: dataEntries.filter((entry) => !isImage(entry)) }
                  : {}),
                compressed: "screenshot taken",
              },
            },
          };
        }
      }

      // Replace direct inline data images
      if (isImage(part)) {
        return {
          text: "screenshot taken",
        };
      }
      return part;
    });
  });

  return {
    items,
  };
}


================================================
FILE: packages/core/lib/v3/agent/utils/messageProcessing.ts
================================================
import type { ModelMessage } from "ai";

// Vision action tools that include screenshots in their results.
// isVisionActionPart matches a tool result's `toolName` against this list;
// the dedicated "screenshot" tool is matched separately by isScreenshotPart.
const VISION_ACTION_TOOLS = [
  "click",
  "type",
  "dragAndDrop",
  "wait",
  "fillFormVision",
  "scroll",
];

/**
 * Type guard for tool messages: a non-null object whose `role` is "tool"
 * and whose `content` is an array.
 */
function isToolMessage(
  message: unknown,
): message is { role: "tool"; content: unknown[] } {
  if (!message || typeof message !== "object") {
    return false;
  }
  const candidate = message as { role?: unknown; content?: unknown };
  return candidate.role === "tool" && Array.isArray(candidate.content);
}

/** True when `part` is a non-null object whose `toolName` is "screenshot". */
function isScreenshotPart(part: unknown): boolean {
  if (!part || typeof part !== "object") {
    return false;
  }
  const { toolName } = part as { toolName?: unknown };
  return toolName === "screenshot";
}

/**
 * True when `part` is an object whose string `toolName` is one of the
 * names listed in VISION_ACTION_TOOLS.
 */
function isVisionActionPart(part: unknown): boolean {
  const toolName =
    part && typeof part === "object"
      ? (part as { toolName?: unknown }).toolName
      : undefined;
  return typeof toolName === "string" && VISION_ACTION_TOOLS.includes(toolName);
}

/** True for either a screenshot tool result or a vision action tool result. */
function isVisionPart(part: unknown): boolean {
  if (isScreenshotPart(part)) {
    return true;
  }
  return isVisionActionPart(part);
}

/** True when `part` is a non-null object whose `toolName` is "ariaTree". */
function isAriaTreePart(part: unknown): boolean {
  return typeof part === "object" && part !== null
    ? (part as { toolName?: unknown }).toolName === "ariaTree"
    : false;
}

/**
 * Shrinks stale screenshot and ariaTree payloads inside `messages`, in place.
 *
 * Policy:
 * - Vision results (the screenshot tool plus vision action tools such as
 *   click/type) are kept only in the 2 most recent tool messages containing them.
 * - ariaTree results are kept only in the single most recent tool message
 *   containing one; older ones are replaced with a placeholder.
 *
 * @param messages - The messages array to modify in-place
 * @returns How many tool messages were handed to a compressor; a message
 *   that is stale for both vision and ariaTree is counted twice
 */
export function processMessages(messages: ModelMessage[]): number {
  const visionPositions: number[] = [];
  const ariaTreePositions: number[] = [];

  // Single scan: remember where vision and ariaTree tool results live.
  messages.forEach((candidate, position) => {
    if (!isToolMessage(candidate)) {
      return;
    }
    const parts = candidate.content as unknown[];
    if (parts.some(isVisionPart)) {
      visionPositions.push(position);
    }
    if (parts.some(isAriaTreePart)) {
      ariaTreePositions.push(position);
    }
  });

  let compressedCount = 0;

  // Everything except the last two vision-bearing messages is stale.
  const staleVision =
    visionPositions.length > 2 ? visionPositions.slice(0, -2) : [];
  for (const position of staleVision) {
    const stale = messages[position];
    if (!isToolMessage(stale)) {
      continue;
    }
    // Each compressor only touches its own kind of part, so running both is safe.
    compressScreenshotMessage(stale);
    compressVisionActionMessage(stale);
    compressedCount += 1;
  }

  // Everything except the last ariaTree-bearing message is stale.
  const staleAriaTrees =
    ariaTreePositions.length > 1 ? ariaTreePositions.slice(0, -1) : [];
  for (const position of staleAriaTrees) {
    const stale = messages[position];
    if (!isToolMessage(stale)) {
      continue;
    }
    compressAriaTreeMessage(stale);
    compressedCount += 1;
  }

  return compressedCount;
}

/**
 * Tool result part structure from AI SDK.
 * The output field uses a discriminated union - type determines value format:
 * - type: "content" -> value: Array<{type: "text", ...} | {type: "media", ...}>
 * - type: "text" -> value: string
 * - type: "json" -> value: JSONValue
 * - type: "error-text" -> value: string
 * - type: "error-json" -> value: JSONValue
 *
 * Only the `output` field is modelled here because it is the only field the
 * compress* helpers in this file read or replace.
 */
interface ToolResultPart {
  output?: {
    /** Discriminator; the helpers here only rewrite outputs whose type is "content". */
    type: string;
    /** Payload whose shape depends on `type`; kept as `unknown` and narrowed at use. */
    value?: unknown;
  };
}

/**
 * Reports whether a tool output uses the "content" variant, i.e. the one
 * whose value is expected to be an array of content entries.
 * Only the `type` discriminator is checked; `value` is not inspected.
 */
function isContentTypeOutput(output: {
  type: string;
  value?: unknown;
}): boolean {
  const { type } = output;
  return type === "content";
}

/**
 * Replaces, in place, the output of every screenshot part in `message`
 * with a single text entry reading "screenshot taken".
 * Parts without an output, or whose output type is not "content", are left
 * alone so the result stays schema-valid. The whole output object is swapped
 * so that type and value always agree.
 */
function compressScreenshotMessage(message: {
  role: "tool";
  content: unknown[];
}): void {
  message.content.filter(isScreenshotPart).forEach((part) => {
    const toolResult = part as ToolResultPart;
    if (!toolResult.output || !isContentTypeOutput(toolResult.output)) {
      return;
    }
    toolResult.output = {
      type: "content",
      value: [{ type: "text", text: "screenshot taken" }],
    };
  });
}

/**
 * Drops, in place, the media entries from every vision action part in
 * `message` while preserving the remaining entries (e.g. the action's text result).
 * A part is rewritten only when its output type is "content" and its value
 * is an array; non-object entries in that array are dropped as well.
 */
function compressVisionActionMessage(message: {
  role: "tool";
  content: unknown[];
}): void {
  message.content.forEach((part) => {
    if (!isVisionActionPart(part)) {
      return;
    }
    const toolResult = part as ToolResultPart;
    const output = toolResult.output;
    if (
      !output ||
      !isContentTypeOutput(output) ||
      !Array.isArray(output.value)
    ) {
      return;
    }

    const withoutMedia = (output.value as Array<{ type?: string }>).filter(
      (entry) =>
        Boolean(entry) && typeof entry === "object" && entry.type !== "media",
    );
    // Swap the whole output so type and value stay consistent.
    toolResult.output = {
      type: "content",
      value: withoutMedia,
    };
  });
}

/**
 * Replaces, in place, the output of every ariaTree part in `message` with a
 * short text placeholder.
 * Parts without an output, or whose output type is not "content", are left
 * alone so the result stays schema-valid. The whole output object is swapped
 * so that type and value always agree.
 */
function compressAriaTreeMessage(message: {
  role: "tool";
  content: unknown[];
}): void {
  message.content.filter(isAriaTreePart).forEach((part) => {
    const toolResult = part as ToolResultPart;
    if (!toolResult.output || !isContentTypeOutput(toolResult.output)) {
      return;
    }
    toolResult.output = {
      type: "content",
      value: [
        {
          type: "text",
          text: "ARIA tree extracted for context of page elements",
        },
      ],
    };
  });
}


================================================
FILE: packages/core/lib/v3/agent/utils/screenshotHandler.ts
================================================
import type { Page } from "../../understudy/page.js";

/**
 * Default delay in milliseconds to wait after vision actions before capturing screenshot.
 * Allows the page to settle after interactions.
 * Used as the default value of `delayMs` in waitAndCaptureScreenshot.
 */
const DEFAULT_DELAY_MS = 500;

/**
 * Optionally pauses, then captures a viewport (non-full-page) screenshot
 * and returns it base64-encoded.
 *
 * A failing capture (e.g., page closed, navigation in progress) is swallowed
 * and reported as `undefined`, so the surrounding action can still succeed.
 * The initial wait is not covered by that error handling.
 *
 * @param page - The page to capture
 * @param delayMs - Delay before capturing (default: 500ms, pass 0 to skip delay)
 * @returns Base64 screenshot data, or `undefined` when the capture failed
 */
export async function waitAndCaptureScreenshot(
  page: Page,
  delayMs: number = DEFAULT_DELAY_MS,
): Promise<string | undefined> {
  const shouldSettle = delayMs > 0;
  if (shouldSettle) {
    await page.waitForTimeout(delayMs);
  }

  let encoded: string | undefined;
  try {
    const image = await page.screenshot({ fullPage: false });
    encoded = image.toString("base64");
  } catch {
    encoded = undefined;
  }
  return encoded;
}


================================================
FILE: packages/core/lib/v3/agent/utils/validateExperimentalFeatures.ts
================================================
import {
  ExperimentalNotConfiguredError,
  StagehandInvalidArgumentError,
} from "../../types/public/sdkErrors.js";
import type {
  AgentConfig,
  AgentExecuteOptionsBase,
} from "../../types/public/index.js";

/** Input to validateExperimentalFeatures. */
export interface AgentValidationOptions {
  /** Whether experimental mode is enabled; when true the experimental-feature gate is skipped */
  isExperimental: boolean;
  /** Agent config options (integrations, tools, stream, cua, etc.) */
  agentConfig?: Partial<AgentConfig>;
  /** Execute options (callbacks, signal, messages, etc.); `null` is treated like "not provided" */
  executeOptions?:
    | (Partial<AgentExecuteOptionsBase> & { callbacks?: unknown })
    | null;
  /**
   * Whether this is streaming mode (can be derived from agentConfig.stream).
   * Only consulted by the non-CUA experimental gate; the CUA check looks at
   * agentConfig.stream alone.
   */
  isStreaming?: boolean;
}

/**
 * Guards agent configuration against unsupported or not-yet-enabled features.
 *
 * Two checks run in order:
 * 1. CUA mode (`mode: "cua"`, or the deprecated `cua: true` when `mode` is
 *    unset) rejects streaming, abort signal, message continuation,
 *    excludeTools, output schema and variables outright.
 * 2. Unless `isExperimental` is true, these require experimental mode:
 *    integrations / custom tools (any mode) and, for non-CUA agents only,
 *    streaming, callbacks, abort signal, message continuation, excludeTools,
 *    output schema and variables.
 *
 * Empty `integrations`, `tools`, `excludeTools` and `variables` do not count
 * as using the feature.
 *
 * Throws StagehandInvalidArgumentError for configurations CUA mode does not support.
 * Throws ExperimentalNotConfiguredError if experimental features are used without experimental mode.
 */
export function validateExperimentalFeatures(
  options: AgentValidationOptions,
): void {
  const { isExperimental, agentConfig, executeOptions, isStreaming } = options;

  // An explicit `mode` wins; the deprecated `cua` flag is only a fallback.
  const isCuaMode =
    agentConfig?.mode === undefined
      ? agentConfig?.cua === true
      : agentConfig?.mode === "cua";

  // Execute-option features that both checks report, in reporting order.
  const requestedExecuteFeatures: string[] = [];
  if (executeOptions?.signal) {
    requestedExecuteFeatures.push("abort signal");
  }
  if (executeOptions?.messages) {
    requestedExecuteFeatures.push("message continuation");
  }
  const excludedTools = executeOptions?.excludeTools;
  if (excludedTools && excludedTools.length > 0) {
    requestedExecuteFeatures.push("excludeTools");
  }
  if (executeOptions?.output) {
    requestedExecuteFeatures.push("output schema");
  }
  const suppliedVariables = executeOptions?.variables;
  if (suppliedVariables && Object.keys(suppliedVariables).length > 0) {
    requestedExecuteFeatures.push("variables");
  }

  // CUA: these features are unavailable regardless of experimental mode.
  if (isCuaMode) {
    const unsupported = agentConfig?.stream
      ? ["streaming", ...requestedExecuteFeatures]
      : [...requestedExecuteFeatures];

    if (unsupported.length > 0) {
      const verb = unsupported.length === 1 ? "is" : "are";
      throw new StagehandInvalidArgumentError(
        `${unsupported.join(", ")} ${verb} not supported with CUA (Computer Use Agent) mode.`,
      );
    }
  }

  // Nothing is gated once experimental mode is on.
  if (isExperimental) return;

  const gated: string[] = [];

  const integrations = agentConfig?.integrations;
  const tools = agentConfig?.tools;
  const usesIntegrations = integrations && integrations.length > 0;
  const usesTools = tools && Object.keys(tools).length > 0;
  if (usesIntegrations || usesTools) {
    gated.push("MCP integrations and custom tools");
  }

  // The remaining gates only apply to non-CUA agents.
  if (!isCuaMode) {
    if (isStreaming || agentConfig?.stream) {
      gated.push("streaming");
    }
    if (executeOptions?.callbacks) {
      gated.push("callbacks");
    }
    gated.push(...requestedExecuteFeatures);
  }

  if (gated.length > 0) {
    throw new ExperimentalNotConfiguredError(`Agent ${gated.join(", ")}`);
  }
}


================================================
FILE: packages/core/lib/v3/agent/utils/variables.ts
================================================
import type { Variables, VariableValue } from "../../types/public/agent.js";

/**
 * Converts a VariableValue into its string form.
 * A rich object (anything non-null with a `value` property, e.g.
 * `{ value: "secret", description: "..." }`) yields `String(value)`;
 * any other input is stringified directly.
 */
export function resolveVariableValue(v: VariableValue): string {
  if (v === null || typeof v !== "object" || !("value" in v)) {
    return String(v);
  }
  return String(v.value);
}

/**
 * Reads the optional description attached to a rich VariableValue.
 * Yields `undefined` for primitives and for objects lacking a `value` property.
 */
export function getVariableDescription(v: VariableValue): string | undefined {
  if (v === null || typeof v !== "object" || !("value" in v)) {
    return undefined;
  }
  return v.description;
}

/**
 * Substitutes %variableName% tokens in text with resolved variable values.
 * Works with both simple and rich variable formats.
 *
 * Substitution is done in a single pass over the original text, so a
 * substituted value is never scanned again: a value that itself contains
 * something like "%other%" is inserted verbatim, and the result does not
 * depend on the iteration order of `variables`.
 *
 * @param text - Text that may contain %name% tokens
 * @param variables - Variables to substitute; when omitted or empty the text is returned unchanged
 * @returns The text with every known token replaced; unknown tokens are left as-is
 */
export function substituteVariables(
  text: string,
  variables?: Variables,
): string {
  if (!variables) return text;

  // token ("%name%") -> replacement string
  const replacements = new Map<string, string>();
  for (const [key, v] of Object.entries(variables)) {
    replacements.set(`%${key}%`, resolveVariableValue(v));
  }
  // An empty alternation would match the empty string everywhere.
  if (replacements.size === 0) return text;

  // Keys are arbitrary strings, so escape regex metacharacters before joining.
  const escapeForRegExp = (literal: string): string =>
    literal.replace(/[.*+?^${}()|[\]\\]/g, "\\$&");
  const tokenPattern = new RegExp(
    Array.from(replacements.keys(), escapeForRegExp).join("|"),
    "g",
  );

  // A replacer function keeps "$&"-style sequences in values literal.
  return text.replace(
    tokenPattern,
    (token) => replacements.get(token) ?? token,
  );
}

/**
 * Reduces Variables to a plain name -> string map for internal consumers
 * that only need key→value mappings (e.g., actHandler, cache replay).
 * Yields `undefined` when `variables` is missing or has no entries.
 */
export function flattenVariables(
  variables?: Variables,
): Record<string, string> | undefined {
  const pairs = variables ? Object.entries(variables) : [];
  if (pairs.length === 0) return undefined;

  return pairs.reduce<Record<string, string>>((flat, [name, raw]) => {
    flat[name] = resolveVariableValue(raw);
    return flat;
  }, {});
}


================================================
FILE: packages/core/lib/v3/agent/utils/xpath.ts
================================================
/**
 * Utility functions for XPath handling in agent tools.
 */

/**
 * Normalizes a value into an "xpath="-prefixed selector.
 * Surrounding whitespace is trimmed and an existing "xpath=" prefix is kept as-is.
 *
 * @param value - Candidate selector; anything that is not a string is rejected
 * @returns The trimmed selector prefixed with "xpath=", or null when the
 *   value is not a string or is blank after trimming
 */
export function ensureXPath(value: unknown): string | null {
  const candidate = typeof value === "string" ? value.trim() : "";
  if (candidate.length === 0) {
    return null;
  }
  const prefix = "xpath=";
  return candidate.startsWith(prefix) ? candidate : prefix + candidate;
}


================================================
FILE: packages/core/lib/v3/api.ts
================================================
import makeFetchCookie from "fetch-cookie";
import { loadApiKeyFromEnv } from "../utils.js";
import { STAGEHAND_VERSION } from "../version.js";
import {
  StagehandAPIError,
  StagehandAPIUnauthorizedError,
  StagehandHttpError,
  StagehandResponseBodyError,
  StagehandResponseParseError,
  StagehandServerError,
  ExperimentalNotConfiguredError,
} from "./types/public/index.js";
import type {
  ActResult,
  AgentConfig,
  AgentExecuteOptions,
  AgentResult,
  ExtractResult,
  ObserveResult,
  LogLine,
  StagehandMetrics,
  BrowserbaseRegion,
  ActOptions,
  ExtractOptions,
  ObserveOptions,
  Api,
} from "./types/public/index.js";
import type {
  SerializableResponse,
  AgentCacheTransferPayload,
} from "./types/private/index.js";
import type { ModelConfiguration } from "./types/public/model.js";
import { toJsonSchema } from "./zodCompat.js";
import type { StagehandZodSchema } from "./zodCompat.js";

// =============================================================================
// Multi-region API URL mapping
// =============================================================================

/**
 * Mapping of Browserbase regions to their corresponding Stagehand API base URLs.
 * Users should configure their client to hit the API endpoint that matches
 * the region where their browser session is running.
 *
 * The URLs carry no version suffix; getApiUrlForRegion appends "/v1" and
 * falls back to the "us-west-2" entry for a missing or unknown region.
 */
export const REGION_API_URLS: Record<BrowserbaseRegion, string> = {
  "us-west-2": "https://api.stagehand.browserbase.com",
  "us-east-1": "https://api.use1.stagehand.browserbase.com",
  "eu-central-1": "https://api.euc1.stagehand.browserbase.com",
  "ap-southeast-1": "https://api.apse1.stagehand.browserbase.com",
};

/**
 * Resolves the versioned Stagehand API URL for a Browserbase region.
 * A missing region, or one with no entry in REGION_API_URLS, resolves to
 * the us-west-2 endpoint.
 *
 * @param region - The Browserbase region (e.g., "us-west-2", "eu-central-1")
 * @returns The region's base URL followed by "/v1"
 */
export function getApiUrlForRegion(
  region: BrowserbaseRegion | undefined,
): string {
  const regionalBase: string | undefined =
    REGION_API_URLS[region as BrowserbaseRegion];
  const base = regionalBase ?? REGION_API_URLS["us-west-2"];
  return base + "/v1";
}

// =============================================================================
// Client-specific types (can't be Zod schemas due to functions/Page objects)
// =============================================================================
//
// These types mirror the Api.* schemas from types/public/api.ts but include
// non-serializable SDK fields (like Page objects) that get stripped before
// sending requests over the wire.
//
// Relationship to wire format:
// - Client accepts: SDK types (ActOptions, ExtractOptions, etc.) with optional `page`
// - Wire sends: Api.* types (page stripped, Zod schema converted to JSON schema)
// - Client returns: SDK result types (ActResult, ExtractResult, etc.)
// =============================================================================

/**
 * Constructor parameters for StagehandAPIClient
 */
interface StagehandAPIConstructorParams {
  /** API key stored on the client (presumably the Browserbase API key; confirm against callers). */
  apiKey: string;
  /** Optional project identifier stored on the client. */
  projectId?: string;
  /** Sink for the client's log lines (e.g. the "init" message emitted by init()). */
  logger: (message: LogLine) => void;
  /**
   * When true, enables server-side caching by default for all requests.
   * When false, disables server-side caching.
   * Defaults to true (caching enabled).
   * Can be overridden per-method in act(), extract(), and observe() options.
   */
  serverCache?: boolean;
}

/**
 * Parameters for starting a session via the API client.
 * Extends Api.SessionStartRequest with client-specific field (modelApiKey).
 *
 * Wire format: Api.SessionStartRequest (modelApiKey sent via header, not body)
 */
interface ClientSessionStartParams extends Api.SessionStartRequest {
  /**
   * Model API key - sent via x-model-api-key header, not in request body.
   * Required: StagehandAPIClient.init() throws StagehandAPIError when it is empty.
   */
  modelApiKey: string;
}

/**
 * Generic API response wrapper matching Api.*Response schemas.
 * Discriminated on `success`: a successful response carries `data`,
 * a failed one carries a `message` instead.
 */
type ApiResponse<T> =
  | { success: true; data: T }
  | { success: false; message: string };

/**
 * Union of all API request body types for type-safe execute() calls.
 * There is one member for each body-carrying method of
 * ExecuteActionParams["method"]; the "end" method has no body type here.
 */
type ApiRequestBody =
  | Api.ActRequest
  | Api.ExtractRequest
  | Api.ObserveRequest
  | Api.NavigateRequest
  | Api.AgentExecuteRequest;

/**
 * Parameters for executing an action via the streaming API
 */
interface ExecuteActionParams {
  /** Which API operation to invoke. */
  method: "act" | "extract" | "observe" | "navigate" | "end" | "agentExecute";
  /** Wire-format request body for the operation, when it has one. */
  args?: ApiRequestBody;
  /** Extra string key/value pairs for the request (presumably query parameters; confirm in execute()). */
  params?: Record<string, string>;
  /**
   * Override the instance-level serverCache setting for this request.
   * When true, enables server-side caching.
   * When false, disables server-side caching.
   */
  serverCache?: boolean;
}

/**
 * Client parameters for act() method.
 * Derives structure from Api.ActRequest but uses SDK's ActOptions (which includes `page`).
 * Before serialization, `page` is stripped to produce Api.ActRequest wire format.
 */
interface ClientActParameters {
  /** Same type as the wire-format `input` field. */
  input: Api.ActRequest["input"];
  /** SDK-level options; may include the non-serializable `page`. */
  options?: ActOptions;
  /** Same type as the wire-format `frameId` field. */
  frameId?: Api.ActRequest["frameId"];
}

/**
 * Client parameters for extract() method.
 * Derives structure from Api.ExtractRequest but uses SDK's ExtractOptions (which includes `page`)
 * and accepts Zod schema (converted to JSON schema for wire format).
 */
interface ClientExtractParameters {
  /** Same type as the wire-format `instruction` field. */
  instruction?: Api.ExtractRequest["instruction"];
  /** Zod schema describing the data to extract; not sent as-is over the wire. */
  schema?: StagehandZodSchema;
  /** SDK-level options; may include the non-serializable `page`. */
  options?: ExtractOptions;
  /** Same type as the wire-format `frameId` field. */
  frameId?: Api.ExtractRequest["frameId"];
}

/**
 * Client parameters for observe() method.
 * Derives structure from Api.ObserveRequest but uses SDK's ObserveOptions (which includes `page`).
 * Before serialization, `page` is stripped to produce Api.ObserveRequest wire format.
 */
interface ClientObserveParameters {
  /** Same type as the wire-format `instruction` field. */
  instruction?: Api.ObserveRequest["instruction"];
  /** SDK-level options; may include the non-serializable `page`. */
  options?: ObserveOptions;
  /** Same type as the wire-format `frameId` field. */
  frameId?: Api.ObserveRequest["frameId"];
}

export class StagehandAPIClient {
  private apiKey: string;
  private projectId?: string;
  private sessionId?: string;
  private modelApiKey: string;
  private modelProvider?: string;
  private region?: BrowserbaseRegion;
  private logger: (message: LogLine) => void;
  private fetchWithCookies;
  private serverCache: boolean;
  private lastFinishedEventData: Record<string, unknown> | null = null;
  private latestAgentCacheEntry: AgentCacheTransferPayload | null = null;

  /**
   * Creates an API client. No network traffic happens here; call `init()`
   * to start a session.
   *
   * Server-side caching defaults to enabled when `serverCache` is not given.
   */
  constructor(params: StagehandAPIConstructorParams) {
    // One cookie jar for the lifetime of the client so cookies persist across
    // every request it makes.
    this.fetchWithCookies = makeFetchCookie(fetch);
    this.serverCache = params.serverCache ?? true;
    this.logger = params.logger;
    this.projectId = params.projectId;
    this.apiKey = params.apiKey;
  }

  /**
   * Starts a session via `POST /sessions/start` and remembers the resulting
   * session id, model API key, model provider and region on this client.
   *
   * @throws StagehandAPIError when `modelApiKey` is missing or the API
   *   answers with `success: false`.
   * @throws StagehandAPIUnauthorizedError on HTTP 401.
   * @throws StagehandHttpError on any other non-200 status.
   * @returns The `data` payload of the session-start response.
   */
  async init({
    modelName,
    modelApiKey,
    domSettleTimeoutMs,
    verbose,
    systemPrompt,
    selfHeal,
    browserbaseSessionCreateParams,
    browserbaseSessionID,
    // browser,  TODO for local browsers
  }: ClientSessionStartParams): Promise<Api.SessionStartResult> {
    if (!modelApiKey) {
      throw new StagehandAPIError("modelApiKey is required");
    }

    this.modelApiKey = modelApiKey;
    // The provider is the part before the slash, e.g. "openai/gpt-5-nano" -> "openai"
    this.modelProvider = modelName?.includes("/")
      ? modelName.split("/")[0]
      : undefined;
    // Remembered so later requests resolve the matching regional API URL
    this.region = browserbaseSessionCreateParams?.region;

    this.logger({
      category: "init",
      message: "Creating new browserbase session...",
      level: 1,
    });

    // Wire-format payload (Api.SessionStartRequest shape)
    const startRequest: Api.SessionStartRequest = {
      modelName,
      domSettleTimeoutMs,
      verbose,
      systemPrompt,
      selfHeal,
      browserbaseSessionCreateParams,
      browserbaseSessionID,
      // browser, TODO: only send when connected to local fastify
    };

    const startResponse = await this.request("/sessions/start", {
      method: "POST",
      body: JSON.stringify(startRequest),
    });

    const { status } = startResponse;
    if (status === 401) {
      throw new StagehandAPIUnauthorizedError(
        "Unauthorized. Ensure you provided a valid API key.",
      );
    }
    if (status !== 200) {
      const errorText = await startResponse.text();
      this.logger({
        category: "api",
        message: `API error (${status}): ${errorText}`,
        level: 0,
      });
      throw new StagehandHttpError(`Unknown error: ${status}`);
    }

    const parsed =
      (await startResponse.json()) as ApiResponse<Api.SessionStartResult>;
    if (parsed.success === false) {
      throw new StagehandAPIError(parsed.message);
    }

    // Temporary reroute for rollout: fall back to the caller-supplied
    // session id when the API reports the session as not available.
    if (!parsed.data?.available && browserbaseSessionID) {
      parsed.data.sessionId = browserbaseSessionID;
    }

    const result = parsed.data;
    this.sessionId = result.sessionId;
    return result;
  }

  /**
   * Runs `act` on the remote session.
   *
   * `options.page` and `options.serverCache` never go over the wire: the
   * former is dropped, the latter becomes the per-request cache override.
   * Any `options.model` is expanded so that it carries an API key.
   */
  async act({
    input,
    options,
    frameId,
  }: ClientActParameters): Promise<ActResult> {
    let wireOptions: Api.ActRequest["options"];
    let serverCache: boolean | undefined;

    if (options) {
      // eslint-disable-next-line @typescript-eslint/no-unused-vars
      const { page: _page, serverCache: cacheOverride, ...serializable } =
        options;
      serverCache = cacheOverride;

      // Leave `options` undefined on the wire when nothing serializable remains
      const hasWireFields = Object.keys(serializable).length > 0;
      if (hasWireFields) {
        if (serializable.model) {
          serializable.model = this.prepareModelConfig(serializable.model);
        }
        wireOptions = serializable as unknown as Api.ActRequest["options"];
      }
    }

    const actRequest: Api.ActRequest = {
      input,
      options: wireOptions,
      frameId,
    };

    return this.execute<ActResult>({
      method: "act",
      args: actRequest,
      serverCache,
    });
  }

  /**
   * Runs `extract` on the remote session.
   *
   * A Zod `schema`, when given, is converted to JSON schema for the wire.
   * `options.page` and `options.serverCache` are not serialized; the latter
   * becomes the per-request cache override. Any `options.model` is expanded
   * so that it carries an API key.
   */
  async extract<T extends StagehandZodSchema>({
    instruction,
    schema: zodSchema,
    options,
    frameId,
  }: ClientExtractParameters): Promise<ExtractResult<T>> {
    let wireOptions: Api.ExtractRequest["options"];
    let serverCache: boolean | undefined;

    // Schema conversion happens before option handling
    const wireSchema = zodSchema ? toJsonSchema(zodSchema) : undefined;

    if (options) {
      // eslint-disable-next-line @typescript-eslint/no-unused-vars
      const { page: _page, serverCache: cacheOverride, ...serializable } =
        options;
      serverCache = cacheOverride;

      // Leave `options` undefined on the wire when nothing serializable remains
      const hasWireFields = Object.keys(serializable).length > 0;
      if (hasWireFields) {
        if (serializable.model) {
          serializable.model = this.prepareModelConfig(serializable.model);
        }
        wireOptions = serializable as unknown as Api.ExtractRequest["options"];
      }
    }

    const extractRequest: Api.ExtractRequest = {
      instruction,
      schema: wireSchema,
      options: wireOptions,
      frameId,
    };

    return this.execute<ExtractResult<T>>({
      method: "extract",
      args: extractRequest,
      serverCache,
    });
  }

  /**
   * Runs `observe` on the remote session.
   *
   * `options.page` and `options.serverCache` never go over the wire: the
   * former is dropped, the latter becomes the per-request cache override.
   * Any `options.model` is expanded so that it carries an API key.
   */
  async observe({
    instruction,
    options,
    frameId,
  }: ClientObserveParameters): Promise<ObserveResult> {
    let wireOptions: Api.ObserveRequest["options"];
    let serverCache: boolean | undefined;

    if (options) {
      // eslint-disable-next-line @typescript-eslint/no-unused-vars
      const { page: _page, serverCache: cacheOverride, ...serializable } =
        options;
      serverCache = cacheOverride;

      // Leave `options` undefined on the wire when nothing serializable remains
      const hasWireFields = Object.keys(serializable).length > 0;
      if (hasWireFields) {
        if (serializable.model) {
          serializable.model = this.prepareModelConfig(serializable.model);
        }
        wireOptions = serializable as unknown as Api.ObserveRequest["options"];
      }
    }

    const observeRequest: Api.ObserveRequest = {
      instruction,
      options: wireOptions,
      frameId,
    };

    return this.execute<ObserveResult>({
      method: "observe",
      args: observeRequest,
      serverCache,
    });
  }

  /**
   * Navigates the remote session to `url` through the `navigate` endpoint.
   *
   * @param url Destination URL.
   * @param options Navigation options, forwarded unchanged.
   * @param frameId Optional target frame, forwarded unchanged.
   * @returns Whatever the server reports as the navigation result (may be null).
   */
  async goto(
    url: string,
    options?: Api.NavigateRequest["options"],
    frameId?: string,
  ): Promise<SerializableResponse | null> {
    const navigateRequest: Api.NavigateRequest = { url, options, frameId };
    const navigation = this.execute<SerializableResponse | null>({
      method: "navigate",
      args: navigateRequest,
    });
    return navigation;
  }

  /**
   * Runs an agent on the remote session through the `agentExecute` endpoint.
   *
   * After the call, any `cacheEntry` found on the stream's "finished" event
   * is kept for `consumeLatestAgentCacheEntry()`; otherwise that slot is
   * reset to null.
   *
   * @throws ExperimentalNotConfiguredError when `agentConfig.integrations`
   *   is non-empty (MCP integrations are not supported in API mode).
   */
  async agentExecute(
    agentConfig: AgentConfig,
    executeOptions: AgentExecuteOptions | string,
    frameId?: string,
    shouldCache?: boolean,
  ): Promise<AgentResult> {
    // MCP integrations cannot be used in API mode
    if (agentConfig.integrations?.length) {
      throw new ExperimentalNotConfiguredError("MCP integrations");
    }

    // A bare string is shorthand for `{ instruction }`; otherwise drop the
    // non-serializable `page` when one is present.
    const toWireExecuteOptions =
      (): Api.AgentExecuteRequest["executeOptions"] => {
        if (typeof executeOptions === "string") {
          return { instruction: executeOptions };
        }
        if (!executeOptions.page) {
          return executeOptions;
        }
        // eslint-disable-next-line @typescript-eslint/no-unused-vars
        const { page: _page, ...serializable } = executeOptions;
        return serializable;
      };
    const wireExecuteOptions = toWireExecuteOptions();

    const { mode, cua, systemPrompt } = agentConfig;
    const wireAgentConfig: Api.AgentExecuteRequest["agentConfig"] = {
      systemPrompt,
      // An explicit `mode` wins; the legacy `cua: true` flag maps to "cua" mode
      mode: mode ?? (cua === true ? "cua" : undefined),
      // `cua` is only forwarded when no explicit mode was given
      cua: mode === undefined ? cua : undefined,
      model: agentConfig.model
        ? this.prepareModelConfig(agentConfig.model)
        : undefined,
      executionModel: agentConfig.executionModel
        ? this.prepareModelConfig(agentConfig.executionModel)
        : undefined,
    };

    const agentRequest: Api.AgentExecuteRequest = {
      agentConfig: wireAgentConfig,
      executeOptions: wireExecuteOptions,
      frameId,
      shouldCache,
    };

    const agentResult = await this.execute<AgentResult>({
      method: "agentExecute",
      args: agentRequest,
    });

    const finished = this.consumeFinishedEventData<Api.AgentExecuteResult>();
    const cacheEntry = finished?.cacheEntry;
    this.latestAgentCacheEntry =
      cacheEntry === undefined
        ? null
        : (cacheEntry as AgentCacheTransferPayload);

    return agentResult;
  }

  /**
   * Returns the cache entry captured by the most recent `agentExecute()` and
   * clears it, so a second call returns null until another entry is captured.
   */
  consumeLatestAgentCacheEntry(): AgentCacheTransferPayload | null {
    try {
      return this.latestAgentCacheEntry;
    } finally {
      this.latestAgentCacheEntry = null;
    }
  }

  /**
   * Ends the current session with `POST /sessions/{sessionId}/end` and
   * returns the raw HTTP response without inspecting its status.
   */
  async end(): Promise<Response> {
    const endPath = `/sessions/${this.sessionId}/end`;
    return this.request(endPath, { method: "POST" });
  }

  /**
   * Fetches `/sessions/{sessionId}/replay` and folds the per-action token
   * usage into a `StagehandMetrics` summary.
   *
   * Usage is bucketed by the action's lower-cased method name ("act",
   * "extract", "observe", "agent"). Every action with token usage also
   * contributes to the `total*` counters, whatever its method.
   *
   * @throws StagehandAPIError when no session id is set or the API reports
   *   `success: false`.
   * @throws StagehandHttpError on a non-200 response.
   */
  async getReplayMetrics(): Promise<StagehandMetrics> {
    if (!this.sessionId) {
      throw new StagehandAPIError("sessionId is required to fetch metrics.");
    }

    const response = await this.request(`/sessions/${this.sessionId}/replay`, {
      method: "GET",
    });

    if (response.status !== 200) {
      const errorText = await response.text();
      this.logger({
        category: "api",
        message: `Failed to fetch metrics. Status ${response.status}: ${errorText}`,
        level: 0,
      });
      throw new StagehandHttpError(
        `Failed to fetch metrics with status ${response.status}: ${errorText}`,
      );
    }

    const data = (await response.json()) as
      | Api.ReplayResponse
      | { success: false; error?: string };

    if (!data.success) {
      const failure = data as { success: false; error?: string };
      throw new StagehandAPIError(
        `Failed to fetch metrics: ${failure.error || "Unknown error"}`,
      );
    }

    const apiData = (data as Api.ReplayResponse).data;

    // Every counter starts at zero; the loops below only ever add to them.
    const metrics: StagehandMetrics = {
      actPromptTokens: 0,
      actCompletionTokens: 0,
      actReasoningTokens: 0,
      actCachedInputTokens: 0,
      actInferenceTimeMs: 0,
      extractPromptTokens: 0,
      extractCompletionTokens: 0,
      extractReasoningTokens: 0,
      extractCachedInputTokens: 0,
      extractInferenceTimeMs: 0,
      observePromptTokens: 0,
      observeCompletionTokens: 0,
      observeReasoningTokens: 0,
      observeCachedInputTokens: 0,
      observeInferenceTimeMs: 0,
      agentPromptTokens: 0,
      agentCompletionTokens: 0,
      agentReasoningTokens: 0,
      agentCachedInputTokens: 0,
      agentInferenceTimeMs: 0,
      totalPromptTokens: 0,
      totalCompletionTokens: 0,
      totalReasoningTokens: 0,
      totalCachedInputTokens: 0,
      totalInferenceTimeMs: 0,
    };

    for (const page of apiData?.pages || []) {
      for (const action of page.actions || []) {
        const methodName = (action.method || "").toLowerCase();
        const usage = action.tokenUsage;
        if (!usage) {
          continue;
        }

        const promptTokens = usage.inputTokens || 0;
        const completionTokens = usage.outputTokens || 0;

        // These two fields are optional on the usage record; absent means 0.
        let reasoningTokens = 0;
        if ("reasoningTokens" in usage) {
          reasoningTokens = Number(
            (usage as { reasoningTokens?: number }).reasoningTokens ?? 0,
          );
        }
        let cachedInputTokens = 0;
        if ("cachedInputTokens" in usage) {
          cachedInputTokens = Number(
            (usage as { cachedInputTokens?: number }).cachedInputTokens ?? 0,
          );
        }

        const inferenceTimeMs = usage.timeMs || 0;

        switch (methodName) {
          case "act":
            metrics.actPromptTokens += promptTokens;
            metrics.actCompletionTokens += completionTokens;
            metrics.actReasoningTokens += reasoningTokens;
            metrics.actCachedInputTokens += cachedInputTokens;
            metrics.actInferenceTimeMs += inferenceTimeMs;
            break;
          case "extract":
            metrics.extractPromptTokens += promptTokens;
            metrics.extractCompletionTokens += completionTokens;
            metrics.extractReasoningTokens += reasoningTokens;
            metrics.extractCachedInputTokens += cachedInputTokens;
            metrics.extractInferenceTimeMs += inferenceTimeMs;
            break;
          case "observe":
            metrics.observePromptTokens += promptTokens;
            metrics.observeCompletionTokens += completionTokens;
            metrics.observeReasoningTokens += reasoningTokens;
            metrics.observeCachedInputTokens += cachedInputTokens;
            metrics.observeInferenceTimeMs += inferenceTimeMs;
            break;
          case "agent":
            metrics.agentPromptTokens += promptTokens;
            metrics.agentCompletionTokens += completionTokens;
            metrics.agentReasoningTokens += reasoningTokens;
            metrics.agentCachedInputTokens += cachedInputTokens;
            metrics.agentInferenceTimeMs += inferenceTimeMs;
            break;
          default:
            // Unrecognized methods still count toward the totals below
            break;
        }

        metrics.totalPromptTokens += promptTokens;
        metrics.totalCompletionTokens += completionTokens;
        metrics.totalReasoningTokens += reasoningTokens;
        metrics.totalCachedInputTokens += cachedInputTokens;
        metrics.totalInferenceTimeMs += inferenceTimeMs;
      }
    }

    return metrics;
  }

  /**
   * Normalizes a model configuration for the API payload so that it always
   * carries an `apiKey`.
   *
   * - A string model becomes `{ modelName, apiKey }`.
   * - An object without `apiKey` is copied with one added.
   * - An object that already has `apiKey` is returned as-is.
   *
   * Key resolution: when the model's provider prefix (the text before "/")
   * differs from the provider used at init, the key is looked up from env
   * vars first, falling back to the session's model API key. In every other
   * case the session's model API key is used directly.
   */
  private prepareModelConfig(
    model: ModelConfiguration,
  ): { modelName: string; apiKey: string } & Record<string, unknown> {
    const resolveApiKey = (modelName: string | undefined): string => {
      const provider = modelName?.includes("/")
        ? modelName.split("/")[0]
        : undefined;
      if (!provider || provider === this.modelProvider) {
        return this.modelApiKey;
      }
      return loadApiKeyFromEnv(provider, this.logger) ?? this.modelApiKey;
    };

    if (typeof model === "string") {
      const apiKey = resolveApiKey(model);
      return { modelName: model, apiKey };
    }

    if (model.apiKey) {
      return model as { modelName: string; apiKey: string } & Record<
        string,
        unknown
      >;
    }

    const apiKey = resolveApiKey(model.modelName);
    return { ...model, apiKey };
  }

  /**
   * Hands back the payload of the last "finished" stream event, cast to `T`,
   * and clears the stored copy so it can be read only once.
   */
  private consumeFinishedEventData<T>(): T | null {
    try {
      return this.lastFinishedEventData as T | null;
    } finally {
      this.lastFinishedEventData = null;
    }
  }

  /**
   * POSTs `args` to `/sessions/{sessionId}/{method}` and consumes the
   * server-sent-event stream until a terminal system event arrives.
   *
   * Stream handling:
   * - events are separated by a blank line and must start with `data: `;
   *   anything else is skipped;
   * - `log` events are forwarded to the logger;
   * - a `system` event with status `error` throws a plain `Error` carrying the
   *   server's message (matching local SDK behavior);
   * - a `system` event with status `finished` records its payload for
   *   `consumeFinishedEventData()` and resolves with `data.result`, with cache
   *   status attached unless caching was bypassed for this request.
   *
   * A terminal event left in the buffer when the stream closes (i.e. sent
   * without a trailing blank line) is handled exactly like one seen mid-stream.
   *
   * @throws StagehandHttpError on a non-2xx response.
   * @throws StagehandResponseBodyError when the response has no body.
   * @throws StagehandResponseParseError when an event is not valid JSON.
   * @throws StagehandServerError when the stream ends without a terminal event.
   */
  private async execute<T>({
    method,
    args,
    params,
    serverCache,
  }: ExecuteActionParams): Promise<T> {
    // Drop any payload left over from a previous call
    this.lastFinishedEventData = null;
    const urlParams = new URLSearchParams(params as Record<string, string>);
    const queryString = urlParams.toString();
    const url = `/sessions/${this.sessionId}/${method}${queryString ? `?${queryString}` : ""}`;

    const response = await this.request(
      url,
      {
        method: "POST",
        body: JSON.stringify(args),
      },
      serverCache,
    );

    // Capture cache status from response header
    const cacheStatus = response.headers.get("browserbase-cache-status") as
      | "HIT"
      | "MISS"
      | null;

    if (!response.ok) {
      const errorBody = await response.text();
      throw new StagehandHttpError(
        `HTTP error! status: ${response.status}, body: ${errorBody}`,
      );
    }

    if (!response.body) {
      throw new StagehandResponseBodyError();
    }

    // Single completion path shared by the streaming loop and the
    // trailing-buffer case, so both record the finished payload and apply the
    // same cache-status rules.
    const finish = (
      finishedData: Record<string, unknown> & { cacheHit?: boolean },
    ): T => {
      this.lastFinishedEventData = finishedData;

      // If caching was bypassed for this request, suppress cache status
      // so we don't log or surface a MISS that the server emits anyway.
      const cacheEnabled = this.shouldUseCache(serverCache);
      return this.attachCacheStatus(
        finishedData.result as T,
        method,
        cacheEnabled ? cacheStatus : null,
        cacheEnabled ? { data: finishedData } : { data: {} },
      );
    };

    const reader = response.body.getReader();
    const decoder = new TextDecoder();
    let buffer = "";

    while (true) {
      const { value, done } = await reader.read();

      if (done && !buffer) {
        throw new StagehandServerError(
          "Stream ended without completion signal",
        );
      }

      buffer += decoder.decode(value, { stream: true });
      const lines = buffer.split("\n\n");
      // The last piece may be an incomplete event; keep it for the next read
      buffer = lines.pop() || "";

      for (const line of lines) {
        if (!line.startsWith("data: ")) continue;

        try {
          const eventData = JSON.parse(line.slice(6));

          if (eventData.type === "system") {
            if (eventData.data.status === "error") {
              const { error: errorMsg } = eventData.data;
              // Throw plain Error to match local SDK behavior (useApi: false)
              throw new Error(errorMsg);
            }
            if (eventData.data.status === "finished") {
              return finish(eventData.data);
            }
          } else if (eventData.type === "log") {
            const msg = eventData.data.message;
            // Skip server-side internal logs that don't apply to API mode
            if (msg?.message === "Connecting to local browser") {
              continue;
            }
            this.logger(eventData.data.message);
          }
        } catch (e) {
          // Let Error instances pass through (server errors thrown above)
          // Only wrap SyntaxError from JSON.parse as parse errors
          if (e instanceof Error && !(e instanceof SyntaxError)) {
            throw e;
          }

          const errorMessage = e instanceof Error ? e.message : String(e);
          this.logger({
            category: "api",
            message: `Failed to parse SSE event: ${errorMessage}`,
            level: 0,
          });
          throw new StagehandResponseParseError(
            `Failed to parse server response: ${errorMessage}`,
          );
        }
      }

      if (done) {
        // Process any remaining data in buffer before exiting
        if (buffer.trim() && buffer.startsWith("data: ")) {
          let trailingEvent:
            | {
                type?: string;
                data?: Record<string, unknown> & { cacheHit?: boolean };
              }
            | null
            | undefined;
          try {
            trailingEvent = JSON.parse(buffer.slice(6));
          } catch {
            // A truncated final event is logged, then reported below as a
            // stream that ended without a completion signal.
            this.logger({
              category: "api",
              message: `Incomplete data in final buffer: ${buffer.substring(0, 100)}`,
              level: 0,
            });
          }

          const trailingData = trailingEvent?.data;
          if (trailingEvent?.type === "system" && trailingData) {
            if (trailingData.status === "error") {
              // Surface the server's own error rather than the generic
              // "stream ended" failure, as the in-loop path does.
              throw new Error(trailingData.error as string);
            }
            if (trailingData.status === "finished") {
              return finish(trailingData);
            }
          }
        }
        throw new StagehandServerError(
          "Stream ended without completion signal",
        );
      }
    }
  }

  /**
   * Works out the final cache status and, for act/extract/observe calls,
   * logs it and writes it onto the result as `cacheStatus`.
   *
   * The response-header value wins when present; otherwise a boolean
   * `cacheHit` on the event data is translated to "HIT"/"MISS". With neither,
   * or for any other method, the result is returned untouched.
   *
   * Note that object results are mutated in place.
   */
  private attachCacheStatus<T>(
    result: T,
    method: string,
    cacheStatus: "HIT" | "MISS" | null,
    eventData: { data: { cacheHit?: boolean } },
  ): T {
    let resolvedStatus: "HIT" | "MISS" | undefined;
    if (cacheStatus) {
      resolvedStatus = cacheStatus;
    } else if (typeof eventData.data.cacheHit === "boolean") {
      resolvedStatus = eventData.data.cacheHit ? "HIT" : "MISS";
    }

    const reportsCacheStatus =
      method === "act" || method === "extract" || method === "observe";
    if (!resolvedStatus || !reportsCacheStatus) {
      return result;
    }

    this.logger({
      category: "cache",
      message: `${method} server cache ${resolvedStatus.toLowerCase()}`,
      level: 1,
    });

    // Primitive or null results have nowhere to carry the status
    if (result && typeof result === "object") {
      // eslint-disable-next-line @typescript-eslint/no-explicit-any
      (result as ActResult | ExtractResult<any> | ObserveResult).cacheStatus =
        resolvedStatus;
    }
    return result;
  }

  /**
   * Decides whether server-side caching applies to a request.
   *
   * @param methodServerCache Per-request override; when it is anything other
   *   than `undefined` it is returned as-is.
   * @returns The override if given, else the instance-level `serverCache`.
   */
  private shouldUseCache(methodServerCache?: boolean): boolean {
    return methodServerCache !== undefined
      ? methodServerCache
      : this.serverCache;
  }

  /**
   * Sends one HTTP request to the Stagehand API through the cookie-aware
   * fetch and returns the raw response (status is not inspected here).
   *
   * Headers:
   * - API key, streaming flag, language and SDK version are always sent;
   * - project id, session id and model API key are sent only once they are
   *   known, so an unset value never goes out as the literal string
   *   "undefined" (e.g. the session id on `/sessions/start`);
   * - `browserbase-cache-bypass: true` is added when caching is disabled for
   *   this request;
   * - `Content-Type: application/json` is added for POSTs with a body;
   * - anything in `options.headers` overrides the defaults.
   *
   * Base URL: `STAGEHAND_API_URL` (trailing slashes removed, `/v1` appended
   * if missing) when set, otherwise the URL for the session's region.
   *
   * @param path Path appended to the base URL, starting with "/".
   * @param options Fetch options; spread into the final request.
   * @param serverCache Per-request cache override (see `shouldUseCache`).
   */
  private async request(
    path: string,
    options: RequestInit,
    serverCache?: boolean,
  ): Promise<Response> {
    const defaultHeaders: Record<string, string> = {
      "x-bb-api-key": this.apiKey,
      ...(this.projectId ? { "x-bb-project-id": this.projectId } : {}),
      // Unset until init() has received a session id
      ...(this.sessionId ? { "x-bb-session-id": this.sessionId } : {}),
      // we want real-time logs, so we stream the response
      "x-stream-response": "true",
      // Unset until init() has been called
      ...(this.modelApiKey ? { "x-model-api-key": this.modelApiKey } : {}),
      "x-language": "typescript",
      "x-sdk-version": STAGEHAND_VERSION,
    };

    // Add cache bypass header if caching is disabled
    if (!this.shouldUseCache(serverCache)) {
      defaultHeaders["browserbase-cache-bypass"] = "true";
    }

    if (options.method === "POST" && options.body) {
      defaultHeaders["Content-Type"] = "application/json";
    }

    // Use STAGEHAND_API_URL env var if set, otherwise use region-based URL
    // Ensure /v1 suffix is present for consistency
    let baseUrl: string;
    if (process.env.STAGEHAND_API_URL) {
      const envUrl = process.env.STAGEHAND_API_URL.replace(/\/+$/, "");
      // Append /v1 if not already present
      baseUrl = envUrl.endsWith("/v1") ? envUrl : `${envUrl}/v1`;
    } else {
      baseUrl = getApiUrlForRegion(this.region);
    }

    const response = await this.fetchWithCookies(`${baseUrl}${path}`, {
      ...options,
      headers: {
        ...defaultHeaders,
        ...options.headers,
      },
    });

    return response;
  }
}


================================================
FILE: packages/core/lib/v3/cache/ActCache.ts
================================================
import { createHash } from "crypto";
import type { ActHandler } from "../handlers/actHandler.js";
import type { LLMClient } from "../llm/LLMClient.js";
import type { Action, ActResult, Logger } from "../types/public/index.js";
import type { Page } from "../understudy/page.js";
import { CacheStorage } from "./CacheStorage.js";
import { safeGetPageUrl, waitForCachedSelector } from "./utils.js";
import {
  ActCacheContext,
  ActCacheDeps,
  CachedActEntry,
} from "../types/private/index.js";
import { StagehandNotInitializedError } from "../types/public/sdkErrors.js";
import { withTimeout } from "../timeoutConfig.js";

export class ActCache {
  private readonly storage: CacheStorage;
  private readonly logger: Logger;
  private readonly getActHandler: () => ActHandler | null;
  private readonly getDefaultLlmClient: () => LLMClient;
  private readonly domSettleTimeoutMs?: number;

  /**
   * Stores the injected collaborators. The handler and default LLM client
   * are supplied as getters and are only resolved when a replay runs.
   */
  constructor(deps: ActCacheDeps) {
    this.storage = deps.storage;
    this.logger = deps.logger;
    this.getActHandler = deps.getActHandler;
    this.getDefaultLlmClient = deps.getDefaultLlmClient;
    this.domSettleTimeoutMs = deps.domSettleTimeoutMs;
  }

  /** Whether caching is active; mirrors the underlying storage's `enabled` flag. */
  get enabled(): boolean {
    const { enabled } = this.storage;
    return enabled;
  }

  /**
   * Builds the lookup context for an `act` call.
   *
   * The instruction is trimmed, the variables are shallow-copied, and the
   * cache key is derived from the trimmed instruction, the page URL and the
   * sorted variable names (variable values are not part of the key).
   *
   * @returns The context, or null when caching is disabled.
   */
  async prepareContext(
    instruction: string,
    page: Page,
    variables?: Record<string, string>,
  ): Promise<ActCacheContext | null> {
    if (!this.enabled) {
      return null;
    }

    const trimmedInstruction = instruction.trim();

    let variablesCopy: Record<string, string> | undefined;
    let variableKeys: string[] = [];
    if (variables) {
      variablesCopy = { ...variables };
      variableKeys = Object.keys(variablesCopy).sort();
    }

    const pageUrl = await safeGetPageUrl(page);

    return {
      instruction: trimmedInstruction,
      cacheKey: this.buildActCacheKey(
        trimmedInstruction,
        pageUrl,
        variableKeys,
      ),
      pageUrl,
      variableKeys,
      variables: variablesCopy,
    };
  }

  /**
   * Looks up the cached entry for `context` and, if it is usable, replays it.
   *
   * Returns null (a cache miss) when caching is disabled, the entry cannot be
   * read, the entry is absent, its version is not 1, it has no actions, its
   * variable names differ from the context's, or a required variable has no
   * value in the context.
   *
   * @param timeout Forwarded to the replay as its overall time limit.
   * @param llmClientOverride Used for the replay instead of the default client.
   */
  async tryReplay(
    context: ActCacheContext,
    page: Page,
    timeout?: number,
    llmClientOverride?: LLMClient,
  ): Promise<ActResult | null> {
    if (!this.enabled) return null;

    const lookup = await this.storage.readJson<CachedActEntry>(
      `${context.cacheKey}.json`,
    );
    if (lookup.error && lookup.path) {
      this.logger({
        category: "cache",
        message: `failed to read act cache entry: ${lookup.path}`,
        level: 2,
        auxiliary: {
          error: { value: String(lookup.error), type: "string" },
        },
      });
      return null;
    }

    const entry = lookup.value;
    if (
      !entry ||
      entry.version !== 1 ||
      !Array.isArray(entry.actions) ||
      entry.actions.length === 0
    ) {
      return null;
    }

    // Stored names are re-sorted on a copy; context names are already sorted
    const storedKeys = Array.isArray(entry.variableKeys)
      ? [...entry.variableKeys].sort()
      : [];
    const requestedKeys = [...context.variableKeys];
    if (!this.doVariableKeysMatch(storedKeys, requestedKeys)) {
      return null;
    }

    if (requestedKeys.length > 0) {
      const supplied = context.variables;
      if (!supplied || !this.hasAllVariableValues(requestedKeys, supplied)) {
        this.logger({
          category: "cache",
          message: "act cache miss: missing variables for replay",
          level: 2,
          auxiliary: {
            instruction: { value: context.instruction, type: "string" },
          },
        });
        return null;
      }
    }

    this.logger({
      category: "cache",
      message: "act cache hit",
      level: 1,
      auxiliary: {
        instruction: { value: context.instruction, type: "string" },
        url: {
          value: entry.url ?? context.pageUrl,
          type: "string",
        },
      },
    });

    return this.replayCachedActions(
      context,
      entry,
      page,
      timeout,
      llmClientOverride,
    );
  }

  /**
   * Persists an `act` result under the context's cache key as a version-1
   * entry. Does nothing when caching is disabled. A write failure is logged,
   * not thrown.
   */
  async store(context: ActCacheContext, result: ActResult): Promise<void> {
    if (!this.enabled) return;

    const { instruction, pageUrl, variableKeys, cacheKey } = context;

    const cachedEntry: CachedActEntry = {
      version: 1,
      instruction,
      url: pageUrl,
      variableKeys,
      actions: result.actions ?? [],
      actionDescription: result.actionDescription,
      message: result.message,
    };

    const writeOutcome = await this.storage.writeJson(
      `${cacheKey}.json`,
      cachedEntry,
    );

    if (writeOutcome.error && writeOutcome.path) {
      this.logger({
        category: "cache",
        message: "failed to write act cache entry",
        level: 1,
        auxiliary: {
          error: { value: String(writeOutcome.error), type: "string" },
        },
      });
      return;
    }

    this.logger({
      category: "cache",
      message: "act cache stored",
      level: 2,
      auxiliary: {
        instruction: { value: instruction, type: "string" },
        url: { value: pageUrl, type: "string" },
      },
    });
  }

  /**
   * Derives the cache key: the hex SHA-256 of the JSON serialization of
   * `{ instruction, url, variableKeys }`, in that property order.
   */
  private buildActCacheKey(
    instruction: string,
    url: string,
    variableKeys: string[],
  ): string {
    const keyMaterial = JSON.stringify({ instruction, url, variableKeys });
    const hasher = createHash("sha256");
    hasher.update(keyMaterial);
    return hasher.digest("hex");
  }

  /**
   * Replays the entry's actions in order, stopping at the first failure, and
   * combines the per-action results into a single `ActResult`.
   *
   * Before each action the cached selector is waited for. When the replay
   * succeeds but the actions that actually ran differ from the stored ones,
   * the cache entry is rewritten with the new actions.
   *
   * The whole replay runs under `timeout` via `withTimeout`.
   *
   * @throws StagehandNotInitializedError when no act handler is available.
   */
  private async replayCachedActions(
    context: ActCacheContext,
    entry: CachedActEntry,
    page: Page,
    timeout?: number,
    llmClientOverride?: LLMClient,
  ): Promise<ActResult> {
    const actHandler = this.getActHandler();
    if (!actHandler) {
      throw new StagehandNotInitializedError("act()");
    }
    const llmClient = llmClientOverride ?? this.getDefaultLlmClient();

    const replay = async (): Promise<ActResult> => {
      const outcomes: ActResult[] = [];

      for (const cachedAction of entry.actions) {
        await waitForCachedSelector({
          page,
          selector: cachedAction.selector,
          timeout: this.domSettleTimeoutMs,
          logger: this.logger,
          context: "act",
        });

        const outcome = await actHandler.takeDeterministicAction(
          cachedAction,
          page,
          this.domSettleTimeoutMs,
          llmClient,
          undefined,
          context.variables,
        );
        outcomes.push(outcome);

        // Later actions are not attempted once one has failed
        if (!outcome.success) break;
      }

      if (outcomes.length === 0) {
        return {
          success: false,
          message: "Failed to perform act: cached entry has no actions",
          actionDescription: entry.actionDescription ?? entry.instruction,
          actions: [],
        };
      }

      const success = outcomes.every((outcome) => outcome.success);
      const actions = outcomes.flatMap((outcome) => outcome.actions ?? []);

      // Message preference: joined per-action messages, then the stored
      // message, then a generic summary.
      const joinedMessages = outcomes
        .map((outcome) => outcome.message)
        .filter((text) => text && text.trim().length > 0)
        .join(" → ");
      const pluralSuffix = entry.actions.length === 1 ? "" : "s";
      const message =
        joinedMessages ||
        entry.message ||
        `Replayed ${entry.actions.length} cached action${pluralSuffix}.`;

      const lastOutcome = outcomes[outcomes.length - 1];
      const lastCachedAction = entry.actions[entry.actions.length - 1];
      const actionDescription =
        entry.actionDescription ||
        lastOutcome?.actionDescription ||
        lastCachedAction?.description ||
        entry.instruction;

      const shouldRefresh =
        success &&
        actions.length > 0 &&
        this.haveActionsChanged(entry.actions, actions);
      if (shouldRefresh) {
        await this.refreshCacheEntry(context, {
          ...entry,
          actions,
          message,
          actionDescription,
        });
      }

      return { success, message, actionDescription, actions };
    };

    return withTimeout(replay(), timeout, "act()");
  }

  /**
   * Reports whether two action lists differ.
   *
   * Lists differ when their lengths differ or when, at any position, the
   * selector, description, method (missing treated as ""), or argument list
   * (missing treated as empty, compared element by element with `!==`)
   * is not the same.
   */
  private haveActionsChanged(original: Action[], updated: Action[]): boolean {
    if (original.length !== updated.length) {
      return true;
    }

    for (const [index, before] of original.entries()) {
      const after = updated[index];
      if (!after) {
        return true;
      }

      const scalarFieldsDiffer =
        before.selector !== after.selector ||
        before.description !== after.description ||
        (before.method ?? "") !== (after.method ?? "");
      if (scalarFieldsDiffer) {
        return true;
      }

      const beforeArgs = before.arguments ?? [];
      const afterArgs = after.arguments ?? [];
      if (beforeArgs.length !== afterArgs.length) {
        return true;
      }
      for (const [argIndex, beforeArg] of beforeArgs.entries()) {
        if (beforeArg !== afterArgs[argIndex]) {
          return true;
        }
      }
    }

    return false;
  }

  /**
   * Overwrites the cached entry for `context` with `entry`, using the
   * context's variable names. A write failure is logged, not thrown.
   */
  private async refreshCacheEntry(
    context: ActCacheContext,
    entry: CachedActEntry,
  ): Promise<void> {
    const refreshedEntry = { ...entry, variableKeys: context.variableKeys };
    const writeOutcome = await this.storage.writeJson(
      `${context.cacheKey}.json`,
      refreshedEntry,
    );

    const writeFailed = Boolean(writeOutcome.error && writeOutcome.path);
    if (writeFailed) {
      this.logger({
        category: "cache",
        message: "failed to update act cache entry after self-heal",
        level: 0,
        auxiliary: {
          error: { value: String(writeOutcome.error), type: "string" },
        },
      });
      return;
    }

    this.logger({
      category: "cache",
      message: "act cache entry updated after self-heal",
      level: 2,
      auxiliary: {
        instruction: { value: context.instruction, type: "string" },
        url: { value: context.pageUrl, type: "string" },
      },
    });
  }

  /**
   * True when both lists have the same length and the same name at every
   * position. The comparison is order-sensitive.
   */
  private doVariableKeysMatch(
    entryKeys: string[],
    contextKeys: string[],
  ): boolean {
    let index = entryKeys.length;
    if (index !== contextKeys.length) {
      return false;
    }
    while (index > 0) {
      index -= 1;
      if (entryKeys[index] !== contextKeys[index]) {
        return false;
      }
    }
    return true;
  }

  /**
   * True when every name in `variableKeys` is present in `variables`
   * (checked with `in`, so the value itself is not inspected).
   */
  private hasAllVariableValues(
    variableKeys: string[],
    variables: Record<string, string>,
  ): boolean {
    let allPresent = true;
    for (const name of variableKeys) {
      if (name in variables) {
        continue;
      }
      allPresent = false;
      break;
    }
    return allPresent;
  }
}


================================================
FILE: packages/core/lib/v3/cache/AgentCache.ts
================================================
import { createHash } from "crypto";
import type { ActHandler } from "../handlers/actHandler.js";
import type { LLMClient } from "../llm/LLMClient.js";
import type {
  AgentReplayActStep,
  AgentReplayFillFormStep,
  AgentReplayGotoStep,
  AgentReplayKeysStep,
  AgentReplayNavBackStep,
  AgentReplayScrollStep,
  AgentReplayStep,
  AgentReplayWaitStep,
  CachedAgentEntry,
  SanitizedAgentExecuteOptions,
  ActFn,
  AgentCacheContext,
  AgentCacheDeps,
  AgentCacheTransferPayload,
} from "../types/private/index.js";
import type {
  Action,
  AgentResult,
  AgentStreamResult,
  AgentConfig,
  AgentExecuteOptionsBase,
  AvailableModel,
  Logger,
} from "../types/public/index.js";
import type { Page } from "../understudy/page.js";
import type { V3Context } from "../understudy/context.js";
import { CacheStorage } from "./CacheStorage.js";
import {
  cloneForCache,
  safeGetPageUrl,
  waitForCachedSelector,
} from "./utils.js";

// Lower-cased model option names that are dropped when model options are
// sanitized for the cache signature (keys are compared after toLowerCase()).
const SENSITIVE_CONFIG_KEYS = new Set(["apikey", "api_key", "api-key"]);

export class AgentCache {
  private readonly storage: CacheStorage;
  private readonly logger: Logger;
  private readonly getActHandler: () => ActHandler | null;
  private readonly getContext: () => V3Context | null;
  private readonly getDefaultLlmClient: () => LLMClient;
  private readonly getBaseModelName: () => AvailableModel;
  private readonly getSystemPrompt: () => string | undefined;
  private readonly domSettleTimeoutMs?: number;
  private readonly act: ActFn;
  private readonly bufferLatestEntry: boolean;

  private recording: AgentReplayStep[] | null = null;
  private latestEntry: AgentCacheTransferPayload | null = null;

  /**
   * Captures the collaborators the cache needs.
   *
   * @param deps - Storage, logger, accessor callbacks, the `act` function and
   *   flags; `bufferLatestEntry` defaults to `false` when omitted.
   */
  constructor(deps: AgentCacheDeps) {
    this.storage = deps.storage;
    this.logger = deps.logger;
    this.getActHandler = deps.getActHandler;
    this.getContext = deps.getContext;
    this.getDefaultLlmClient = deps.getDefaultLlmClient;
    this.getBaseModelName = deps.getBaseModelName;
    this.getSystemPrompt = deps.getSystemPrompt;
    this.domSettleTimeoutMs = deps.domSettleTimeoutMs;
    this.act = deps.act;
    this.bufferLatestEntry = deps.bufferLatestEntry ?? false;
  }

  /** Whether the underlying storage is enabled. */
  get enabled(): boolean {
    const { enabled } = this.storage;
    return enabled;
  }

  /**
   * Decides whether caching applies to an instruction.
   *
   * @param instruction - The raw agent instruction.
   * @returns `true` when the cache is enabled and the instruction is not blank.
   */
  shouldAttemptCache(instruction: string): boolean {
    if (!this.enabled) return false;
    return instruction.trim().length > 0;
  }

  /**
   * Reduces execute options to the fields kept for caching.
   *
   * Only a numeric `maxSteps` and a boolean `highlightCursor` are copied;
   * everything else is dropped.
   *
   * @param options - Options passed to the agent, if any.
   * @returns A new object holding just the retained fields.
   */
  sanitizeExecuteOptions(
    options?: AgentExecuteOptionsBase,
  ): SanitizedAgentExecuteOptions {
    const sanitized: SanitizedAgentExecuteOptions = {};
    if (!options) return sanitized;

    const { maxSteps } = options;
    if (typeof maxSteps === "number") {
      sanitized.maxSteps = maxSteps;
    }

    if ("highlightCursor" in options) {
      // highlightCursor is not declared on the base options type, hence the cast.
      const { highlightCursor } = options as { highlightCursor?: unknown };
      if (typeof highlightCursor === "boolean") {
        sanitized.highlightCursor = highlightCursor;
      }
    }

    return sanitized;
  }

  /**
   * Serializes the agent configuration into a JSON string that becomes part
   * of the cache key.
   *
   * The signature covers the base model name, the global system prompt, and
   * the agent's CUA flag, model, execution model, system prompt, sorted tool
   * names and integrations. Non-string integrations are recorded as "client".
   * The execution model is recorded as `null` in CUA mode.
   *
   * @param agentOptions - Agent configuration, if any.
   * @returns The JSON signature string.
   */
  buildConfigSignature(agentOptions?: AgentConfig): string {
    const tools = agentOptions?.tools;
    const toolKeys = tools ? Object.keys(tools).sort() : undefined;

    const integrations = agentOptions?.integrations;
    const integrationSignatures = integrations
      ? integrations.map((integration) =>
          typeof integration === "string" ? integration : "client",
        )
      : undefined;

    const serializedModel = this.serializeAgentModelForCache(
      agentOptions?.model,
    );
    const serializedExecutionModel = this.serializeAgentModelForCache(
      agentOptions?.executionModel,
    );

    // An explicit `mode` wins over the `cua` flag.
    const mode = agentOptions?.mode;
    const isCuaMode =
      mode === undefined ? agentOptions?.cua === true : mode === "cua";

    const agentSignature = {
      cua: isCuaMode,
      model: serializedModel ?? null,
      executionModel: isCuaMode ? null : serializedExecutionModel,
      systemPrompt: agentOptions?.systemPrompt ?? null,
      toolKeys,
      integrations: integrationSignatures,
    };

    return JSON.stringify({
      v3Model: this.getBaseModelName(),
      systemPrompt: this.getSystemPrompt() ?? "",
      agent: agentSignature,
    });
  }

  /**
   * Builds the cache context for an agent run.
   *
   * @param params - Instruction, sanitized options, config signature, page and
   *   optional variables.
   * @returns The context (trimmed instruction, start URL, sorted variable keys
   *   and derived cache key), or `null` when caching does not apply.
   */
  async prepareContext(params: {
    instruction: string;
    options: SanitizedAgentExecuteOptions;
    configSignature: string;
    page: Page;
    variables?: Record<string, string>;
  }): Promise<AgentCacheContext | null> {
    const { options, configSignature, page, variables } = params;
    if (!this.shouldAttemptCache(params.instruction)) {
      return null;
    }

    const instruction = params.instruction.trim();
    const startUrl = await safeGetPageUrl(page);
    // Only the variable names take part in the key, in sorted order.
    const variableKeys = variables ? Object.keys(variables).sort() : [];
    const cacheKey = this.buildAgentCacheKey(
      instruction,
      startUrl,
      options,
      configSignature,
      variableKeys,
    );

    return {
      instruction,
      startUrl,
      options,
      configSignature,
      cacheKey,
      variableKeys,
      variables,
    };
  }

  /**
   * Looks up the cached entry for `context` and replays it if found.
   *
   * @param context - Cache context for the current run.
   * @param llmClientOverride - Optional LLM client forwarded to the replay.
   * @returns The replayed result, or `null` when the cache is disabled, the
   *   entry is missing, unreadable or not version 1, or the replay itself
   *   yields `null`.
   */
  async tryReplay(
    context: AgentCacheContext,
    llmClientOverride?: LLMClient,
  ): Promise<AgentResult | null> {
    if (!this.enabled) return null;

    const lookup = await this.storage.readJson<CachedAgentEntry>(
      `agent-${context.cacheKey}.json`,
    );
    if (lookup.error && lookup.path) {
      this.logger({
        category: "cache",
        message: `failed to read agent cache entry: ${lookup.path}`,
        level: 1,
        auxiliary: {
          error: { value: String(lookup.error), type: "string" },
        },
      });
      return null;
    }

    const entry = lookup.value;
    if (!entry || entry.version !== 1) {
      return null;
    }

    this.logger({
      category: "cache",
      message: "agent cache hit",
      level: 1,
      auxiliary: {
        instruction: { value: context.instruction, type: "string" },
        url: { value: context.startUrl, type: "string" },
      },
    });

    return await this.replayAgentCacheEntry(context, entry, llmClientOverride);
  }

  /**
   * Stream-flavoured counterpart of `tryReplay()`.
   *
   * The agent API has two entry points: `execute()` resolves to an
   * AgentResult, while `stream()` returns an AgentStreamResult. On a cache
   * hit this method replays the entry via `tryReplay()` and wraps the outcome
   * in a stream-shaped object, so `stream()` callers can still iterate
   * `textStream` and await `result` when the answer comes from cache.
   *
   * @param context - Cache context for the current run.
   * @param llmClientOverride - Optional LLM client forwarded to the replay.
   * @returns The wrapped cached result, or `null` when nothing was replayed.
   */
  async tryReplayAsStream(
    context: AgentCacheContext,
    llmClientOverride?: LLMClient,
  ): Promise<AgentStreamResult | null> {
    const replayed = await this.tryReplay(context, llmClientOverride);
    return replayed ? this.createCachedStreamResult(replayed) : null;
  }

  /**
   * Builds an AgentStreamResult-shaped object around a cached AgentResult.
   *
   * A cache hit has no live LLM stream to consume, only the final result, so
   * this method fabricates one: the text stream yields the cached message
   * once, the full stream yields a single "text-delta" followed by "finish",
   * and the promise-valued fields resolve immediately with the cached result,
   * zeroed usage and placeholder metadata.
   *
   * The object is hand-built and cast to AgentStreamResult, so consumers can
   * use the same iteration patterns whether the result is live or cached.
   *
   * @param cachedResult - The result obtained from replaying the cache entry.
   * @returns A stream-compatible wrapper around `cachedResult`.
   */
  private createCachedStreamResult(
    cachedResult: AgentResult,
  ): AgentStreamResult {
    const message = cachedResult.message ?? "";

    const textStreamGenerator = async function* (): AsyncGenerator<string> {
      yield message;
    };

    const fullStreamGenerator = async function* (): AsyncGenerator<{
      type: string;
      textDelta?: string;
    }> {
      yield { type: "text-delta", textDelta: message };
      yield { type: "finish" };
    };

    const zeroUsage = {
      promptTokens: 0,
      completionTokens: 0,
      totalTokens: 0,
    };
    const placeholderResponse = {
      id: "cached",
      timestamp: new Date(),
      modelId: "cached",
    };

    return {
      textStream: textStreamGenerator(),
      fullStream: fullStreamGenerator(),
      result: Promise.resolve(cachedResult),
      text: Promise.resolve(message),
      usage: Promise.resolve(zeroUsage),
      finishReason: Promise.resolve("stop" as const),
      experimental_providerMetadata: Promise.resolve(undefined),
      response: Promise.resolve(placeholderResponse),
      rawResponse: Promise.resolve({ headers: {} }),
      warnings: Promise.resolve([]),
      steps: Promise.resolve([]),
      toolCalls: Promise.resolve([]),
      toolResults: Promise.resolve([]),
      // Iterating the object itself gets a fresh text generator each time.
      [Symbol.asyncIterator]: () => textStreamGenerator(),
    } as unknown as AgentStreamResult;
  }

  /**
   * Wraps an AgentStreamResult with caching logic.
   *
   * Steps performed:
   * 1. Begins recording agent replay steps.
   * 2. Replaces the stream's `result` promise with a wrapped one.
   * 3. On success: ends recording and stores the cache entry when the run
   *    succeeded and at least one step was recorded.
   * 4. On error: discards the recording and rethrows.
   *
   * Storing is best-effort: if it throws (for example because the result
   * cannot be serialized), the failure is logged and the original result is
   * still returned, so a cache problem never fails a successful run.
   *
   * This keeps the caching orchestration in AgentCache rather than
   * spreading it across the V3 class.
   *
   * @param context - The cache context for this execution
   * @param streamResult - The stream result from the agent handler
   * @param beginRecording - Callback to start recording (from V3)
   * @param endRecording - Callback to end recording and get steps (from V3)
   * @param discardRecording - Callback to discard recording on error (from V3)
   * @returns The same stream result object, with `result` wrapped
   */
  wrapStreamForCaching(
    context: AgentCacheContext,
    streamResult: AgentStreamResult,
    beginRecording: () => void,
    endRecording: () => AgentReplayStep[],
    discardRecording: () => void,
  ): AgentStreamResult {
    beginRecording();

    const originalResultPromise = streamResult.result;
    const wrappedResultPromise = originalResultPromise.then(
      async (result) => {
        const agentSteps = endRecording();

        if (result.success && agentSteps.length > 0) {
          try {
            await this.store(context, agentSteps, result);
          } catch (err) {
            // Caching is an optimization; never let it reject the run's result.
            this.logger({
              category: "cache",
              message: "failed to store agent cache entry for streamed run",
              level: 1,
              auxiliary: {
                error: { value: String(err), type: "string" },
              },
            });
          }
        }

        return result;
      },
      (error) => {
        discardRecording();
        throw error;
      },
    );

    streamResult.result = wrappedResultPromise;
    return streamResult;
  }

  /**
   * Persists a recorded agent run under `agent-<cacheKey>.json`.
   *
   * Does nothing when the cache is disabled. A failed write is logged and
   * ends the call. After a successful write, and only when
   * `bufferLatestEntry` is set, a copy of the entry is kept for
   * `consumeBufferedEntry()`.
   *
   * @param context - Cache context for the run.
   * @param steps - Recorded replay steps.
   * @param result - Agent result; stored in pruned form.
   */
  async store(
    context: AgentCacheContext,
    steps: AgentReplayStep[],
    result: AgentResult,
  ): Promise<void> {
    if (!this.enabled) return;

    const { cacheKey, instruction, startUrl, options, configSignature } =
      context;
    const entry: CachedAgentEntry = {
      version: 1,
      instruction,
      startUrl,
      options,
      configSignature,
      steps: cloneForCache(steps),
      result: this.pruneAgentResult(result),
      timestamp: new Date().toISOString(),
    };

    const written = await this.storage.writeJson(
      `agent-${cacheKey}.json`,
      entry,
    );
    if (written.error && written.path) {
      this.logger({
        category: "cache",
        message: "failed to write agent cache entry",
        level: 1,
        auxiliary: {
          error: { value: String(written.error), type: "string" },
        },
      });
      return;
    }

    this.logger({
      category: "cache",
      message: "agent cache stored",
      level: 2,
      auxiliary: {
        instruction: { value: instruction, type: "string" },
        steps: { value: String(steps.length), type: "string" },
      },
    });

    if (!this.bufferLatestEntry) return;
    this.latestEntry = { cacheKey, entry: cloneForCache(entry) };
  }

  /**
   * Hands out the most recently buffered entry and clears the buffer.
   *
   * @returns The buffered payload, or `null` when buffering is off or nothing
   *   is buffered.
   */
  consumeBufferedEntry(): AgentCacheTransferPayload | null {
    const buffered = this.bufferLatestEntry ? this.latestEntry : null;
    if (!buffered) {
      return null;
    }

    this.latestEntry = null;
    return buffered;
  }

  /**
   * Writes an entry received as a transfer payload into local storage under
   * `agent-<cacheKey>.json`.
   *
   * Does nothing when the cache is disabled or the payload is `null`. The
   * outcome (failure or success) is logged.
   *
   * @param payload - Cache key and entry to import, or `null`.
   */
  async storeTransferredEntry(
    payload: AgentCacheTransferPayload | null,
  ): Promise<void> {
    if (!payload || !this.enabled) return;

    const importedEntry = cloneForCache(payload.entry);
    const written = await this.storage.writeJson(
      `agent-${payload.cacheKey}.json`,
      importedEntry,
    );

    if (written.error && written.path) {
      this.logger({
        category: "cache",
        message: "failed to import remote agent cache entry",
        level: 0,
        auxiliary: {
          error: { value: String(written.error), type: "string" },
        },
      });
      return;
    }

    const stepCount = importedEntry.steps?.length ?? 0;
    this.logger({
      category: "cache",
      message: "agent cache imported from server",
      level: 2,
      auxiliary: {
        instruction: { value: importedEntry.instruction, type: "string" },
        steps: { value: String(stepCount), type: "string" },
      },
    });
  }

  /**
   * Produces a copy of the agent result suitable for persisting: screenshot
   * actions lose their `base64` payload so cache entries stay compact. The
   * live AgentResult handed to callers is never mutated, because pruning is
   * applied to a clone.
   *
   * @param result - The live agent result.
   * @returns The pruned clone.
   */
  private pruneAgentResult(result: AgentResult): AgentResult {
    const pruned = cloneForCache(result);

    if (Array.isArray(pruned.actions)) {
      for (const action of pruned.actions) {
        if (action?.type !== "screenshot") continue;
        delete action.base64;
      }
    }

    return pruned;
  }

  /** Starts a new recording, replacing any steps recorded so far. */
  beginRecording(): void {
    const freshRecording: AgentReplayStep[] = [];
    this.recording = freshRecording;
  }

  /**
   * Stops recording and hands back a copy of the recorded steps.
   *
   * @returns The cloned steps, or an empty array when no recording was active.
   */
  endRecording(): AgentReplayStep[] {
    const recorded = this.recording;
    if (!recorded) return [];

    const snapshot = cloneForCache(recorded);
    this.recording = null;
    return snapshot;
  }

  /** Drops the current recording, if any, without returning its steps. */
  discardRecording(): void {
    this.recording = null;
  }

  /** Whether a recording is currently in progress. */
  isRecording(): boolean {
    const current = this.recording;
    return Array.isArray(current);
  }

  /**
   * Appends a copy of `step` to the active recording.
   *
   * Ignored when no recording is in progress. If the step cannot be cloned,
   * the failure is logged and the step is skipped.
   *
   * @param step - The replay step to record.
   */
  recordStep(step: AgentReplayStep): void {
    if (!this.isRecording()) return;

    let snapshot: AgentReplayStep;
    try {
      snapshot = cloneForCache(step);
    } catch (err) {
      this.logger({
        category: "cache",
        message: "failed to record agent replay step",
        level: 2,
        auxiliary: {
          error: { value: String(err), type: "string" },
        },
      });
      return;
    }

    this.recording!.push(snapshot);
  }

  /**
   * Returns the same value as `isRecording()`.
   * NOTE(review): the name suggests replay state, but the implementation
   * reports recording state — confirm this is intended.
   */
  isReplayActive(): boolean {
    const recordingInProgress = this.isRecording();
    return recordingInProgress;
  }

  /**
   * Converts an agent model setting into its cache-signature form.
   *
   * @param model - A model name, a model configuration object, or nothing.
   * @returns `null` when no model is given; the model name when the setting
   *   is a string or carries no options that survive sanitizing; otherwise
   *   the name together with the sanitized options.
   */
  private serializeAgentModelForCache(
    model?: AgentConfig["model"],
  ): null | string | { modelName: string; options?: Record<string, unknown> } {
    if (!model) return null;
    if (typeof model === "string") return model;

    const { modelName, ...modelOptions } = model;
    if (Object.keys(modelOptions).length === 0) {
      return modelName;
    }

    const sanitizedOptions = this.sanitizeModelOptionsForCache(
      modelOptions as Record<string, unknown>,
    );
    if (!sanitizedOptions) {
      return modelName;
    }
    return { modelName, options: sanitizedOptions };
  }

  /**
   * Derives the cache key: the hex SHA-256 digest of the JSON-serialized
   * instruction, start URL, options, config signature and variable keys.
   *
   * @param instruction - Trimmed agent instruction.
   * @param startUrl - URL of the page when the run started.
   * @param options - Sanitized execute options.
   * @param configSignature - Signature from `buildConfigSignature()`.
   * @param variableKeys - Variable names; treated as empty when omitted.
   * @returns The hex digest.
   */
  private buildAgentCacheKey(
    instruction: string,
    startUrl: string,
    options: SanitizedAgentExecuteOptions,
    configSignature: string,
    variableKeys?: string[],
  ): string {
    const serialized = JSON.stringify({
      instruction,
      startUrl,
      options,
      configSignature,
      variableKeys: variableKeys ?? [],
    });
    const hasher = createHash("sha256");
    hasher.update(serialized);
    return hasher.digest("hex");
  }

  /**
   * Copies model options while dropping sensitive keys (matched
   * case-insensitively) and entries whose sanitized value is `undefined`.
   *
   * @param value - Raw options object.
   * @returns The sanitized object, or `undefined` when nothing remains.
   */
  private sanitizeModelOptionsForCache(
    value: Record<string, unknown>,
  ): Record<string, unknown> | undefined {
    const kept: Record<string, unknown> = {};

    Object.entries(value).forEach(([key, rawValue]) => {
      if (SENSITIVE_CONFIG_KEYS.has(key.toLowerCase())) return;

      const cleaned = this.sanitizeModelValueForCache(rawValue);
      if (cleaned === undefined) return;

      kept[key] = cleaned;
    });

    if (Object.keys(kept).length === 0) {
      return undefined;
    }
    return kept;
  }

  /**
   * Sanitizes a single option value recursively.
   *
   * Arrays are sanitized element by element, dropping elements that become
   * `undefined`. Non-null objects go through
   * `sanitizeModelOptionsForCache()`. Anything else is returned unchanged.
   *
   * @param value - The value to sanitize.
   * @returns The sanitized value.
   */
  private sanitizeModelValueForCache(value: unknown): unknown {
    if (Array.isArray(value)) {
      const cleanedItems: unknown[] = [];
      for (const item of value) {
        const cleaned = this.sanitizeModelValueForCache(item);
        if (cleaned !== undefined) {
          cleanedItems.push(cleaned);
        }
      }
      return cleanedItems;
    }

    const isObjectLike = typeof value === "object" && value !== null;
    if (!isObjectLike) {
      return value;
    }

    return this.sanitizeModelOptionsForCache(value as Record<string, unknown>);
  }

  /**
   * Replays every step of a cached entry and returns the cached result.
   *
   * The returned result is a clone with usage zeroed and `metadata` marked as
   * a cache hit. If any replayed step differs from its cached form, the
   * stored entry is rewritten with the updated steps.
   *
   * @param context - Cache context for the current run.
   * @param entry - The cached entry to replay.
   * @param llmClientOverride - Optional client used instead of the default.
   * @returns The result, or `null` when no context or act handler is
   *   available or when anything throws during the replay (logged).
   */
  private async replayAgentCacheEntry(
    context: AgentCacheContext,
    entry: CachedAgentEntry,
    llmClientOverride?: LLMClient,
  ): Promise<AgentResult | null> {
    const ctx = this.getContext();
    const handler = this.getActHandler();
    if (!ctx || !handler) return null;

    const effectiveClient = llmClientOverride ?? this.getDefaultLlmClient();

    try {
      const replayedSteps: AgentReplayStep[] = [];
      let healed = false;

      for (const cachedStep of entry.steps ?? []) {
        const outcome = await this.executeAgentReplayStep(
          cachedStep,
          ctx,
          handler,
          effectiveClient,
          context.variables,
        );
        const replayedStep = outcome ?? cachedStep;
        // A different object identity means the step was updated in replay.
        if (replayedStep !== cachedStep) {
          healed = true;
        }
        replayedSteps.push(replayedStep);
      }

      const result = cloneForCache(entry.result);
      result.usage = {
        input_tokens: 0,
        output_tokens: 0,
        reasoning_tokens: 0,
        cached_input_tokens: 0,
        inference_time_ms: 0,
      };
      result.metadata = {
        ...(result.metadata ?? {}),
        cacheHit: true,
        cacheTimestamp: entry.timestamp,
      };

      if (healed) {
        await this.refreshAgentCacheEntry(context, entry, replayedSteps);
      }
      return result;
    } catch (err) {
      this.logger({
        category: "cache",
        message: "agent cache replay failed",
        level: 1,
        auxiliary: {
          error: { value: String(err), type: "string" },
        },
      });
      return null;
    }
  }

  /**
   * Dispatches one cached step to the replay routine for its type.
   *
   * "act" and "fillForm" steps may come back updated. Navigation, scroll,
   * wait and key steps are executed and returned as-is. "done", "extract",
   * "screenshot" and "ariaTree" steps are returned without doing anything.
   * Any other type is logged and returned untouched.
   *
   * @param step - The cached step.
   * @param ctx - Browser context used to obtain the active page.
   * @param handler - Act handler used for deterministic actions.
   * @param llmClient - LLM client passed to the act handler.
   * @param variables - Optional variables forwarded to act-style steps.
   * @returns The original step, or an updated copy of it.
   */
  private async executeAgentReplayStep(
    step: AgentReplayStep,
    ctx: V3Context,
    handler: ActHandler,
    llmClient: LLMClient,
    variables?: Record<string, string>,
  ): Promise<AgentReplayStep> {
    switch (step.type) {
      case "act":
        return await this.replayAgentActStep(
          step as AgentReplayActStep,
          ctx,
          handler,
          llmClient,
          variables,
        );
      case "fillForm":
        return await this.replayAgentFillFormStep(
          step as AgentReplayFillFormStep,
          ctx,
          handler,
          llmClient,
          variables,
        );
      case "goto":
        await this.replayAgentGotoStep(step as AgentReplayGotoStep, ctx);
        break;
      case "scroll":
        await this.replayAgentScrollStep(step as AgentReplayScrollStep, ctx);
        break;
      case "wait":
        await this.replayAgentWaitStep(step as AgentReplayWaitStep);
        break;
      case "navback":
        await this.replayAgentNavBackStep(step as AgentReplayNavBackStep, ctx);
        break;
      case "keys":
        await this.replayAgentKeysStep(step as AgentReplayKeysStep, ctx);
        break;
      case "done":
      case "extract":
      case "screenshot":
      case "ariaTree":
        // Nothing to replay for these step types.
        break;
      default:
        this.logger({
          category: "cache",
          message: `agent cache skipping step type: ${step.type}`,
          level: 2,
        });
        break;
    }
    return step;
  }

  /**
   * Replays a cached "act" step.
   *
   * When the step has cached actions, each one is executed deterministically
   * on the active page after waiting for its selector. When it has none, the
   * step's instruction is run through `act` instead.
   *
   * @param step - The cached act step.
   * @param ctx - Browser context used to obtain the active page.
   * @param handler - Act handler that performs the deterministic actions.
   * @param llmClient - LLM client passed to the act handler.
   * @param variables - Optional variables forwarded to the action.
   * @returns The same step, or a copy carrying the updated actions when they
   *   differ from the cached ones.
   */
  private async replayAgentActStep(
    step: AgentReplayActStep,
    ctx: V3Context,
    handler: ActHandler,
    llmClient: LLMClient,
    variables?: Record<string, string>,
  ): Promise<AgentReplayActStep> {
    const cachedActions = Array.isArray(step.actions) ? step.actions : [];

    if (cachedActions.length === 0) {
      await this.act(step.instruction, { timeout: step.timeout, variables });
      return step;
    }

    const page = await ctx.awaitActivePage();
    const replayedActions: Action[] = [];
    for (const cachedAction of cachedActions) {
      await waitForCachedSelector({
        page,
        selector: cachedAction.selector,
        timeout: this.domSettleTimeoutMs,
        logger: this.logger,
        context: "agent act",
      });
      const outcome = await handler.takeDeterministicAction(
        cachedAction,
        page,
        this.domSettleTimeoutMs,
        llmClient,
        undefined,
        variables,
      );
      // Keep the cached action unless the handler reported success with actions.
      if (outcome.success && Array.isArray(outcome.actions)) {
        replayedActions.push(...cloneForCache(outcome.actions));
      } else {
        replayedActions.push(cloneForCache(cachedAction));
      }
    }

    return this.haveActionsChanged(cachedActions, replayedActions)
      ? { ...step, actions: replayedActions }
      : step;
  }

  /**
   * Replays a cached "fillForm" step.
   *
   * Uses the step's `actions` when non-empty, otherwise its
   * `observeResults`. Each action is executed deterministically on the
   * active page after waiting for its selector.
   *
   * @param step - The cached fillForm step.
   * @param ctx - Browser context used to obtain the active page.
   * @param handler - Act handler that performs the deterministic actions.
   * @param llmClient - LLM client passed to the act handler.
   * @param variables - Optional variables forwarded to the action.
   * @returns The same step when there is nothing to replay or nothing
   *   changed; otherwise a copy carrying the updated actions.
   */
  private async replayAgentFillFormStep(
    step: AgentReplayFillFormStep,
    ctx: V3Context,
    handler: ActHandler,
    llmClient: LLMClient,
    variables?: Record<string, string>,
  ): Promise<AgentReplayFillFormStep> {
    const hasRecordedActions =
      Array.isArray(step.actions) && step.actions.length > 0;
    const cachedActions = hasRecordedActions
      ? step.actions
      : (step.observeResults ?? []);
    if (!Array.isArray(cachedActions) || cachedActions.length === 0) {
      return step;
    }

    const page = await ctx.awaitActivePage();
    const replayedActions: Action[] = [];
    for (const cachedAction of cachedActions) {
      await waitForCachedSelector({
        page,
        selector: cachedAction.selector,
        timeout: this.domSettleTimeoutMs,
        logger: this.logger,
        context: "fillForm",
      });
      const outcome = await handler.takeDeterministicAction(
        cachedAction,
        page,
        this.domSettleTimeoutMs,
        llmClient,
        undefined, // ensureTimeRemaining is not used in this context
        variables,
      );
      if (outcome.success && Array.isArray(outcome.actions)) {
        replayedActions.push(...cloneForCache(outcome.actions));
      } else {
        replayedActions.push(cloneForCache(cachedAction));
      }
    }

    return this.haveActionsChanged(cachedActions, replayedActions)
      ? { ...step, actions: replayedActions }
      : step;
  }

  /**
   * Navigates the active page to the step's URL, waiting for the step's
   * `waitUntil` event ("load" when unspecified).
   *
   * @param step - The cached goto step.
   * @param ctx - Browser context used to obtain the active page.
   */
  private async replayAgentGotoStep(
    step: AgentReplayGotoStep,
    ctx: V3Context,
  ): Promise<void> {
    const activePage = await ctx.awaitActivePage();
    const waitUntil = step.waitUntil ?? "load";
    await activePage.goto(step.url, { waitUntil });
  }

  /**
   * Scrolls the active page by the step's deltas at its anchor point.
   *
   * When the step has no anchor, the centre of the viewport (computed in the
   * page's main frame) is used. Missing deltas and coordinates count as 0,
   * and coordinates are rounded.
   *
   * @param step - The cached scroll step.
   * @param ctx - Browser context used to obtain the active page.
   */
  private async replayAgentScrollStep(
    step: AgentReplayScrollStep,
    ctx: V3Context,
  ): Promise<void> {
    const page = await ctx.awaitActivePage();

    const anchor =
      step.anchor ||
      (await page.mainFrame().evaluate<{ x: number; y: number }>(() => ({
        x: Math.max(0, Math.floor(window.innerWidth / 2)),
        y: Math.max(0, Math.floor(window.innerHeight / 2)),
      })));

    const anchorX = Math.round(anchor.x ?? 0);
    const anchorY = Math.round(anchor.y ?? 0);
    await page.scroll(anchorX, anchorY, step.deltaX ?? 0, step.deltaY ?? 0);
  }

  /**
   * Sleeps for the step's `timeMs`; returns immediately when the duration is
   * missing, zero or negative.
   *
   * @param step - The cached wait step.
   */
  private async replayAgentWaitStep(step: AgentReplayWaitStep): Promise<void> {
    const { timeMs } = step;
    const shouldWait = Boolean(timeMs) && timeMs > 0;
    if (!shouldWait) return;
    await new Promise((resolve) => setTimeout(resolve, timeMs));
  }

  /**
   * Goes back in the active page's history, waiting for the step's
   * `waitUntil` event ("domcontentloaded" when unspecified).
   *
   * @param step - The cached navback step.
   * @param ctx - Browser context used to obtain the active page.
   */
  private async replayAgentNavBackStep(
    step: AgentReplayNavBackStep,
    ctx: V3Context,
  ): Promise<void> {
    const activePage = await ctx.awaitActivePage();
    const waitUntil = step.waitUntil ?? "domcontentloaded";
    await activePage.goBack({ waitUntil });
  }

  /**
   * Replays a keyboard step on the active page.
   *
   * A "type" step with text types it; a "press" step with keys presses them.
   * Either is repeated `times` times (at least once) with a 100 ms delay
   * option. Any other combination does nothing.
   *
   * @param step - The cached keys step.
   * @param ctx - Browser context used to obtain the active page.
   */
  private async replayAgentKeysStep(
    step: AgentReplayKeysStep,
    ctx: V3Context,
  ): Promise<void> {
    const page = await ctx.awaitActivePage();
    const { method, text, keys, times } = step.playwrightArguments;
    const repeatCount = Math.max(1, times ?? 1);

    let perform: (() => Promise<unknown>) | undefined;
    if (method === "type" && text) {
      perform = () => page.type(text, { delay: 100 });
    } else if (method === "press" && keys) {
      perform = () => page.keyPress(keys, { delay: 100 });
    }
    if (!perform) return;

    for (let remaining = repeatCount; remaining > 0; remaining -= 1) {
      await perform();
    }
  }

  /**
   * Compares two action lists position by position.
   *
   * Actions differ when their selector, description, method or arguments
   * differ; a missing description or method counts as an empty string and
   * non-array arguments count as an empty list.
   *
   * @param original - Actions as stored in the cache.
   * @param updated - Actions produced by the replay.
   * @returns `true` when the lists differ in length or in any action.
   */
  private haveActionsChanged(original: Action[], updated: Action[]): boolean {
    if (original.length !== updated.length) return true;

    for (let index = 0; index < original.length; index += 1) {
      const before = original[index];
      const after = updated[index];
      if (!before || !after) return true;

      const sameFields =
        before.selector === after.selector &&
        (before.description ?? "") === (after.description ?? "") &&
        (before.method ?? "") === (after.method ?? "");
      if (!sameFields) return true;

      const beforeArgs = Array.isArray(before.arguments)
        ? before.arguments
        : [];
      const afterArgs = Array.isArray(after.arguments) ? after.arguments : [];
      if (beforeArgs.length !== afterArgs.length) return true;

      let argIndex = 0;
      while (argIndex < beforeArgs.length) {
        if (beforeArgs[argIndex] !== afterArgs[argIndex]) return true;
        argIndex += 1;
      }
    }

    return false;
  }

  /**
   * Rewrites the stored entry for `context.cacheKey` with updated steps and a
   * fresh timestamp. The outcome (failure or success) is logged.
   *
   * @param context - Cache context supplying the key and instruction.
   * @param entry - The entry that was replayed.
   * @param updatedSteps - Steps to store in place of the cached ones.
   */
  private async refreshAgentCacheEntry(
    context: AgentCacheContext,
    entry: CachedAgentEntry,
    updatedSteps: AgentReplayStep[],
  ): Promise<void> {
    const refreshedEntry: CachedAgentEntry = {
      ...entry,
      steps: cloneForCache(updatedSteps),
      timestamp: new Date().toISOString(),
    };

    const written = await this.storage.writeJson(
      `agent-${context.cacheKey}.json`,
      refreshedEntry,
    );

    if (written.error && written.path) {
      this.logger({
        category: "cache",
        message: "failed to update agent cache entry after self-heal",
        level: 0,
        auxiliary: {
          error: { value: String(written.error), type: "string" },
        },
      });
      return;
    }

    this.logger({
      category: "cache",
      message: "agent cache entry updated after self-heal",
      level: 2,
      auxiliary: {
        instruction: { value: context.instruction, type: "string" },
        steps: { value: String(updatedSteps.length), type: "string" },
      },
    });
  }
}


================================================
FILE: packages/core/lib/v3/cache/CacheStorage.ts
================================================
import fs from "fs";
import path from "path";
import type { Logger } from "../types/public/index.js";
import { ReadJsonResult, WriteJsonResult } from "../types/private/index.js";

/**
 * Deep-copies a value through a JSON round trip. Values that JSON cannot
 * serialize at all (where `JSON.stringify` yields `undefined`) are returned
 * unchanged.
 */
const jsonClone = <T>(value: T): T => {
  const text = JSON.stringify(value);
  return text === undefined ? value : (JSON.parse(text) as T);
};

/**
 * JSON storage for cache entries, backed by a directory on disk, by an
 * in-memory map, or by nothing at all (disabled).
 *
 * Instances are created through `create()` or `createMemory()`. Read and
 * write failures are reported in the returned result object rather than
 * thrown.
 */
export class CacheStorage {
  private constructor(
    private readonly logger: Logger,
    private readonly dir?: string,
    private readonly memoryStore?: Map<string, unknown>,
  ) {}

  /**
   * Creates a disk-backed storage rooted at `cacheDir`.
   *
   * @param cacheDir - Directory for cache files; storage is disabled when empty.
   * @param logger - Logger used to report an initialization failure.
   * @param options - Optional `label` used in the failure message.
   * @returns Enabled storage, or disabled storage when no directory is given
   *   or the directory cannot be created.
   */
  static create(
    cacheDir: string | undefined,
    logger: Logger,
    options?: { label?: string },
  ): CacheStorage {
    if (!cacheDir) {
      return new CacheStorage(logger);
    }

    const absoluteDir = path.resolve(cacheDir);
    try {
      fs.mkdirSync(absoluteDir, { recursive: true });
    } catch (err) {
      const label = options?.label ?? "cache directory";
      logger({
        category: "cache",
        message: `unable to initialize ${label}: ${absoluteDir}`,
        level: 1,
        auxiliary: {
          error: { value: String(err), type: "string" },
        },
      });
      return new CacheStorage(logger);
    }
    return new CacheStorage(logger, absoluteDir);
  }

  /** Creates storage that keeps entries in an in-memory map. */
  static createMemory(logger: Logger): CacheStorage {
    const store = new Map<string, unknown>();
    return new CacheStorage(logger, undefined, store);
  }

  /** Absolute cache directory, or `undefined` when not disk-backed. */
  get directory(): string | undefined {
    return this.dir;
  }

  /** Whether the storage has a directory or a memory store behind it. */
  get enabled(): boolean {
    return Boolean(this.dir) || Boolean(this.memoryStore);
  }

  /** Joins `fileName` onto the cache directory; `null` without a directory. */
  private resolvePath(fileName: string): string | null {
    return this.dir ? path.join(this.dir, fileName) : null;
  }

  /**
   * Reads and parses a JSON entry.
   *
   * @param fileName - Entry name relative to the storage root.
   * @returns `{ value }` on success; `{ value: null }` when the entry does
   *   not exist or storage is disabled; `{ value: null, error, path }` for
   *   any other read or parse failure.
   */
  async readJson<T>(fileName: string): Promise<ReadJsonResult<T>> {
    const memory = this.memoryStore;
    if (memory) {
      if (!memory.has(fileName)) {
        return { value: null };
      }
      // Hand out a copy so callers cannot mutate the stored entry.
      return { value: jsonClone(memory.get(fileName) as T) };
    }

    const filePath = this.resolvePath(fileName);
    if (!filePath) {
      return { value: null };
    }

    try {
      const raw = await fs.promises.readFile(filePath, "utf8");
      return { value: JSON.parse(raw) as T };
    } catch (err) {
      const isMissing = (err as NodeJS.ErrnoException)?.code === "ENOENT";
      return isMissing
        ? { value: null }
        : { value: null, error: err, path: filePath };
    }
  }

  /**
   * Serializes `data` as JSON and stores it.
   *
   * @param fileName - Entry name relative to the storage root.
   * @param data - Value to store.
   * @returns `{}` on success or when storage is disabled; `{ error, path }`
   *   when writing to disk fails.
   */
  async writeJson(fileName: string, data: unknown): Promise<WriteJsonResult> {
    const memory = this.memoryStore;
    if (memory) {
      memory.set(fileName, jsonClone(data));
      return {};
    }

    const filePath = this.resolvePath(fileName);
    if (!filePath) {
      return {};
    }

    try {
      const parentDir = path.dirname(filePath);
      await fs.promises.mkdir(parentDir, { recursive: true });
      const serialized = JSON.stringify(data, null, 2);
      await fs.promises.writeFile(filePath, serialized, "utf8");
    } catch (err) {
      return { error: err, path: filePath };
    }
    return {};
  }
}


================================================
FILE: packages/core/lib/v3/cache/serverAgentCache.ts
================================================
import { AgentCache } from "./AgentCache.js";
import { CacheStorage } from "./CacheStorage.js";
import type { V3 } from "../v3.js";
import type { AgentCacheTransferPayload } from "../types/private/index.js";
import type { ActHandler } from "../handlers/actHandler.js";
import type { V3Context } from "../understudy/context.js";
import type { AvailableModel, V3Options } from "../types/public/index.js";
import type { ModelConfiguration } from "../types/public/model.js";
import type { LLMClient } from "../llm/LLMClient.js";

/**
 * Handle over a temporarily installed in-memory agent cache, as returned by
 * `__internalCreateInMemoryAgentCacheHandle`.
 */
export interface ServerAgentCacheHandle {
  /**
   * Finishes the session: returns the buffered cache entry (or `null` when
   * there is none) and restores the original agent cache.
   */
  complete(): AgentCacheTransferPayload | null;
  /** Restores the original agent cache without returning an entry. */
  discard(): void;
}

// TODO (refactor-caching): this reflective access is a known temporary escape hatch.
// Once the caching internals are reworked, replace it with proper V3 helpers so
// we stop poking private fields from the outside.
/**
 * Reads a field of a V3 instance by name, bypassing its declared visibility.
 * The value is cast to `T` without any runtime check.
 */
function getInternalField<T>(instance: V3, key: string): T {
  const fields = instance as unknown as Record<string, unknown>;
  return fields[key] as T;
}

/**
 * Assigns a field of a V3 instance by name, bypassing its declared
 * visibility.
 */
function setInternalField(instance: V3, key: string, value: unknown): void {
  const fields = instance as unknown as Record<string, unknown>;
  fields[key] = value;
}

/**
 * Builds an AgentCache backed by in-memory storage and wired to the given
 * V3 instance's internals, with `bufferLatestEntry` turned on.
 *
 * The act handler, context, model name and system prompt are looked up
 * lazily on each use; `domSettleTimeoutMs` is read once, here.
 */
function createMemoryAgentCache(stagehand: V3): AgentCache {
  const resolveLlmClient = getInternalField<
    (model?: ModelConfiguration) => LLMClient
  >(stagehand, "resolveLlmClient");

  const { logger } = stagehand;
  const storage = CacheStorage.createMemory(logger);
  const domSettleTimeoutMs = getInternalField<number | undefined>(
    stagehand,
    "domSettleTimeoutMs",
  );
  const act = stagehand.act.bind(stagehand);

  return new AgentCache({
    storage,
    logger,
    getActHandler: () =>
      getInternalField<ActHandler | null>(stagehand, "actHandler"),
    getContext: () => getInternalField<V3Context | null>(stagehand, "ctx"),
    getDefaultLlmClient: () => resolveLlmClient.call(stagehand),
    getBaseModelName: () =>
      getInternalField<AvailableModel>(stagehand, "modelName"),
    getSystemPrompt: () =>
      getInternalField<V3Options>(stagehand, "opts").systemPrompt,
    domSettleTimeoutMs,
    act,
    bufferLatestEntry: true,
  });
}

/**
 * Swaps the V3 instance's agent cache for an in-memory one and returns a
 * handle to end the swap.
 *
 * `complete()` returns the buffered entry (if any) and restores the original
 * cache; `discard()` only restores it. The original cache is restored at
 * most once, however many times the handle is used.
 */
export function __internalCreateInMemoryAgentCacheHandle(
  stagehand: V3,
): ServerAgentCacheHandle {
  const previousCache = getInternalField<AgentCache>(stagehand, "agentCache");
  const memoryCache = createMemoryAgentCache(stagehand);
  setInternalField(stagehand, "agentCache", memoryCache);

  let restored = false;
  function restoreOriginalCache(): void {
    if (restored) return;
    setInternalField(stagehand, "agentCache", previousCache);
    restored = true;
  }

  return {
    complete: () => {
      // Read the buffered entry before swapping the original cache back in.
      const bufferedEntry = memoryCache.consumeBufferedEntry();
      restoreOriginalCache();
      return bufferedEntry;
    },
    discard: () => {
      restoreOriginalCache();
    },
  };
}


================================================
FILE: packages/core/lib/v3/cache/utils.ts
================================================
import type { Logger } from "../types/public/index.js";
import { Page } from "../understudy/page.js";

const DEFAULT_WAIT_TIMEOUT_MS = 15000;

/**
 * Deep-copies a value via a JSON round trip so cached data does not share
 * references with the caller.
 *
 * JSON semantics apply: properties that JSON cannot represent are dropped or
 * converted as `JSON.stringify` dictates. Values that have no JSON
 * representation at the top level (`undefined`, functions, symbols) cannot be
 * round-tripped and are returned unchanged instead of throwing.
 *
 * @param value - The value to copy.
 * @returns A structurally equal copy, or `value` itself when it has no JSON form.
 */
export function cloneForCache<T>(value: T): T {
  // JSON.stringify yields undefined (not a string) for non-serializable roots.
  const serialized = JSON.stringify(value) as string | undefined;
  if (serialized === undefined) return value;
  return JSON.parse(serialized) as T;
}

/**
 * Returns the page's current URL, or an empty string when `page.url()` throws.
 */
export async function safeGetPageUrl(page: Page): Promise<string> {
  let currentUrl = "";
  try {
    currentUrl = page.url();
  } catch {
    // Keep the empty-string default.
  }
  return currentUrl;
}

/**
 * Best-effort wait for a cached action's selector to reach the "attached"
 * state before the action runs.
 *
 * Does nothing when no selector is given. A failed wait (including a timeout)
 * is reported through `logger` and otherwise ignored, so the caller proceeds
 * either way. When `timeout` is undefined, DEFAULT_WAIT_TIMEOUT_MS is used.
 */
export async function waitForCachedSelector(params: {
  page: Page;
  selector: string | undefined;
  timeout: number | undefined;
  logger: Logger;
  context?: string;
}): Promise<void> {
  const selector = params.selector;
  if (!selector) return;

  const waitOptions = {
    state: "attached" as const,
    timeout: params.timeout ?? DEFAULT_WAIT_TIMEOUT_MS,
  };

  try {
    await params.page.waitForSelector(selector, waitOptions);
  } catch (err) {
    const label = params.context ?? "cached";
    params.logger({
      category: "cache",
      message: `waitForSelector failed for ${label} action selector, proceeding anyway`,
      level: 2,
      auxiliary: {
        selector: { value: selector, type: "string" },
        error: { value: String(err), type: "string" },
      },
    });
  }
}


================================================
FILE: packages/core/lib/v3/cli.js
================================================
#!/usr/bin/env node

import process from "node:process";
import { maybeRunShutdownSupervisorFromArgv } from "./shutdown/supervisor.js";

// For now the CLI exists only to spawn the shutdown supervisor; further
// commands may be added here later. Any invocation the supervisor entry point
// does not handle is reported and exits with a failure status.
const handledBySupervisor = maybeRunShutdownSupervisorFromArgv(
  process.argv.slice(2),
);

if (!handledBySupervisor) {
  console.error(
    "Unsupported stagehand CLI invocation. Expected --supervisor with valid args.",
  );
  process.exit(1);
}


================================================
FILE: packages/core/lib/v3/dom/a11yScripts/index.ts
================================================
/**
 * Reads the page scroll offsets. Each axis takes the first non-nullish value
 * of `window.scrollX/Y`, `window.pageX/YOffset`, then the document element's
 * `scrollLeft/Top`. Values that do not coerce to a usable number become 0,
 * and any thrown error yields `{ sx: 0, sy: 0 }`.
 */
export function getScrollOffsets(): { sx: number; sy: number } {
  try {
    let rawX: unknown = window.scrollX;
    if (rawX === null || rawX === undefined) rawX = window.pageXOffset;
    if (rawX === null || rawX === undefined) {
      rawX = document.documentElement?.scrollLeft;
    }
    if (rawX === null || rawX === undefined) rawX = 0;

    let rawY: unknown = window.scrollY;
    if (rawY === null || rawY === undefined) rawY = window.pageYOffset;
    if (rawY === null || rawY === undefined) {
      rawY = document.documentElement?.scrollTop;
    }
    if (rawY === null || rawY === undefined) rawY = 0;

    return { sx: Number(rawX) || 0, sy: Number(rawY) || 0 };
  } catch {
    return { sx: 0, sy: 0 };
  }
}

/**
 * Returns only the `left` and `top` of the element's bounding client rect.
 * Missing or non-numeric values become 0, as does everything when
 * `getBoundingClientRect` throws.
 */
export function getBoundingRectLite(this: Element): {
  left: number;
  top: number;
} {
  const toNumberOrZero = (raw: unknown): number => Number(raw ?? 0) || 0;

  try {
    const box = this.getBoundingClientRect();
    const left = toNumberOrZero(box?.left);
    const top = toNumberOrZero(box?.top);
    return { left, top };
  } catch {
    return { left: 0, top: 0 };
  }
}

/**
 * Finds the focused element, descending through open shadow roots: starting at
 * `document.activeElement`, it keeps following `shadowRoot.activeElement`
 * while one exists. Returns null when nothing is focused or on any error.
 */
export function resolveDeepActiveElement(): Element | null {
  try {
    let current: Element | null = document.activeElement ?? null;
    for (;;) {
      const inner: Element | null | undefined =
        current?.shadowRoot?.activeElement;
      if (!inner) break;
      current = inner;
    }
    return current ?? null;
  } catch {
    return null;
  }
}

/**
 * Builds an absolute, index-qualified XPath for the node bound as `this`.
 *
 * Each step is `name[n]`, where `n` is the node's 1-based position among
 * preceding siblings of the same node type and name. Text and comment nodes
 * become `text()[n]` / `comment()[n]`; names containing ":" are emitted as
 * `*[name()='...']`. Crossing a document fragment (followed via its `host`)
 * contributes a `//` hop. Returns "/" for a missing node, for a bare document
 * node, or when anything throws.
 */
export function nodeToAbsoluteXPath(this: Node | null | undefined): string {
  try {
    const lowerName = (n: Node): string => (n.nodeName || "").toLowerCase();

    // 1-based position among preceding siblings sharing node type and name.
    const positionOf = (n: Node): number => {
      if (!n.parentNode) return 1;
      const wantedKey = `${n.nodeType}:${lowerName(n)}`;
      let position = 1;
      let sibling = n.previousSibling;
      while (sibling) {
        if (`${sibling.nodeType}:${lowerName(sibling)}` === wantedKey) {
          position += 1;
        }
        sibling = sibling.previousSibling;
      }
      return position;
    };

    // Path step for a non-fragment node; document nodes contribute nothing.
    const segmentFor = (n: Node): string => {
      switch (n.nodeType) {
        case Node.DOCUMENT_NODE:
          return "";
        case Node.TEXT_NODE:
          return `text()[${positionOf(n)}]`;
        case Node.COMMENT_NODE:
          return `comment()[${positionOf(n)}]`;
        default: {
          const tag = lowerName(n);
          const nameTest = tag.includes(":") ? `*[name()='${tag}']` : tag;
          return `${nameTest}[${positionOf(n)}]`;
        }
      }
    };

    // Walk up to the root, prepending so segments end up in root-first order.
    const segments: string[] = [];
    let cursor: Node | null | undefined = this;
    while (cursor) {
      if (cursor.nodeType === Node.DOCUMENT_FRAGMENT_NODE) {
        segments.unshift("//");
        cursor = (cursor as ShadowRoot).host ?? null;
      } else {
        const segment = segmentFor(cursor);
        if (segment) segments.unshift(segment);
        cursor = cursor.parentNode;
      }
    }

    // Join the segments, never doubling a slash beyond the "//" hop itself.
    let xpath = "";
    for (const segment of segments) {
      const needsSeparator = !xpath.endsWith("/");
      if (segment === "//") {
        xpath += needsSeparator ? "//" : "/";
      } else {
        xpath += needsSeparator ? `/${segment}` : segment;
      }
    }
    return xpath || "/";
  } catch {
    return "/";
  }
}

/**
 * Reports whether `document.hasFocus()` returns exactly `true`. Any other
 * return value, or a thrown error, counts as not focused.
 */
export function documentHasFocusStrict(): boolean {
  let focused = false;
  try {
    focused = document.hasFocus() === true;
  } catch {
    focused = false;
  }
  return focused;
}


================================================
FILE: packages/core/lib/v3/dom/genA11yScripts.ts
================================================
import fs from "node:fs";
import path from "node:path";
import { pathToFileURL } from "node:url";
import esbuild from "esbuild";
import { getCurrentDirPath } from "../runtimePaths.js";

const here = getCurrentDirPath();
const srcDir = path.join(here, "./a11yScripts");
const outDir = path.join(here, "./build");
const entry = path.join(srcDir, "index.ts");
// Intermediate esbuild outputs; both are removed once generation finishes.
const moduleOut = path.join(outDir, "a11yScripts.mjs");
const bundleOut = path.join(outDir, "a11yScripts.bundle.js");

/**
 * Generates `build/a11yScripts.generated.ts` from the a11y script sources.
 *
 * Steps:
 *  1. Bundle the entry twice with esbuild: as an ESM module (imported here to
 *     enumerate its exported functions) and as an IIFE exposing the global
 *     `__stagehandA11yScriptsFactory`.
 *  2. Wrap the IIFE in a bootstrap snippet that installs
 *     `globalThis.__stagehandA11yScripts` only if it is not already set.
 *  3. Emit the bootstrap, a name -> function-source map, and a name ->
 *     global-reference map, with names sorted for stable output.
 *
 * The intermediate bundle files are deleted in a `finally` block so a failure
 * in any later step does not leave stale artifacts in the build directory.
 */
async function main(): Promise<void> {
  fs.mkdirSync(outDir, { recursive: true });

  try {
    esbuild.buildSync({
      entryPoints: [entry],
      bundle: true,
      format: "esm",
      platform: "browser",
      target: "es2020",
      minify: true,
      outfile: moduleOut,
    });

    esbuild.buildSync({
      entryPoints: [entry],
      bundle: true,
      format: "iife",
      platform: "browser",
      target: "es2020",
      globalName: "__stagehandA11yScriptsFactory",
      minify: true,
      outfile: bundleOut,
    });

    const bundleRaw = fs.readFileSync(bundleOut, "utf8").trim();
    const bootstrap = `if (!globalThis.__stagehandA11yScripts) { ${bundleRaw}\n  globalThis.__stagehandA11yScripts = __stagehandA11yScriptsFactory;\n}`;

    const compiledModule = (await import(
      pathToFileURL(moduleOut).href
    )) as Record<string, unknown>;

    // Only exported functions become scripts; sort by name for stable output.
    const entries = Object.entries(compiledModule).filter(
      ([, value]) => typeof value === "function",
    );
    const sorted = entries.sort(([a], [b]) => a.localeCompare(b));

    const scriptMap: Record<string, string> = Object.fromEntries(
      sorted.map(([name, fn]) => {
        const callable = fn as (...args: unknown[]) => unknown;
        return [name, callable.toString()];
      }),
    );

    const banner = `/*\n * AUTO-GENERATED FILE. DO NOT EDIT.\n * Update sources in lib/v3/dom/a11yScripts and run genA11yScripts.ts.\n */`;

    const globalRefs: Record<string, string> = Object.fromEntries(
      sorted.map(([name]) => [
        name,
        `globalThis.__stagehandA11yScripts.${name}`,
      ]),
    );

    const content = `${banner}
export const a11yScriptBootstrap = ${JSON.stringify(bootstrap)};
export const a11yScriptSources = ${JSON.stringify(scriptMap, null, 2)} as const;
export const a11yScriptGlobalRefs = ${JSON.stringify(globalRefs, null, 2)} as const;
export type A11yScriptName = keyof typeof a11yScriptSources;
`;

    fs.writeFileSync(path.join(outDir, "a11yScripts.generated.ts"), content);
  } finally {
    // Best-effort cleanup; a missing file is not an error.
    await fs.promises.unlink(moduleOut).catch(() => {});
    await fs.promises.unlink(bundleOut).catch(() => {});
  }
}

void main();


================================================
FILE: packages/core/lib/v3/dom/genDomScripts.ts
================================================
/**
 * Build the v3 DOM script into a single JS file and then export its contents
 * as a string constant (`v3ScriptContent`) for CDP injection (document-start).
 */
import fs from "node:fs";
import path from "node:path";
import esbuild from "esbuild";
import { getCurrentDirPath } from "../runtimePaths.js";

const here = getCurrentDirPath();
const outDir = path.join(here, "./build");
fs.mkdirSync(outDir, { recursive: true });

/**
 * Bundles one browser entry point into a minified IIFE inside the build
 * directory, then writes a TypeScript module exporting that bundle's text as a
 * string constant.
 *
 * @param entryFile - Entry file name, relative to this directory.
 * @param bundleFile - Name of the bundled JS file written to the build directory.
 * @param exportName - Name of the exported string constant.
 * @param generatedFile - Name of the generated TypeScript module.
 */
function bundleAndEmbed(
  entryFile: string,
  bundleFile: string,
  exportName: string,
  generatedFile: string,
): void {
  const bundlePath = path.join(outDir, bundleFile);

  esbuild.buildSync({
    entryPoints: [path.join(here, entryFile)],
    bundle: true,
    format: "iife",
    platform: "browser",
    target: "es2020",
    minify: true,
    legalComments: "none",
    outfile: bundlePath,
  });

  const bundled = fs.readFileSync(bundlePath, "utf8");
  const moduleText = `export const ${exportName} = ${JSON.stringify(bundled)};`;
  fs.writeFileSync(path.join(outDir, generatedFile), moduleText);
}

bundleAndEmbed(
  "piercer.entry.ts",
  "v3-index.js",
  "v3ScriptContent",
  "scriptV3Content.ts",
);

bundleAndEmbed(
  "rerenderMissingShadows.entry.ts",
  "rerender-index.js",
  "reRenderScriptContent",
  "reRenderScriptContent.ts",
);


================================================
FILE: packages/core/lib/v3/dom/genLocatorScripts.ts
================================================
import fs from "node:fs";
import path from "node:path";
import { pathToFileURL } from "node:url";
import esbuild from "esbuild";
import { getCurrentDirPath } from "../runtimePaths.js";

const here = getCurrentDirPath();
const outDir = path.join(here, "./build");
const entry = path.join(here, "./locatorScripts/index.ts");
// Intermediate esbuild outputs; both are removed once generation finishes.
const moduleOutfile = path.join(outDir, "locatorScripts.mjs");
const bundleOutfile = path.join(outDir, "locatorScripts.bundle.js");

/**
 * Generates `build/locatorScripts.generated.ts` from the locator script sources.
 *
 * The entry is bundled twice with esbuild: as an ESM module (imported here to
 * enumerate its exported functions) and as an IIFE exposing the global
 * `__stagehandLocatorScriptsFactory`. The generated file contains a bootstrap
 * snippet that installs `globalThis.__stagehandLocatorScripts` only if it is
 * not already set, a name -> function-source map, and a name ->
 * global-reference map, with names sorted for stable output.
 *
 * The intermediate bundle files are deleted in a `finally` block so a failure
 * in any later step does not leave stale artifacts in the build directory.
 */
async function main(): Promise<void> {
  fs.mkdirSync(outDir, { recursive: true });

  try {
    esbuild.buildSync({
      entryPoints: [entry],
      bundle: true,
      format: "esm",
      platform: "browser",
      target: "es2020",
      minify: true,
      outfile: moduleOutfile,
    });

    esbuild.buildSync({
      entryPoints: [entry],
      bundle: true,
      format: "iife",
      platform: "browser",
      target: "es2020",
      globalName: "__stagehandLocatorScriptsFactory",
      minify: true,
      outfile: bundleOutfile,
    });

    const bundleRaw = fs.readFileSync(bundleOutfile, "utf8").trim();
    const bootstrap = `if (!globalThis.__stagehandLocatorScripts) { ${bundleRaw}\n  globalThis.__stagehandLocatorScripts = __stagehandLocatorScriptsFactory;\n}`;

    const compiledModule = (await import(
      pathToFileURL(moduleOutfile).href
    )) as Record<string, unknown>;

    // Only exported functions become scripts; sort by name for stable output.
    const entries = Object.entries(compiledModule).filter(
      ([, value]) => typeof value === "function",
    );
    const sorted = entries.sort(([a], [b]) => a.localeCompare(b));

    const scriptMap: Record<string, string> = Object.fromEntries(
      sorted.map(([name, fn]) => {
        const callable = fn as (...args: unknown[]) => unknown;
        return [name, callable.toString()];
      }),
    );

    const banner = `/*\n * AUTO-GENERATED FILE. DO NOT EDIT.\n * Update sources in lib/v3/dom/locatorScripts and run genLocatorScripts.ts.\n */`;

    const globalRefs: Record<string, string> = Object.fromEntries(
      sorted.map(([name]) => [
        name,
        `globalThis.__stagehandLocatorScripts.${name}`,
      ]),
    );

    const content = `${banner}\nexport const locatorScriptBootstrap = ${JSON.stringify(bootstrap)};\nexport const locatorScriptSources = ${JSON.stringify(scriptMap, null, 2)} as const;\nexport const locatorScriptGlobalRefs = ${JSON.stringify(globalRefs, null, 2)} as const;\nexport type LocatorScriptName = keyof typeof locatorScriptSources;\n`;

    fs.writeFileSync(path.join(outDir, "locatorScripts.generated.ts"), content);
  } finally {
    // Best-effort cleanup; a missing file is not an error.
    await fs.promises.unlink(moduleOutfile).catch(() => {});
    await fs.promises.unlink(bundleOutfile).catch(() => {});
  }
}

void main();


================================================
FILE: packages/core/lib/v3/dom/genScreenshotScripts.ts
================================================
import fs from "node:fs";
import path from "node:path";
import { pathToFileURL } from "node:url";
import esbuild from "esbuild";
import { getCurrentDirPath } from "../runtimePaths.js";

const here = getCurrentDirPath();
const srcDir = path.join(here, "./screenshotScripts");
const outDir = path.join(here, "./build");
const entry = path.join(srcDir, "index.ts");
// Intermediate esbuild output; removed once generation finishes.
const moduleOut = path.join(outDir, "screenshotScripts.mjs");

/**
 * Generates `build/screenshotScripts.generated.ts` from the screenshot script
 * sources.
 *
 * The entry is bundled as an ESM module with esbuild and imported here to
 * enumerate its exported functions; the generated file maps each function name
 * (sorted for stable output) to that function's source text.
 *
 * The intermediate module is deleted in a `finally` block so a failure in any
 * later step does not leave a stale artifact in the build directory.
 */
async function main(): Promise<void> {
  fs.mkdirSync(outDir, { recursive: true });

  try {
    esbuild.buildSync({
      entryPoints: [entry],
      bundle: true,
      format: "esm",
      platform: "browser",
      target: "es2020",
      minify: true,
      outfile: moduleOut,
    });

    const compiledModule = (await import(
      pathToFileURL(moduleOut).href
    )) as Record<string, unknown>;

    // Only exported functions become scripts; sort by name for stable output.
    const entries = Object.entries(compiledModule).filter(
      ([, value]) => typeof value === "function",
    );
    const sorted = entries.sort(([a], [b]) => a.localeCompare(b));

    const scriptMap: Record<string, string> = Object.fromEntries(
      sorted.map(([name, fn]) => {
        const callable = fn as (...args: unknown[]) => unknown;
        return [name, callable.toString()];
      }),
    );

    const banner = `/*\n * AUTO-GENERATED FILE. DO NOT EDIT.\n * Update sources in lib/v3/dom/screenshotScripts and run genScreenshotScripts.ts.\n */`;

    const content = `${banner}
export const screenshotScriptSources = ${JSON.stringify(scriptMap, null, 2)} as const;
export type ScreenshotScriptName = keyof typeof screenshotScriptSources;
`;

    fs.writeFileSync(
      path.join(outDir, "screenshotScripts.generated.ts"),
      content,
    );
  } finally {
    // Best-effort cleanup; a missing file is not an error.
    await fs.promises.unlink(moduleOut).catch(() => {});
  }
}

void main();


================================================
FILE: packages/core/lib/v3/dom/global.d.ts
================================================
/**
 * Shape of the helper object that page-side code reads from
 * `window.__stagehandV3__`.
 */
export interface StagehandV3Backdoor {
  /**
   * Closed shadow-root accessor: returns the closed shadow root attached to
   * `host`, or `undefined` when there is none available for it.
   */
  getClosedRoot(host: Element): ShadowRoot | undefined;
  /**
   * Stats + quick health check.
   * NOTE(review): `open` / `closed` look like counts of tracked open and
   * closed shadow roots, and `isTop` like a top-frame flag — confirm against
   * the implementation.
   */
  stats(): {
    installed: true;
    url: string;
    isTop: boolean;
    open: number;
    closed: number;
  };
}

// Augments the global `Window` type with the properties Stagehand's injected
// page script uses, so page-side helpers can read them without casts.
declare global {
  interface Window {
    // NOTE(review): presumably set once the v3 script has been injected, to
    // guard against double injection — confirm against the piercer runtime.
    __stagehandV3Injected?: boolean;
    // Backdoor object (see StagehandV3Backdoor); absent when not installed.
    __stagehandV3__?: StagehandV3Backdoor;
  }
}


================================================
FILE: packages/core/lib/v3/dom/index.ts
================================================
export * from "./piercer.runtime.js";


================================================
FILE: packages/core/lib/v3/dom/locatorScripts/counts.ts
================================================
import { countXPathMatches } from "./xpathResolver.js";

/**
 * Summary of one element returned in the `sample` list of `countTextMatches`.
 */
export interface TextMatchSample {
  // The element's `tagName`.
  tag: string;
  // The element's `id` (empty string when unset).
  id: string;
  // The element's `className`.
  class: string;
  // The element's extracted, trimmed text.
  text: string;
}

/**
 * Result of `countTextMatches`.
 */
export interface TextMatchResult {
  // Number of innermost matching elements.
  count: number;
  // Up to five of those elements, summarized.
  sample: TextMatchSample[];
  // Always null in results produced by `countTextMatches`.
  error: null;
}

/**
 * Counts elements matching a CSS selector in the document and in every open
 * shadow root reachable from it.
 *
 * Each root is queried once. Query and traversal errors for a root are
 * swallowed so the remaining roots still contribute. If the traversal itself
 * cannot start, it falls back to a plain `document.querySelectorAll` count,
 * and to 0 if that fails too. A blank selector yields 0.
 */
export function countCssMatchesPrimary(selectorRaw: string): number {
  const selector = String(selectorRaw ?? "").trim();
  if (!selector) return 0;

  const visited = new WeakSet<Node>();

  try {
    // Explicit work list of roots still to be queried.
    const pending: Array<Node | null | undefined> = [document];
    let matches = 0;

    while (pending.length > 0) {
      const root = pending.pop();
      if (!root || visited.has(root)) continue;
      visited.add(root);

      try {
        const queryable = root as unknown as ParentNode & {
          querySelectorAll?: Document["querySelectorAll"];
        };
        if (typeof queryable.querySelectorAll === "function") {
          matches += queryable.querySelectorAll(selector).length;
        }
      } catch {
        // ignore query errors
      }

      try {
        let ownerDoc: Document;
        if (root instanceof Document) {
          ownerDoc = root;
        } else {
          ownerDoc = (root as Element)?.ownerDocument ?? document;
        }
        const walker = ownerDoc.createTreeWalker(
          root,
          NodeFilter.SHOW_ELEMENT,
        );
        for (
          let node: Node | null = walker.nextNode();
          node;
          node = walker.nextNode()
        ) {
          if (node instanceof Element && node.shadowRoot) {
            pending.push(node.shadowRoot);
          }
        }
      } catch {
        // ignore traversal errors
      }
    }

    return matches;
  } catch {
    try {
      return document.querySelectorAll(selector).length;
    } catch {
      return 0;
    }
  }
}

/**
 * Counts elements matching a CSS selector in the document and in every shadow
 * root reachable from it, open or closed. Closed roots are obtained through
 * `window.__stagehandV3__.getClosedRoot`.
 *
 * Without that backdoor the count is just `document.querySelectorAll` (0 on
 * error). Roots are processed breadth-first, each at most once; query and
 * traversal errors for a root are swallowed. A blank selector yields 0.
 */
export function countCssMatchesPierce(selectorRaw: string): number {
  const selector = String(selectorRaw ?? "").trim();
  if (!selector) return 0;

  const backdoor = window.__stagehandV3__;
  if (!backdoor || typeof backdoor.getClosedRoot !== "function") {
    try {
      return document.querySelectorAll(selector).length;
    } catch {
      return 0;
    }
  }

  const visited = new WeakSet<Node>();
  const pending: Node[] = [];

  // Adds a root to the work list unless it is missing or already scheduled.
  const schedule = (candidate: Node | null | undefined): void => {
    if (!candidate || visited.has(candidate)) return;
    visited.add(candidate);
    pending.push(candidate);
  };

  schedule(document);
  let matches = 0;

  // `pending` grows while we iterate; the cursor keeps FIFO order.
  for (let cursor = 0; cursor < pending.length; cursor += 1) {
    const root = pending[cursor];
    if (!root) continue;

    try {
      const queryable = root as unknown as ParentNode & {
        querySelectorAll?: Document["querySelectorAll"];
      };
      if (typeof queryable.querySelectorAll === "function") {
        matches += queryable.querySelectorAll(selector).length;
      }
    } catch {
      // ignore query errors
    }

    try {
      let ownerDoc: Document;
      if (root instanceof Document) {
        ownerDoc = root;
      } else if (root instanceof ShadowRoot) {
        ownerDoc = root.host?.ownerDocument ?? document;
      } else {
        ownerDoc = (root as Element).ownerDocument ?? document;
      }

      const walker = ownerDoc.createTreeWalker(root, NodeFilter.SHOW_ELEMENT);
      for (
        let node: Node | null = walker.nextNode();
        node;
        node = walker.nextNode()
      ) {
        if (!(node instanceof Element)) continue;

        const openRoot = node.shadowRoot;
        if (openRoot) schedule(openRoot);

        try {
          const closedRoot = backdoor.getClosedRoot(node);
          if (closedRoot) schedule(closedRoot);
        } catch {
          // ignore
        }
      }
    } catch {
      // ignore traversal errors
    }
  }

  return matches;
}

/**
 * Counts elements whose text contains `rawNeedle` (case-insensitive),
 * searching the document and every shadow root reachable from it (open roots
 * directly, closed roots via `window.__stagehandV3__.getClosedRoot` when
 * available).
 *
 * Only "innermost" matches are reported: a matching element is dropped when it
 * contains another matching element. Structural/metadata tags listed in
 * `skipTags` never match.
 *
 * @param rawNeedle - Text to look for; an empty needle yields a zero result.
 * @returns The innermost match count plus up to five sample elements.
 */
export function countTextMatches(rawNeedle: string): TextMatchResult {
  const needle = String(rawNeedle ?? "");
  if (!needle) {
    return { count: 0, sample: [], error: null };
  }

  const needleLc = needle.toLowerCase();
  // Tags whose text is never considered a match.
  const skipTags = new Set([
    "SCRIPT",
    "STYLE",
    "TEMPLATE",
    "NOSCRIPT",
    "HEAD",
    "TITLE",
    "LINK",
    "META",
    "HTML",
    "BODY",
  ]);

  const shouldSkip = (node: Element | null | undefined): boolean => {
    if (!node) return false;
    const tag = node.tagName?.toUpperCase() ?? "";
    return skipTags.has(tag);
  };

  // Prefers non-blank `innerText`; otherwise falls back to trimmed
  // `textContent`. Skipped tags always yield "".
  const extractText = (element: Element): string => {
    try {
      if (shouldSkip(element)) return "";
      const inner = (element as HTMLElement).innerText;
      if (typeof inner === "string" && inner.trim()) return inner.trim();
    } catch {
      // ignore
    }
    try {
      const text = element.textContent;
      if (typeof text === "string") return text.trim();
    } catch {
      // ignore
    }
    return "";
  };

  const matches = (element: Element): boolean => {
    const text = extractText(element);
    return !!text && text.toLowerCase().includes(needleLc);
  };

  // Closed-root lookup that never throws; a no-op when the backdoor is absent.
  const backdoor = window.__stagehandV3__;
  const getClosedRoot: (host: Element) => ShadowRoot | null =
    backdoor && typeof backdoor.getClosedRoot === "function"
      ? (host: Element): ShadowRoot | null => {
          try {
            return backdoor.getClosedRoot(host) ?? null;
          } catch {
            return null;
          }
        }
      : (host: Element): ShadowRoot | null => {
          void host;
          return null;
        };

  // Breadth-first work list of roots (document + shadow roots), each once.
  const seen = new WeakSet<Node>();
  const queue: Node[] = [];

  const enqueue = (node: Node | null | undefined) => {
    if (!node || seen.has(node)) return;
    seen.add(node);
    queue.push(node);
  };

  // Element-only TreeWalker for a root, or null if one cannot be created.
  const walkerFor = (root: Node): TreeWalker | null => {
    try {
      const doc =
        root instanceof Document
          ? root
          : ((root as Element)?.ownerDocument ?? document);
      return doc.createTreeWalker(root, NodeFilter.SHOW_ELEMENT);
    } catch {
      return null;
    }
  };

  const matchesList: Array<{
    element: Element;
    tag: string;
    id: string;
    className: string;
    text: string;
  }> = [];

  enqueue(document);

  while (queue.length) {
    const root = queue.shift();
    if (!root) continue;

    // The walker does not yield its root, so test the root itself first.
    if (root instanceof Element && matches(root)) {
      matchesList.push({
        element: root,
        tag: root.tagName ?? "",
        id: root.id ?? "",
        className: (root as HTMLElement).className ?? "",
        text: extractText(root),
      });
    }

    const walker = walkerFor(root);
    if (!walker) continue;

    let node: Node | null;
    while ((node = walker.nextNode())) {
      if (!(node instanceof Element)) continue;

      if (matches(node)) {
        matchesList.push({
          element: node,
          tag: node.tagName ?? "",
          id: node.id ?? "",
          className: (node as HTMLElement).className ?? "",
          text: extractText(node),
        });
      }

      // Schedule any shadow roots hanging off this element.
      const open = node.shadowRoot;
      if (open) enqueue(open);

      const closed = getClosedRoot(node);
      if (closed) enqueue(closed);
    }
  }

  // Keep only matches that do not contain another match (pairwise check).
  const innermost: typeof matchesList = [];
  for (const item of matchesList) {
    const el = item.element;
    let skip = false;
    for (const other of matchesList) {
      if (item === other) continue;
      try {
        if (el.contains(other.element)) {
          skip = true;
          break;
        }
      } catch {
        // ignore containment errors
      }
    }
    if (!skip) innermost.push(item);
  }

  const count = innermost.length;
  // Report at most five samples.
  const sample = innermost.slice(0, 5).map((item) => ({
    tag: item.tag,
    id: item.id,
    class: item.className,
    text: item.text,
  }));

  return { count, sample, error: null };
}

/**
 * Counts XPath matches by delegating to `countXPathMatches` with shadow
 * piercing enabled.
 */
export function countXPathMatchesMainWorld(rawXp: string): number {
  const pierceShadow = true;
  const matchCount = countXPathMatches(rawXp, { pierceShadow });
  return matchCount;
}


================================================
FILE: packages/core/lib/v3/dom/locatorScripts/index.ts
================================================
export * from "./scripts.js";
export * from "./selectors.js";
export * from "./counts.js";
export * from "./waitForSelector.js";


================================================
FILE: packages/core/lib/v3/dom/locatorScripts/scripts.ts
================================================
/*
 * DOM-side helpers used by Locator Runtime.callFunctionOn invocations.
 *
 * NOTE: These functions run inside the page context. Keep them dependency-free
 * and resilient to exceptions (match the best-effort semantics of the old
 * inline string snippets).
 */

/**
 * Options accepted by `dispatchDomClick` for the synthetic click event.
 * Omitted boolean flags are treated as false; an omitted or non-numeric
 * `detail` is treated as 1.
 */
export interface ClickEventOptions {
  bubbles?: boolean;
  cancelable?: boolean;
  composed?: boolean;
  detail?: number;
}

/**
 * Reports whether the bound element is an `<input type="file">`. Tag and type
 * are compared case-insensitively; any error yields false.
 */
export function ensureFileInputElement(this: Element): boolean {
  try {
    const candidate = this as HTMLInputElement;
    const tagName = candidate.tagName?.toLowerCase() ?? "";
    if (tagName === "input") {
      const inputType = String(candidate.type ?? "").toLowerCase();
      return inputType === "file";
    }
    return false;
  } catch {
    return false;
  }
}

/**
 * A file serialized for transfer into the page, consumed by
 * `assignFilePayloadsToInputElement`.
 */
export interface SerializedFilePayload {
  // File name; an empty name is replaced with "upload.bin" by the consumer.
  name: string;
  // MIME type; an empty value is replaced with "application/octet-stream".
  mimeType: string;
  // File contents, base64-encoded.
  base64: string;
  // Last-modified timestamp; the consumer uses the current time when omitted.
  lastModified?: number;
}

/**
 * Rebuilds `File` objects from serialized payloads and assigns them to the
 * bound `<input type="file">`, then fires bubbling `input` and `change` events.
 *
 * Returns false when the element is not a file input, when `DataTransfer`
 * cannot be constructed, or when anything else throws. Falsy payload entries
 * are skipped, and a non-array `payloads` is treated as empty.
 */
export function assignFilePayloadsToInputElement(
  this: Element,
  payloads: SerializedFilePayload[],
): boolean {
  try {
    const target = this as HTMLInputElement;
    const isFileInput =
      !!target &&
      target.tagName?.toLowerCase() === "input" &&
      (target.type ?? "").toLowerCase() === "file";
    if (!isFileInput) return false;

    let transfer: DataTransfer;
    try {
      transfer = new DataTransfer();
    } catch {
      return false;
    }

    // Decodes base64 text into raw bytes, one byte per decoded character.
    const decode = (encoded: string): Uint8Array => {
      const raw = window.atob(encoded);
      const bytes = new Uint8Array(raw.length);
      let index = 0;
      while (index < raw.length) {
        bytes[index] = raw.charCodeAt(index);
        index += 1;
      }
      return bytes;
    };

    const list = Array.isArray(payloads) ? payloads : [];
    list.forEach((payload) => {
      if (!payload) return;

      const fileName = payload.name || "upload.bin";
      const type = payload.mimeType || "application/octet-stream";
      const lastModified =
        typeof payload.lastModified === "number"
          ? payload.lastModified
          : Date.now();

      const blob = new Blob([decode(payload.base64 ?? "")], { type });
      transfer.items.add(new File([blob], fileName, { type, lastModified }));
    });

    target.files = transfer.files;
    for (const eventName of ["input", "change"]) {
      target.dispatchEvent(new Event(eventName, { bubbles: true }));
    }
    return true;
  } catch {
    return false;
  }
}

/**
 * Dispatches a synthetic `click` MouseEvent on the bound element.
 *
 * Boolean flags default to false and `detail` to 1. The event's `view` is the
 * element's owning window, or the global `window` when that is unavailable.
 * If building or dispatching the event throws, the element's native `click()`
 * is tried instead; errors from that fallback are swallowed.
 */
export function dispatchDomClick(
  this: Element,
  options?: ClickEventOptions,
): void {
  const requested = options ?? {};
  try {
    const init: MouseEventInit = {
      bubbles: Boolean(requested.bubbles),
      cancelable: Boolean(requested.cancelable),
      composed: Boolean(requested.composed),
      detail: typeof requested.detail === "number" ? requested.detail : 1,
      view: this?.ownerDocument?.defaultView ?? window,
    };
    this.dispatchEvent(new MouseEvent("click", init));
    return;
  } catch {
    // Fall through to the native click below.
  }

  try {
    // Fallback to native click if MouseEvent construction fails.
    (this as HTMLElement).click();
  } catch {
    /* ignore */
  }
}

/**
 * Smooth-scrolls the bound element vertically to a percentage of its
 * scrollable range.
 *
 * For `<html>` and `<body>` the owning window is scrolled instead of the
 * element, using the document's scrolling element to measure the range. The
 * window used is the element's `ownerDocument.defaultView`, falling back to the
 * global `window`; the same window supplies the viewport height, the current
 * horizontal offset, and the `scrollTo` call, so a missing `defaultView` no
 * longer results in a silent no-op that still reports success.
 *
 * @param percent - Target position as a number or a string such as "50" or
 *   "50%". Unparseable values count as 0; the result is clamped to [0, 100].
 * @returns true once the scroll has been requested, false if anything throws.
 */
export function scrollElementToPercent(
  this: Element,
  percent: number | string,
): boolean {
  // Coerces the input to a finite number, treating anything unusable as 0.
  const normalize = (value: unknown): number => {
    if (typeof value === "number" && Number.isFinite(value)) return value;
    const str = String(value ?? "").trim();
    if (!str) return 0;
    const numeric = parseFloat(str.replace("%", ""));
    if (Number.isNaN(numeric) || !Number.isFinite(numeric)) return 0;
    return numeric;
  };

  try {
    const pct = Math.max(0, Math.min(normalize(percent), 100));
    const element = this as HTMLElement;
    const tag = element.tagName?.toLowerCase() ?? "";

    const scrollWindow = tag === "html" || tag === "body";
    if (scrollWindow) {
      const ownerDoc = element.ownerDocument;
      // One window for measuring and scrolling, so they can never disagree.
      const view = ownerDoc?.defaultView ?? window;
      const root =
        ownerDoc?.scrollingElement ||
        ownerDoc?.documentElement ||
        ownerDoc?.body ||
        document.scrollingElement ||
        document.documentElement ||
        document.body;
      const scrollHeight =
        root?.scrollHeight ?? document.body.scrollHeight ?? 0;
      const viewportHeight = view.innerHeight;
      const maxTop = Math.max(0, scrollHeight - viewportHeight);
      const top = maxTop * (pct / 100);
      view.scrollTo({
        top,
        left: view.scrollX ?? 0,
        behavior: "smooth",
      });
      return true;
    }

    const scrollHeight = element.scrollHeight ?? 0;
    const clientHeight = element.clientHeight ?? 0;
    const maxTop = Math.max(0, scrollHeight - clientHeight);
    const top = maxTop * (pct / 100);
    element.scrollTo({
      top,
      left: element.scrollLeft ?? 0,
      behavior: "smooth",
    });
    return true;
  } catch {
    return false;
  }
}

// <input> types that fillElementValue fills by assigning `value` directly
// (followed by synthetic input/change events) rather than by typing.
const inputTypesToSetValue = new Set([
  "color",
  "date",
  "datetime-local",
  "month",
  "range",
  "time",
  "week",
]);

// <input> types for which fillElementValue returns "needsinput" instead of
// assigning the value itself. The empty string covers an input whose `type`
// reads as empty.
const inputTypesToTypeInto = new Set([
  "",
  "email",
  "number",
  "password",
  "search",
  "tel",
  "text",
  "url",
]);

/**
 * Outcome of `fillElementValue`:
 * - "done": the value was assigned in the page and events were dispatched.
 * - "needsinput": the element was prepared, but `value` still has to be
 *   entered by the caller; `reason` is set when this is the result of an
 *   exception inside the page.
 * - "error": the element or value cannot be filled; `reason` says why.
 */
export type FillElementResult =
  | { status: "done" }
  | { status: "needsinput"; value: string; reason?: string }
  | { status: "error"; reason: string };

/**
 * Focuses the bound element and selects its current content.
 *
 * - Inputs and textareas: tries `select()`, and if that is unavailable or
 *   throws, `setSelectionRange(0, value.length)`. Returns true either way.
 * - Content-editable elements: selects the element's contents through the
 *   document selection when possible. Returns true.
 * - Anything else, a disconnected element, or an unexpected error: false.
 */
export function prepareElementForTyping(this: Element): boolean {
  try {
    const target = this as HTMLElement;
    if (!target.isConnected) return false;

    const ownerDoc = target.ownerDocument || document;
    const view = ownerDoc.defaultView || window;

    try {
      if (typeof target.focus === "function") target.focus();
    } catch {
      /* ignore */
    }

    const isTextControl =
      target instanceof view.HTMLInputElement ||
      target instanceof view.HTMLTextAreaElement;

    if (isTextControl) {
      const control = target as HTMLInputElement | HTMLTextAreaElement;

      let selected = false;
      try {
        if (typeof control.select === "function") {
          control.select();
          selected = true;
        }
      } catch {
        /* ignore */
      }

      // Only reached when select() was unavailable or threw.
      if (!selected) {
        try {
          const end = (control.value ?? "").length;
          if (typeof control.setSelectionRange === "function") {
            control.setSelectionRange(0, end);
          }
        } catch {
          /* ignore */
        }
      }

      return true;
    }

    if (!target.isContentEditable) return false;

    const selection = ownerDoc.getSelection?.();
    const range = ownerDoc.createRange?.();
    if (selection && range) {
      try {
        range.selectNodeContents(target);
        selection.removeAllRanges();
        selection.addRange(range);
      } catch {
        /* ignore */
      }
    }
    return true;
  } catch {
    return false;
  }
}

/**
 * Attempts to fill the bound element with `rawValue`, or prepares it so the
 * caller can enter the value itself.
 *
 * Behavior by element kind:
 * - `<input>` with a type in `inputTypesToSetValue`: the trimmed value is
 *   assigned through the native `value` setter, input/change events are
 *   dispatched, and the result is "done" (or an error if the element did not
 *   accept the value).
 * - `<input>` with a type in `inputTypesToTypeInto`, `<textarea>`, and
 *   content-editable elements: the element is focused/selected and the result
 *   is "needsinput" carrying the value to enter.
 * - Other input types, `<select>`, and everything else: "error".
 *
 * A disconnected element yields an error. An unexpected exception yields
 * "needsinput" with the best value known so far and an `exception[:message]`
 * reason, rather than an error.
 */
export function fillElementValue(
  this: Element,
  rawValue: string,
): FillElementResult {
  const element = this as HTMLElement;
  if (!element.isConnected) {
    return { status: "error", reason: "notconnected" };
  }

  // Use the element's own realm for constructors and instanceof checks.
  const doc = element.ownerDocument || document;
  const win = doc.defaultView || window;
  // Value reported back if an exception interrupts the flow below.
  let fallbackValue = rawValue ?? "";

  try {
    // Fires a bubbling, composed `input` event followed by a bubbling
    // `change` event; falls back to a plain Event when InputEvent is missing
    // or cannot be constructed.
    const dispatchInputAndChange = (eventValue: string): void => {
      let inputEvent: Event;
      if (typeof win.InputEvent === "function") {
        try {
          inputEvent = new win.InputEvent("input", {
            bubbles: true,
            composed: true,
            data: eventValue,
            inputType: "insertText",
          });
        } catch {
          inputEvent = new win.Event("input", {
            bubbles: true,
            composed: true,
          });
        }
      } else {
        inputEvent = new win.Event("input", { bubbles: true, composed: true });
      }

      element.dispatchEvent(inputEvent);

      const changeEvent = new win.Event("change", { bubbles: true });
      element.dispatchEvent(changeEvent);
    };

    if (element instanceof win.HTMLInputElement) {
      const type = (element.type || "").toLowerCase();

      if (!inputTypesToTypeInto.has(type) && !inputTypesToSetValue.has(type)) {
        return { status: "error", reason: `unsupported-input-type:${type}` };
      }

      let valueForTyping = rawValue;

      // Number inputs: reject values that do not parse as a number, and
      // enter the trimmed text.
      if (type === "number") {
        const trimmed = rawValue.trim();
        if (trimmed !== "" && Number.isNaN(Number(trimmed))) {
          return { status: "error", reason: "invalid-number-value" };
        }
        valueForTyping = trimmed;
      }

      fallbackValue = valueForTyping;

      if (inputTypesToSetValue.has(type)) {
        const trimmed = rawValue.trim();
        fallbackValue = trimmed;
        prepareElementForTyping.call(element);

        // Prefer the prototype's native setter over plain assignment.
        const prototype = win.HTMLInputElement.prototype;
        const descriptor = Object.getOwnPropertyDescriptor(prototype, "value");
        const nativeSetter = descriptor?.set;

        if (typeof nativeSetter === "function") {
          nativeSetter.call(element, trimmed);
        } else {
          element.value = trimmed;
        }

        // If the element carries a `_valueTracker`, keep it in sync.
        // NOTE(review): presumably React's value tracker — confirm.
        const tracker = (
          element as unknown as {
            _valueTracker?: { setValue?: (next: string) => void };
          }
        )._valueTracker;
        tracker?.setValue?.(trimmed);

        // The element did not accept the value as given.
        if (element.value !== trimmed) {
          return { status: "error", reason: "malformed-value" };
        }

        dispatchInputAndChange(trimmed);
        return { status: "done" };
      }

      prepareElementForTyping.call(element);
      return { status: "needsinput", value: valueForTyping };
    }

    if (element instanceof win.HTMLTextAreaElement) {
      prepareElementForTyping.call(element);
      fallbackValue = rawValue;
      return { status: "needsinput", value: rawValue };
    }

    if (element instanceof win.HTMLSelectElement) {
      // Select elements are not filled here; option selection is handled
      // separately (see selectElementOptions).
      return { status: "error", reason: "unsupported-element" };
    }

    if (element.isContentEditable) {
      prepareElementForTyping.call(element);
      fallbackValue = rawValue;
      return { status: "needsinput", value: rawValue };
    }

    return { status: "error", reason: "unsupported-element" };
  } catch (error) {
    // Best effort: report the failure but still hand the value back.
    let reason = "exception";
    if (error && typeof error === "object") {
      const message = (error as { message?: unknown }).message;
      if (typeof message === "string" && message.trim().length > 0) {
        reason = `exception:${message}`;
      }
    }
    return { status: "needsinput", value: fallbackValue, reason };
  }
}

/**
 * Give focus to the receiver when it exposes a callable `focus` method.
 * Best-effort: any error raised while focusing is swallowed.
 */
export function focusElement(this: Element): void {
  const target = this as HTMLElement;
  try {
    if (typeof target.focus !== "function") return;
    target.focus();
  } catch {
    /* best-effort: focusing must never throw into the caller */
  }
}

/**
 * Select the option(s) of a `<select>` whose trimmed label or value equals one
 * of the requested strings, then dispatch bubbling `input` and `change` events.
 *
 * - Multi-select: every option's `selected` flag is set to whether it matches.
 * - Single-select: the first matching option is selected and all others are
 *   cleared (if nothing matches, every option ends up deselected).
 *
 * @param rawValues - One label/value or a list of them.
 * @returns The `value` of every option selected afterwards, or `[]` when the
 *   receiver is not an `HTMLSelectElement` or anything throws.
 */
export function selectElementOptions(
  this: Element,
  rawValues: string | string[],
): string[] {
  try {
    if (!(this instanceof HTMLSelectElement)) return [];

    const desired = Array.isArray(rawValues) ? rawValues : [rawValues];
    const wanted = new Set(desired.map((v) => String(v ?? "").trim()));

    const matches = (option: HTMLOptionElement): boolean => {
      const label = (option.label || option.textContent || "").trim();
      const value = String(option.value ?? "").trim();
      return wanted.has(label) || wanted.has(value);
    };

    if (this.multiple) {
      for (const option of Array.from(this.options)) {
        option.selected = matches(option);
      }
    } else {
      let chosen = false;
      for (const option of Array.from(this.options)) {
        if (!chosen && matches(option)) {
          // Assigning `select.value` selects the FIRST option carrying that
          // value, which is the wrong one when several options share a value
          // and the match was made by label. Set the value first, then pin
          // selectedness on the option that actually matched.
          this.value = option.value;
          option.selected = true;
          chosen = true;
        } else {
          option.selected = false;
        }
      }
    }

    const inputEvent = new Event("input", { bubbles: true });
    const changeEvent = new Event("change", { bubbles: true });
    this.dispatchEvent(inputEvent);
    this.dispatchEvent(changeEvent);

    return Array.from(this.selectedOptions).map((opt) => opt.value);
  } catch {
    return [];
  }
}

/**
 * Report whether the receiver is currently rendered.
 *
 * An element counts as visible when it is connected, its computed style is
 * not `display: none` / `visibility: hidden`, its opacity parses to a finite
 * non-zero number, its bounding box has a non-zero side, and it produces at
 * least one client rect. Any exception yields `false`.
 */
export function isElementVisible(this: Element): boolean {
  try {
    const node = this as HTMLElement;
    if (!node.isConnected) return false;

    // Prefer the element's own window (it may live in another frame).
    const view = node.ownerDocument?.defaultView;
    const computed =
      view?.getComputedStyle(node) ?? window.getComputedStyle(node);
    if (!computed) return false;

    const hiddenByCss =
      computed.display === "none" || computed.visibility === "hidden";
    if (hiddenByCss) return false;

    const alpha = parseFloat(computed.opacity ?? "1");
    if (alpha === 0 || !Number.isFinite(alpha)) return false;

    const box = node.getBoundingClientRect();
    if (!box) return false;
    const largestSide = Math.max(box.width, box.height);
    if (largestSide === 0) return false;

    return node.getClientRects().length !== 0;
  } catch {
    return false;
  }
}

/**
 * Report the checked state of the receiver.
 *
 * Native checkboxes and radios answer with their `checked` property; every
 * other element falls back to `aria-checked === "true"`. Any exception yields
 * `false`.
 */
export function isElementChecked(this: Element): boolean {
  try {
    const node = this as HTMLInputElement;
    const isInput = (node.tagName || "").toLowerCase() === "input";
    if (isInput) {
      const kind = node.type?.toLowerCase() ?? "";
      if (kind === "checkbox" || kind === "radio") {
        return Boolean(node.checked);
      }
    }
    const ariaChecked = node.getAttribute?.("aria-checked");
    return ariaChecked != null ? ariaChecked === "true" : false;
  } catch {
    return false;
  }
}

/**
 * Read the current user-facing value of the receiver as a string.
 *
 * `<input>`, `<textarea>` and `<select>` return their `value`; content-editable
 * elements return their `textContent`; anything else (or any exception)
 * returns the empty string.
 */
export function readElementInputValue(this: Element): string {
  try {
    const node = this as HTMLElement;
    switch ((node.tagName || "").toLowerCase()) {
      case "input":
      case "textarea":
      case "select":
        return String(
          (node as HTMLInputElement | HTMLTextAreaElement | HTMLSelectElement)
            .value ?? "",
        );
      default:
        return node.isContentEditable ? String(node.textContent ?? "") : "";
    }
  } catch {
    return "";
  }
}

/**
 * Return the receiver's `textContent` as a string; a missing value or any
 * exception yields the empty string.
 */
export function readElementTextContent(this: Element): string {
  try {
    const text = this.textContent;
    return text == null ? "" : String(text);
  } catch {
    return "";
  }
}

/**
 * Return the receiver's `innerHTML` as a string; a missing value or any
 * exception yields the empty string.
 */
export function readElementInnerHTML(this: Element): string {
  try {
    const markup = (this as HTMLElement).innerHTML;
    return markup == null ? "" : String(markup);
  } catch {
    return "";
  }
}

/**
 * Return the receiver's `innerText` when it is a non-empty string, otherwise
 * its `textContent` (or `""` when that is not a string). Any exception yields
 * the empty string.
 */
export function readElementInnerText(this: Element): string {
  try {
    const node = this as HTMLElement & { innerText?: unknown };
    const rendered = node.innerText;
    if (typeof rendered === "string" && rendered !== "") return rendered;

    const raw = node.textContent;
    if (typeof raw !== "string") return "";
    return raw;
  } catch {
    return "";
  }
}


================================================
FILE: packages/core/lib/v3/dom/locatorScripts/selectors.ts
================================================
import { resolveXPathAtIndex } from "./xpathResolver.js";

/**
 * Coerce an arbitrary value into a zero-based match index: nullish,
 * non-numeric, non-finite and negative inputs become 0; fractions are floored.
 */
const parseTargetIndex = (value: unknown): number => {
  const parsed = Number(value ?? 0);
  const usable = Number.isFinite(parsed) && parsed >= 0;
  return usable ? Math.floor(parsed) : 0;
};

/**
 * Collect up to `limit` distinct elements matching `selector`, searching the
 * document first and then every open shadow root breadth-first.
 *
 * Query and traversal errors are swallowed so one bad root does not abort the
 * whole search.
 */
const collectCssMatches = (selector: string, limit: number): Element[] => {
  if (!selector) return [];

  const found: Element[] = [];
  const foundSet = new Set<Element>();
  const visitedRoots = new WeakSet<Node>();
  const pending: Array<Document | ShadowRoot> = [document];

  while (pending.length > 0 && found.length < limit) {
    const root = pending.shift();
    if (!root || visitedRoots.has(root)) continue;
    visitedRoots.add(root);

    try {
      for (const candidate of root.querySelectorAll(selector)) {
        if (foundSet.has(candidate)) continue;
        foundSet.add(candidate);
        found.push(candidate);
        if (found.length >= limit) break;
      }
    } catch {
      // ignore querySelectorAll issues
    }
    // Enough matches: no need to discover further shadow roots.
    if (found.length >= limit) break;

    try {
      const ownerDocument =
        root instanceof Document
          ? root
          : (root.host?.ownerDocument ?? document);
      const walker = ownerDocument.createTreeWalker(
        root,
        NodeFilter.SHOW_ELEMENT,
      );
      for (let node = walker.nextNode(); node; node = walker.nextNode()) {
        if (!(node instanceof Element)) continue;
        const openRoot = node.shadowRoot;
        if (openRoot) pending.push(openRoot);
      }
    } catch {
      // ignore traversal issues
    }
  }

  return found;
};

/**
 * Resolve a CSS selector to the match at `targetIndexRaw` (zero-based,
 * default 0), searching the document and open shadow roots.
 *
 * @returns The matched element, or `null` when the selector is blank or there
 *   are not enough matches.
 */
export function resolveCssSelector(
  selectorRaw: string,
  targetIndexRaw?: number,
): Element | null {
  const selector = String(selectorRaw ?? "").trim();
  if (selector === "") return null;

  const wantedIndex = parseTargetIndex(targetIndexRaw);
  // Only the first `wantedIndex + 1` matches are ever needed.
  const candidates = collectCssMatches(selector, wantedIndex + 1);
  const hit = candidates[wantedIndex];
  return hit ?? null;
}

/**
 * Resolve a CSS selector to the match at `targetIndexRaw` (zero-based),
 * additionally descending into closed shadow roots when
 * `window.__stagehandV3__.getClosedRoot` is available.
 *
 * Without that hook the lookup is delegated to `collectCssMatches`
 * (document + open shadow roots only).
 *
 * @returns The matched element, or `null` when the selector is blank or there
 *   are not enough matches.
 */
export function resolveCssSelectorPierce(
  selectorRaw: string,
  targetIndexRaw?: number,
): Element | null {
  const selector = String(selectorRaw ?? "").trim();
  if (!selector) return null;

  const targetIndex = parseTargetIndex(targetIndexRaw);
  const needed = targetIndex + 1;

  const piercer = window.__stagehandV3__;
  if (!piercer || typeof piercer.getClosedRoot !== "function") {
    return collectCssMatches(selector, needed)[targetIndex] ?? null;
  }

  // Never let a misbehaving hook abort the search.
  const closedRootOf = (host: Element): ShadowRoot | null => {
    try {
      return piercer.getClosedRoot(host) ?? null;
    } catch {
      return null;
    }
  };

  const hits: Element[] = [];
  const hitSet = new Set<Element>();
  const visitedRoots = new WeakSet<Node>();
  const pending: Array<Document | ShadowRoot> = [document];

  while (pending.length > 0 && hits.length < needed) {
    const root = pending.shift();
    if (!root || visitedRoots.has(root)) continue;
    visitedRoots.add(root);

    try {
      for (const candidate of root.querySelectorAll(selector)) {
        if (hitSet.has(candidate)) continue;
        hitSet.add(candidate);
        hits.push(candidate);
        if (hits.length >= needed) break;
      }
    } catch {
      // ignore query errors
    }
    // Enough matches: skip discovering further shadow roots.
    if (hits.length >= needed) break;

    try {
      const ownerDocument =
        root instanceof Document
          ? root
          : (root.host?.ownerDocument ?? document);
      const walker = ownerDocument.createTreeWalker(
        root,
        NodeFilter.SHOW_ELEMENT,
      );
      for (let node = walker.nextNode(); node; node = walker.nextNode()) {
        if (!(node instanceof Element)) continue;
        const openRoot = node.shadowRoot;
        if (openRoot) pending.push(openRoot);
        const closedRoot = closedRootOf(node);
        if (closedRoot) pending.push(closedRoot);
      }
    } catch {
      // ignore traversal issues
    }
  }

  return hits[targetIndex] ?? null;
}

/**
 * Resolve a text selector: find an element whose text contains `rawNeedle`
 * (case-insensitive substring match).
 *
 * The search covers the document, every open shadow root, and any closed
 * shadow root exposed through `window.__stagehandV3__.getClosedRoot`. Text is
 * taken from `innerText` when it is non-blank, otherwise from `textContent`;
 * structural tags (`html`, `body`, `head`, `script`, `style`, ...) never match.
 *
 * Only "innermost" matches are kept: a matching element is discarded when it
 * contains another matching element, so the result points at the most
 * specific node rather than its ancestors.
 *
 * @param rawNeedle - Text to look for; an empty needle resolves to `null`.
 * @param targetIndexRaw - Zero-based index among the innermost matches.
 * @returns The selected element, or `null` when there is no such match.
 */
export function resolveTextSelector(
  rawNeedle: string,
  targetIndexRaw?: number,
): Element | null {
  const needle = String(rawNeedle ?? "");
  if (!needle) return null;
  const needleLc = needle.toLowerCase();
  const targetIndex = parseTargetIndex(targetIndexRaw);

  const skipTags = new Set([
    "SCRIPT",
    "STYLE",
    "TEMPLATE",
    "NOSCRIPT",
    "HEAD",
    "TITLE",
    "LINK",
    "META",
    "HTML",
    "BODY",
  ]);

  const shouldSkip = (node: Element | null | undefined): boolean => {
    if (!node) return false;
    const tag = node.tagName?.toUpperCase() ?? "";
    return skipTags.has(tag);
  };

  const extractText = (node: Element): string => {
    try {
      if (shouldSkip(node)) return "";
      const inner = (node as HTMLElement).innerText;
      if (typeof inner === "string" && inner.trim()) return inner.trim();
    } catch {
      // ignore
    }
    try {
      const text = node.textContent;
      if (typeof text === "string") return text.trim();
    } catch {
      // ignore
    }
    return "";
  };

  const matches = (node: Element): boolean => {
    const text = extractText(node);
    return !!text && text.toLowerCase().includes(needleLc);
  };

  const backdoor = window.__stagehandV3__;
  const getClosedRoot: (host: Element) => ShadowRoot | null =
    backdoor && typeof backdoor.getClosedRoot === "function"
      ? (host: Element): ShadowRoot | null => {
          try {
            return backdoor.getClosedRoot(host) ?? null;
          } catch {
            return null;
          }
        }
      : (host: Element): ShadowRoot | null => {
          void host;
          return null;
        };

  const seen = new WeakSet<Node>();
  const queue: Node[] = [];
  // Only the elements are needed downstream. Extracting the text a second
  // time per match would re-read `innerText` for no benefit.
  const matched: Element[] = [];

  const enqueue = (node: Node | null | undefined) => {
    if (!node || seen.has(node)) return;
    seen.add(node);
    queue.push(node);
  };

  const walkerFor = (root: Node): TreeWalker | null => {
    try {
      const doc =
        root instanceof Document
          ? root
          : ((root as Element)?.ownerDocument ?? document);
      return doc.createTreeWalker(root, NodeFilter.SHOW_ELEMENT);
    } catch {
      return null;
    }
  };

  enqueue(document);

  while (queue.length) {
    const root = queue.shift();
    if (!root) continue;

    // A TreeWalker never yields its own root, so test it here when it is an
    // element.
    if (root instanceof Element && matches(root)) {
      matched.push(root);
    }

    const walker = walkerFor(root);
    if (!walker) continue;

    let node: Node | null;
    while ((node = walker.nextNode())) {
      if (!(node instanceof Element)) continue;

      if (matches(node)) {
        matched.push(node);
      }

      const open = node.shadowRoot;
      if (open) enqueue(open);

      const closed = getClosedRoot(node);
      if (closed) enqueue(closed);
    }
  }

  const containsSafely = (outer: Element, inner: Element): boolean => {
    try {
      return outer.contains(inner);
    } catch {
      // ignore containment errors
      return false;
    }
  };

  // Keep only matches that do not contain any other match.
  const innermost = matched.filter(
    (candidate, i) =>
      !matched.some(
        (other, j) => j !== i && containsSafely(candidate, other),
      ),
  );

  return innermost[targetIndex] ?? null;
}

/**
 * Resolve an XPath to the match at `targetIndexRaw` (zero-based, default 0)
 * by delegating to `resolveXPathAtIndex` with shadow-DOM piercing enabled.
 */
export function resolveXPathMainWorld(
  rawXp: string,
  targetIndexRaw?: number,
): Element | null {
  return resolveXPathAtIndex(rawXp, parseTargetIndex(targetIndexRaw), {
    pierceShadow: true,
  });
}


================================================
FILE: packages/core/lib/v3/dom/locatorScripts/waitForSelector.ts
================================================
/**
 * waitForSelector - Waits for an element matching a selector to reach a specific state.
 * Supports both CSS selectors and XPath expressions.
 * Uses MutationObserver for efficiency and integrates with the V3 piercer for closed shadow roots.
 *
 * NOTE: This function runs inside the page context. Keep it dependency-free
 * and resilient to exceptions.
 */

import { resolveXPathFirst } from "./xpathResolver.js";

/** Element states that `waitForSelector` can wait for. */
type WaitForSelectorState = "attached" | "detached" | "visible" | "hidden";

/**
 * Check if a selector is an XPath expression.
 *
 * A selector is treated as XPath when it carries the `xpath=` prefix or starts
 * with `/`. The prefix is matched case-insensitively, mirroring how
 * `parseXPathSteps` strips it (`/^xpath=/i`), so `XPath=//div` is not
 * misrouted to the CSS engine.
 */
const isXPath = (selector: string): boolean => {
  return /^xpath=/i.test(selector) || selector.startsWith("/");
};

/**
 * Look up the closed shadow root of `element` through the V3 piercer
 * (`window.__stagehandV3__.getClosedRoot`).
 *
 * Returns `null` when the piercer is not installed, reports no root, or throws.
 */
const getClosedRoot = (element: Element): ShadowRoot | null => {
  try {
    const piercer = window.__stagehandV3__;
    if (!piercer || typeof piercer.getClosedRoot !== "function") return null;
    return piercer.getClosedRoot(element) ?? null;
  } catch {
    return null;
  }
};

/**
 * Return the shadow root attached to `element`: the open one when present,
 * otherwise whatever the piercer reports for a closed root (possibly `null`).
 */
const getShadowRoot = (element: Element): ShadowRoot | null =>
  element.shadowRoot || getClosedRoot(element);

/**
 * `querySelector` that can also look inside shadow DOM.
 *
 * The selector is first tried directly on `root`. When `pierceShadow` is set
 * and that fails, every reachable shadow root (open, or closed via the
 * piercer) is searched breadth-first. Query and traversal errors are ignored.
 *
 * @returns The first match found, or `null`.
 */
const deepQuerySelector = (
  root: Document | ShadowRoot,
  selector: string,
  pierceShadow: boolean,
): Element | null => {
  // Invalid selectors throw; treat that as "no match".
  const queryIn = (scope: Document | ShadowRoot): Element | null => {
    try {
      return scope.querySelector(selector);
    } catch {
      return null;
    }
  };

  const direct = queryIn(root);
  if (direct) return direct;
  if (!pierceShadow) return null;

  const visited = new WeakSet<Node>();
  const pending: Array<Document | ShadowRoot> = [root];

  while (pending.length > 0) {
    const scope = pending.shift();
    if (!scope || visited.has(scope)) continue;
    visited.add(scope);

    const nested = queryIn(scope);
    if (nested) return nested;

    // Discover shadow hosts inside this scope and queue their roots.
    try {
      const ownerDoc =
        scope instanceof Document
          ? scope
          : (scope.host?.ownerDocument ?? document);
      const walker = ownerDoc.createTreeWalker(scope, NodeFilter.SHOW_ELEMENT);
      for (let node = walker.nextNode(); node; node = walker.nextNode()) {
        if (!(node instanceof Element)) continue;
        const shadow = getShadowRoot(node);
        if (shadow && !visited.has(shadow)) pending.push(shadow);
      }
    } catch {
      // ignore traversal errors
    }
  }

  return null;
};

/**
 * Resolve an XPath to its first match by delegating to `resolveXPathFirst`,
 * forwarding the shadow-piercing flag.
 */
const deepXPathQuery = (
  xpath: string,
  pierceShadow: boolean,
): Element | null => resolveXPathFirst(xpath, { pierceShadow });

/**
 * Locate the first element for `selector`, dispatching to the XPath resolver
 * when the selector looks like XPath and to the CSS deep query otherwise.
 */
const findElement = (
  selector: string,
  pierceShadow: boolean,
): Element | null =>
  isXPath(selector)
    ? deepXPathQuery(selector, pierceShadow)
    : deepQuerySelector(document, selector, pierceShadow);

/**
 * Decide whether `el` satisfies the requested state.
 *
 * - `detached` / `attached` depend only on whether an element was found.
 * - `hidden` requires an element that is `display: none`,
 *   `visibility: hidden`, `opacity: 0`, or has a zero width or height.
 * - anything else is treated as `visible`: none of those CSS conditions and a
 *   strictly positive width and height.
 *
 * A missing element, or an error while reading style/geometry, is `false` for
 * both `hidden` and `visible`.
 */
const checkState = (
  el: Element | null,
  state: WaitForSelectorState,
): boolean => {
  switch (state) {
    case "detached":
      return el === null;
    case "attached":
      return el !== null;
  }
  if (el === null) return false;

  try {
    const style = window.getComputedStyle(el);
    const rect = el.getBoundingClientRect();
    const hiddenByCss =
      style.display === "none" ||
      style.visibility === "hidden" ||
      style.opacity === "0";

    if (state === "hidden") {
      return hiddenByCss || rect.width === 0 || rect.height === 0;
    }
    // state === "visible"
    return !hiddenByCss && rect.width > 0 && rect.height > 0;
  } catch {
    return false;
  }
};

/**
 * Attach a MutationObserver to every shadow root currently reachable from the
 * document element (falling back to the body), so that `callback` also fires
 * for changes inside shadow DOM.
 *
 * Each created observer is appended to `observers` so the caller can
 * disconnect it later. Each shadow root is observed at most once.
 */
const setupShadowObservers = (
  callback: () => void,
  observers: MutationObserver[],
): void => {
  const watched = new WeakSet<Node>();

  const descend = (host: Element): void => {
    const shadow = getShadowRoot(host);
    if (shadow && !watched.has(shadow)) {
      watched.add(shadow);

      const watcher = new MutationObserver(callback);
      watcher.observe(shadow, {
        childList: true,
        subtree: true,
        attributes: true,
        attributeFilter: ["style", "class", "hidden", "disabled"],
      });
      observers.push(watcher);

      // Shadow content may host further shadow roots.
      Array.from(shadow.children).forEach((child) => descend(child));
    }

    // Light-DOM children are walked regardless of whether a root was found.
    Array.from(host.children).forEach((child) => descend(child));
  };

  const start = document.documentElement || document.body;
  if (start) descend(start);
};

/**
 * Wait for an element matching the selector to reach the specified state.
 * Supports both CSS selectors and XPath expressions (prefix with "xpath=" or start with "/").
 *
 * The condition is checked once immediately and then re-checked whenever a
 * MutationObserver on the document (and, when piercing, on each known shadow
 * root) reports a change. If the document has neither a body nor a document
 * element yet, observation starts on `DOMContentLoaded`.
 *
 * @param selectorRaw - CSS selector or XPath expression to wait for
 * @param stateRaw - Element state: 'attached' | 'detached' | 'visible' | 'hidden'
 *   (defaults to 'visible')
 * @param timeoutRaw - Maximum time to wait in milliseconds (defaults to 30000
 *   when missing or not a positive number)
 * @param pierceShadowRaw - Whether to search inside shadow DOM (defaults to
 *   true; only an explicit `false` disables it)
 * @returns Promise that resolves to true when condition is met, or rejects on timeout
 */
export function waitForSelector(
  selectorRaw: string,
  stateRaw?: string,
  timeoutRaw?: number,
  pierceShadowRaw?: boolean,
): Promise<boolean> {
  const selector = String(selectorRaw ?? "").trim();
  const state =
    (String(stateRaw ?? "visible") as WaitForSelectorState) || "visible";
  const timeout =
    typeof timeoutRaw === "number" && timeoutRaw > 0 ? timeoutRaw : 30000;
  const pierceShadow = pierceShadowRaw !== false;

  return new Promise<boolean>((resolve, reject) => {
    // Check immediately
    if (checkState(findElement(selector, pierceShadow), state)) {
      resolve(true);
      return;
    }

    let settled = false;
    let timeoutId: ReturnType<typeof setTimeout> | null = null;
    let domReadyHandler: (() => void) | null = null;
    const observers: MutationObserver[] = [];

    // Release every resource held by this wait: timer, observers, listener.
    const cleanup = (): void => {
      if (timeoutId !== null) {
        clearTimeout(timeoutId);
        timeoutId = null;
      }
      for (const obs of observers) {
        obs.disconnect();
      }
      if (domReadyHandler) {
        document.removeEventListener("DOMContentLoaded", domReadyHandler);
        domReadyHandler = null;
      }
    };

    const check = (): void => {
      if (settled) return;
      const el = findElement(selector, pierceShadow);
      if (checkState(el, state)) {
        settled = true;
        cleanup();
        resolve(true);
      }
    };

    // Declared BEFORE the "document not ready" branch below: that branch's
    // DOMContentLoaded handler calls this function, and a `const` declared
    // after an early `return` would still be in its temporal dead zone.
    const setupObservers = (): void => {
      const root = document.body || document.documentElement;
      if (!root) return;

      // Main document observer
      const mainObserver = new MutationObserver(check);
      mainObserver.observe(root, {
        childList: true,
        subtree: true,
        attributes: true,
        attributeFilter: ["style", "class", "hidden", "disabled"],
      });
      observers.push(mainObserver);

      // Shadow DOM observers (if piercing)
      if (pierceShadow) {
        setupShadowObservers(check, observers);
      }
    };

    if (document.body || document.documentElement) {
      setupObservers();
    } else {
      // Handle case where the document has no root to observe yet.
      const onDomReady = (): void => {
        document.removeEventListener("DOMContentLoaded", onDomReady);
        domReadyHandler = null;
        check();
        // If the check just settled the promise, do not create observers
        // that nobody would ever disconnect.
        if (!settled) setupObservers();
      };
      domReadyHandler = onDomReady;
      document.addEventListener("DOMContentLoaded", onDomReady);
    }

    // Set up timeout
    timeoutId = setTimeout(() => {
      if (settled) return;
      settled = true;
      cleanup();
      reject(
        new Error(
          `waitForSelector: Timeout ${timeout}ms exceeded waiting for "${selector}" to be ${state}`,
        ),
      );
    }, timeout);
  });
}


================================================
FILE: packages/core/lib/v3/dom/locatorScripts/xpathParser.ts
================================================
/**
 * Parsed form of one XPath predicate (the expression inside `[...]`).
 *
 * Where present, `normalize: true` means both the element's value and the
 * predicate's `value` are whitespace-normalized (runs collapsed to a single
 * space, ends trimmed) before they are compared.
 */
export type XPathPredicate =
  // Positional predicate such as `[2]`; the parser clamps the index to >= 1.
  | { type: "index"; index: number }
  // `@name = 'value'`
  | { type: "attrEquals"; name: string; value: string; normalize?: boolean }
  // `@name` (attribute is present)
  | { type: "attrExists"; name: string }
  // `contains(@name, 'value')`
  | {
      type: "attrContains";
      name: string;
      value: string;
      normalize?: boolean;
    }
  // `starts-with(@name, 'value')`
  | {
      type: "attrStartsWith";
      name: string;
      value: string;
      normalize?: boolean;
    }
  // `text() = 'value'` or `. = 'value'`
  | { type: "textEquals"; value: string; normalize?: boolean }
  // `contains(text(), 'value')` or `contains(., 'value')`
  | { type: "textContains"; value: string; normalize?: boolean }
  // All sub-predicates must hold.
  | { type: "and"; predicates: XPathPredicate[] }
  // At least one sub-predicate must hold.
  | { type: "or"; predicates: XPathPredicate[] }
  // The wrapped predicate must not hold.
  | { type: "not"; predicate: XPathPredicate };

/** One location step of a parsed XPath, as produced by `parseXPathSteps`. */
export interface XPathStep {
  /** `"desc"` when the step was introduced by `//`, otherwise `"child"`. */
  axis: "child" | "desc";
  /** Lower-cased tag name, or `*` when the step names no tag. */
  tag: string;
  /** Successfully parsed predicates in source order; unparseable ones are omitted. */
  predicates: XPathPredicate[];
}

/**
 * Split an XPath expression into traversal steps.
 *
 * This is deliberately a subset parser meant for walking the composed DOM
 * (shadow roots included); it does not implement the full XPath spec.
 *
 * Supported:
 *  - Child (`/`) and descendant (`//`) axes
 *  - Tag names and the wildcard (`*`)
 *  - Positional indices (`[n]`)
 *  - Attribute equality (`[@attr='value']`, `[@attr="value"]`)
 *  - Attribute existence (`[@attr]`)
 *  - Attribute contains/starts-with (`contains(@attr,'v')`, `starts-with(@attr,'v')`)
 *  - Text equality/contains (`[text()='v']`, `[contains(text(),'v')]`, `[.='v']`)
 *  - normalize-space on text/attributes (`[normalize-space(text())='v']`)
 *  - Basic boolean predicates (`and`, `or`, `not(...)`)
 *  - Several predicates on one step (`[@class='foo'][2]`)
 *  - An optional `xpath=` prefix
 *
 * Not supported:
 *  - Position functions (`[position() > n]`, `[last()]`)
 *  - Axes other than child/descendant (`ancestor::`, `parent::`, `self::`,
 *    `preceding-sibling::`, `following-sibling::`)
 *  - The union operator (`|`)
 *  - Grouped expressions (`(//div)[n]`)
 *
 * Predicates that cannot be parsed are dropped without error: the step still
 * matches on its tag name, the unrecognized predicate simply filters nothing.
 *
 * @param input - XPath text; blank input yields an empty list.
 * @returns The steps in source order.
 */
export function parseXPathSteps(input: string): XPathStep[] {
  const path = String(input || "")
    .trim()
    .replace(/^xpath=/i, "");
  if (!path) return [];

  const steps: XPathStep[] = [];
  let pos = 0;

  while (pos < path.length) {
    // Consume the axis marker, if any.
    let axis: XPathStep["axis"] = "child";
    if (path.startsWith("//", pos)) {
      axis = "desc";
      pos += 2;
    } else if (path[pos] === "/") {
      pos += 1;
    }

    // Scan to the next `/` that is outside both brackets and quotes.
    const stepStart = pos;
    let depth = 0;
    let openQuote: string | null = null;
    for (; pos < path.length; pos += 1) {
      const ch = path[pos];
      if (openQuote) {
        if (ch === openQuote) openQuote = null;
        continue;
      }
      if (ch === "'" || ch === '"') {
        openQuote = ch;
      } else if (ch === "[") {
        depth += 1;
      } else if (ch === "]") {
        depth -= 1;
      } else if (ch === "/" && depth === 0) {
        break;
      }
    }

    const rawStep = path.slice(stepStart, pos).trim();
    if (rawStep) {
      const { tag, predicates } = parseStep(rawStep);
      steps.push({ axis, tag, predicates });
    }
  }

  return steps;
}

/**
 * Pull the body of every `[...]` group out of a string such as
 * `[@attr='val'][2]`.
 *
 * A `]` inside a quoted value (e.g. `[@title='a[0]']`) does not close the
 * group. An unterminated group yields everything up to the end of the string.
 */
function extractPredicates(str: string): string[] {
  const bodies: string[] = [];

  let open = str.indexOf("[");
  while (open !== -1) {
    const bodyStart = open + 1;
    let end = bodyStart;
    let openQuote: string | null = null;
    for (; end < str.length; end += 1) {
      const ch = str[end];
      if (openQuote) {
        if (ch === openQuote) openQuote = null;
      } else if (ch === "'" || ch === '"') {
        openQuote = ch;
      } else if (ch === "]") {
        break;
      }
    }
    bodies.push(str.slice(bodyStart, end).trim());
    // Resume after the closing bracket.
    open = str.indexOf("[", end + 1);
  }

  return bodies;
}

/**
 * Split one raw step such as `div[@id='x'][2]` into its lower-cased tag name
 * (`*` when the name is empty) and its parsed predicates. Predicates that fail
 * to parse are left out.
 */
function parseStep(raw: string): {
  tag: string;
  predicates: XPathPredicate[];
} {
  const open = raw.indexOf("[");
  const namePart = open === -1 ? raw : raw.slice(0, open).trim();
  const tag = namePart === "" ? "*" : namePart.toLowerCase();
  if (open === -1) return { tag, predicates: [] };

  const predicates = extractPredicates(raw.slice(open))
    .map((body) => parsePredicateExpression(body))
    .filter((parsed): parsed is XPathPredicate => Boolean(parsed));

  return { tag, predicates };
}

/**
 * Parse the text of one predicate into an `XPathPredicate` tree.
 *
 * Precedence, loosest first: top-level `or`, then top-level `and`, then a
 * whole-expression `not(...)`, then an atomic predicate. If any operand of an
 * `or`/`and` (or the argument of `not`) cannot be parsed, the whole
 * expression is rejected.
 *
 * @returns The parsed predicate, or `null` for blank/unsupported input.
 */
function parsePredicateExpression(input: string): XPathPredicate | null {
  const trimmed = input.trim();
  if (!trimmed) return null;

  for (const operator of ["or", "and"] as const) {
    const operands = splitTopLevel(trimmed, operator);
    if (operands.length <= 1) continue;

    const parsed = operands.map((operand) => parsePredicateExpression(operand));
    const predicates = parsed.filter(
      (p): p is XPathPredicate => Boolean(p),
    );
    if (predicates.length !== operands.length) return null;
    return { type: operator, predicates };
  }

  const negated = unwrapFunctionCall(trimmed, "not");
  if (negated == null) return parseAtomicPredicate(trimmed);

  const predicate = parsePredicateExpression(negated);
  return predicate ? { type: "not", predicate } : null;
}

/**
 * Parse a single predicate with no boolean operators.
 *
 * Recognized forms (`'v'` may use single or double quotes):
 *  - `n`                                   -> index (clamped to at least 1)
 *  - `@attr`                               -> attrExists
 *  - `@attr = 'v'`                         -> attrEquals
 *  - `contains(@attr, 'v')`                -> attrContains
 *  - `starts-with(@attr, 'v')`             -> attrStartsWith
 *  - `text() = 'v'` / `. = 'v'`            -> textEquals
 *  - `contains(text(), 'v')` / `contains(., 'v')` -> textContains
 *
 * In every form except `n` and bare `@attr`, the operand (`@attr`, `text()`
 * or `.`) may be wrapped in `normalize-space(...)`, which sets
 * `normalize: true` on the result. Without the wrapper no `normalize` key is
 * emitted.
 *
 * @returns The parsed predicate, or `null` when the input matches none of the
 *   forms above (the caller then ignores the predicate).
 */
function parseAtomicPredicate(input: string): XPathPredicate | null {
  const attrName = "[a-zA-Z_][\\w.-]*";
  const quoted = "(?:'([^']*)'|\"([^\"]*)\")";
  const attrRef = `@(${attrName})`;
  const textRef = "(?:text\\(\\)|\\.)";

  const normalized = (operand: string): string =>
    `normalize-space\\(\\s*${operand}\\s*\\)`;
  // Every pattern must match the whole predicate.
  const matchWhole = (pattern: string): RegExpMatchArray | null =>
    input.match(new RegExp(`^${pattern}$`));
  // `quoted` exposes two groups (single-/double-quoted); take whichever hit.
  const literalAt = (m: RegExpMatchArray, group: number): string =>
    m[group] ?? m[group + 1] ?? "";

  if (/^\d+$/.test(input)) {
    return { type: "index", index: Math.max(1, Number(input)) };
  }

  const attrExists = matchWhole(attrRef);
  if (attrExists) {
    return { type: "attrExists", name: attrExists[1] };
  }

  // The patterns below are mutually exclusive, so their order is irrelevant.
  for (const normalize of [true, false]) {
    const attr = normalize ? normalized(attrRef) : attrRef;
    const text = normalize ? normalized(textRef) : textRef;
    const flag: { normalize?: boolean } = normalize ? { normalize: true } : {};

    const attrEquals = matchWhole(`${attr}\\s*=\\s*${quoted}`);
    if (attrEquals) {
      return {
        type: "attrEquals",
        name: attrEquals[1],
        value: literalAt(attrEquals, 2),
        ...flag,
      };
    }

    const attrContains = matchWhole(
      `contains\\(\\s*${attr}\\s*,\\s*${quoted}\\s*\\)`,
    );
    if (attrContains) {
      return {
        type: "attrContains",
        name: attrContains[1],
        value: literalAt(attrContains, 2),
        ...flag,
      };
    }

    const attrStarts = matchWhole(
      `starts-with\\(\\s*${attr}\\s*,\\s*${quoted}\\s*\\)`,
    );
    if (attrStarts) {
      return {
        type: "attrStartsWith",
        name: attrStarts[1],
        value: literalAt(attrStarts, 2),
        ...flag,
      };
    }

    const textEquals = matchWhole(`${text}\\s*=\\s*${quoted}`);
    if (textEquals) {
      return { type: "textEquals", value: literalAt(textEquals, 1), ...flag };
    }

    const textContains = matchWhole(
      `contains\\(\\s*${text}\\s*,\\s*${quoted}\\s*\\)`,
    );
    if (textContains) {
      return {
        type: "textContains",
        value: literalAt(textContains, 1),
        ...flag,
      };
    }
  }

  return null;
}

/**
 * Split `input` on every occurrence of `keyword` that sits outside quotes and
 * outside parentheses and is recognized by `isKeywordAt`.
 *
 * Segments are trimmed and empty segments are dropped, so an input without
 * the keyword comes back as a single-element list (or an empty list when the
 * input is blank).
 */
function splitTopLevel(input: string, keyword: string): string[] {
  const pieces: string[] = [];
  let segmentStart = 0;
  let parenDepth = 0;
  let openQuote: string | null = null;

  let pos = 0;
  while (pos < input.length) {
    const ch = input[pos];
    let advance = 1;

    if (openQuote) {
      if (ch === openQuote) openQuote = null;
    } else if (ch === "'" || ch === '"') {
      openQuote = ch;
    } else if (ch === "(") {
      parenDepth += 1;
    } else if (ch === ")") {
      // Tolerate stray closing parens instead of going negative.
      parenDepth = Math.max(0, parenDepth - 1);
    } else if (parenDepth === 0 && isKeywordAt(input, pos, keyword)) {
      pieces.push(input.slice(segmentStart, pos).trim());
      advance = keyword.length;
      segmentStart = pos + advance;
    }

    pos += advance;
  }

  pieces.push(input.slice(segmentStart).trim());
  return pieces.filter((piece) => piece.length > 0);
}

/**
 * Tell whether `keyword` occurs at `index` as a standalone word: it must not
 * be an attribute name (preceded by `@`) and must have a boundary character
 * on both sides. The start and end of the input count as boundaries.
 */
function isKeywordAt(input: string, index: number, keyword: string): boolean {
  if (!input.startsWith(keyword, index)) return false;

  const prev = index > 0 ? input[index - 1] : " ";
  if (prev === "@") return false;

  const end = index + keyword.length;
  const next = end < input.length ? input[end] : " ";
  return isBoundary(prev) && isBoundary(next);
}

/**
 * A boundary is any text containing no identifier character (ASCII letter,
 * digit, `_`, `.` or `-`).
 */
function isBoundary(ch: string): boolean {
  const identifierChar = /[\w.-]/;
  return identifierChar.test(ch) === false;
}

/**
 * If `input` is exactly one call `name(...)`, return the text between the
 * outer parentheses; otherwise return `null`.
 *
 * The inner text must have balanced parentheses, which rejects inputs such as
 * `not(a) and not(b)` that merely start and end like a single call.
 */
function unwrapFunctionCall(input: string, name: string): string | null {
  const opener = `${name}(`;
  const looksWrapped = input.startsWith(opener) && input.endsWith(")");
  if (!looksWrapped) return null;

  const body = input.slice(opener.length, -1);
  if (!hasBalancedParens(body)) return null;
  return body;
}

/**
 * Check that parentheses outside quoted strings are balanced: never more
 * closers than openers at any point, and equal counts at the end.
 */
function hasBalancedParens(input: string): boolean {
  let open = 0;
  let activeQuote: string | null = null;

  for (const ch of input) {
    if (activeQuote) {
      if (ch === activeQuote) activeQuote = null;
    } else if (ch === "'" || ch === '"') {
      activeQuote = ch;
    } else if (ch === "(") {
      open += 1;
    } else if (ch === ")") {
      open -= 1;
      if (open < 0) return false;
    }
  }

  return open === 0;
}

/** Collapses each whitespace run to a single space and trims both ends. */
const normalizeSpace = (value: string): string => {
  const collapsed = value.replace(/\s+/g, " ");
  return collapsed.trim();
};

/** Returns the element's `textContent` as a string, or `""` when it is null or undefined. */
function textValue(element: Element): string {
  const raw = element.textContent;
  return String(raw ?? "");
}

/**
 * Returns `value` unchanged unless `normalize` is truthy, in which case the
 * whitespace-normalised form from `normalizeSpace` is returned.
 */
function normalizeMaybe(value: string, normalize?: boolean): string {
  if (!normalize) return value;
  return normalizeSpace(value);
}

/**
 * Tests a single element against a single parsed XPath predicate.
 *
 * Attribute predicates fail when the attribute is absent. Attribute and text
 * comparisons apply whitespace normalisation to both sides when the
 * predicate's `normalize` flag is set. Positional (`index`) predicates and
 * unrecognised predicate types always pass here; `applyPredicates` handles
 * positional selection at list level.
 *
 * @param element - Candidate element.
 * @param predicate - Parsed predicate to evaluate.
 * @returns Whether the element satisfies the predicate.
 */
export function evaluatePredicate(
  element: Element,
  predicate: XPathPredicate,
): boolean {
  switch (predicate.type) {
    case "and":
      return predicate.predicates.every((inner) =>
        evaluatePredicate(element, inner),
      );
    case "or":
      return predicate.predicates.some((inner) =>
        evaluatePredicate(element, inner),
      );
    case "not": {
      const innerHolds = evaluatePredicate(element, predicate.predicate);
      return !innerHolds;
    }
    case "attrExists": {
      const actual = element.getAttribute(predicate.name);
      return actual !== null;
    }
    case "attrEquals": {
      const actual = element.getAttribute(predicate.name);
      if (actual === null) return false;
      const haystack = normalizeMaybe(actual, predicate.normalize);
      const needle = normalizeMaybe(predicate.value, predicate.normalize);
      return haystack === needle;
    }
    case "attrContains": {
      const actual = element.getAttribute(predicate.name);
      if (actual === null) return false;
      const haystack = normalizeMaybe(actual, predicate.normalize);
      const needle = normalizeMaybe(predicate.value, predicate.normalize);
      return haystack.includes(needle);
    }
    case "attrStartsWith": {
      const actual = element.getAttribute(predicate.name);
      if (actual === null) return false;
      const haystack = normalizeMaybe(actual, predicate.normalize);
      const needle = normalizeMaybe(predicate.value, predicate.normalize);
      return haystack.startsWith(needle);
    }
    case "textEquals": {
      const haystack = normalizeMaybe(textValue(element), predicate.normalize);
      const needle = normalizeMaybe(predicate.value, predicate.normalize);
      return haystack === needle;
    }
    case "textContains": {
      const haystack = normalizeMaybe(textValue(element), predicate.normalize);
      const needle = normalizeMaybe(predicate.value, predicate.normalize);
      return haystack.includes(needle);
    }
    case "index":
    default:
      // Positional and unknown predicates do not filter individual elements.
      return true;
  }
}

/**
 * Narrows `elements` by applying `predicates` one after another.
 *
 * An `index` predicate selects the element at that 1-based position within
 * the list as narrowed so far (or nothing when out of range); every other
 * predicate filters the list through `evaluatePredicate`.
 *
 * @returns The surviving elements; `[]` as soon as the list becomes empty
 * while predicates remain.
 */
export function applyPredicates(
  elements: Element[],
  predicates: XPathPredicate[],
): Element[] {
  let remaining = elements;

  for (const predicate of predicates) {
    if (remaining.length === 0) return [];

    if (predicate.type !== "index") {
      remaining = remaining.filter((candidate) =>
        evaluatePredicate(candidate, predicate),
      );
      continue;
    }

    // XPath positions are 1-based; convert to an array offset.
    const offset = predicate.index - 1;
    const inRange = offset >= 0 && offset < remaining.length;
    remaining = inRange ? [remaining[offset]!] : [];
  }

  return remaining;
}


================================================
FILE: packages/core/lib/v3/dom/locatorScripts/xpathResolver.ts
================================================
import {
  applyPredicates,
  parseXPathSteps,
  type XPathStep,
} from "./xpathParser.js";

/** Callback that returns the shadow root known for `host`, or `null` when there is none. */
type ClosedRootGetter = (host: Element) => ShadowRoot | null;

/** Options accepted by the exported XPath resolution helpers. */
export type XPathResolveOptions = {
  /** Shadow-DOM traversal is enabled unless this is explicitly `false`. */
  pierceShadow?: boolean;
};

/** Shadow-DOM facts gathered by `getShadowContext` for one resolution call. */
type ShadowContext = {
  /** Guarded closed-root lookup, or `null` when the page backdoor does not provide one. */
  getClosedRoot: ClosedRootGetter | null;
  /** True when the backdoor stats report a shadow root or a document scan finds an open one. */
  hasShadow: boolean;
};

/**
 * Trims a selector and strips a leading, case-insensitive `xpath=` prefix.
 * Null/undefined or blank input yields `""`.
 */
const normalizeXPath = (selector: string): string => {
  const trimmed = String(selector ?? "").trim();
  return trimmed ? trimmed.replace(/^xpath=/i, "").trim() : "";
};

/**
 * Resolves the first element matching `rawXp`.
 *
 * @param rawXp - XPath expression, optionally prefixed with `xpath=`.
 * @param options - Resolution options forwarded to `resolveXPathAtIndex`.
 * @returns The first match, or `null` when nothing matches.
 */
export function resolveXPathFirst(
  rawXp: string,
  options?: XPathResolveOptions,
): Element | null {
  const firstMatchIndex = 0;
  return resolveXPathAtIndex(rawXp, firstMatchIndex, options);
}

/**
 * Resolves the `index`-th (0-based) element matching `rawXp`.
 *
 * With `pierceShadow: false` only the native `document.evaluate` result is
 * used. Otherwise, when no shadow roots are detected the native result is
 * preferred and the composed-tree resolver is used only if native evaluation
 * throws; when shadow roots exist the composed-tree resolver is always used.
 *
 * @param rawXp - XPath expression, optionally prefixed with `xpath=`.
 * @param index - Zero-based match position; fractional values are floored.
 * @param options - Resolution options.
 * @returns The matching element, or `null` for invalid input or no match.
 */
export function resolveXPathAtIndex(
  rawXp: string,
  index: number,
  options?: XPathResolveOptions,
): Element | null {
  if (!Number.isFinite(index) || index < 0) return null;
  const xp = normalizeXPath(rawXp);
  if (!xp) return null;

  const targetIndex = Math.floor(index);

  if (options?.pierceShadow === false) {
    return resolveNativeAtIndexWithError(xp, targetIndex).value;
  }

  const { getClosedRoot, hasShadow } = getShadowContext();

  if (!hasShadow) {
    // No shadow DOM on the page: the native evaluator is sufficient unless
    // it rejects the expression outright.
    const nativeResult = resolveNativeAtIndexWithError(xp, targetIndex);
    if (!nativeResult.error) return nativeResult.value;
  }

  const composedMatches = resolveXPathComposedMatches(xp, getClosedRoot);
  return composedMatches[targetIndex] ?? null;
}

/**
 * Counts the elements matching `rawXp`.
 *
 * Uses the same strategy selection as `resolveXPathAtIndex`: native only when
 * `pierceShadow` is `false`; native with a composed-tree fallback on error
 * when no shadow roots are detected; composed-tree otherwise.
 *
 * @returns The number of matches, or 0 for a blank expression.
 */
export function countXPathMatches(
  rawXp: string,
  options?: XPathResolveOptions,
): number {
  const xp = normalizeXPath(rawXp);
  if (!xp) return 0;

  if (options?.pierceShadow === false) {
    return resolveNativeCountWithError(xp).count;
  }

  const { getClosedRoot, hasShadow } = getShadowContext();

  if (!hasShadow) {
    const nativeResult = resolveNativeCountWithError(xp);
    if (!nativeResult.error) return nativeResult.count;
  }

  return resolveXPathComposedMatches(xp, getClosedRoot).length;
}

/**
 * Evaluates an XPath over the composed tree (light DOM plus shadow roots)
 * using the step list produced by `parseXPathSteps`.
 *
 * Starting from `document`, each step gathers either the composed children
 * or the composed descendants of every current root, keeps those matching
 * the step's tag, applies the step's predicates per root, and de-duplicates
 * the survivors in encounter order.
 *
 * @param rawXp - XPath expression, optionally prefixed with `xpath=`.
 * @param getClosedRoot - Optional lookup used to enter closed shadow roots.
 * @returns Matching elements; `[]` when the expression is blank, parses to
 * no steps, or any step yields no match.
 */
export function resolveXPathComposedMatches(
  rawXp: string,
  getClosedRoot?: ClosedRootGetter | null,
): Element[] {
  const xp = normalizeXPath(rawXp);
  if (!xp) return [];

  const steps = parseXPathSteps(xp);
  if (steps.length === 0) return [];

  const closedRootGetter = getClosedRoot ?? null;

  let frontier: Array<Document | Element | ShadowRoot | DocumentFragment> = [
    document,
  ];

  for (const step of steps) {
    const gather =
      step.axis === "child" ? composedChildren : composedDescendants;
    // A Set keeps insertion order, giving de-duplication and ordering at once.
    const matched = new Set<Element>();

    for (const root of frontier) {
      if (!root) continue;

      const candidates = gather(root, closedRootGetter);
      if (candidates.length === 0) continue;

      const withTag = candidates.filter((candidate) =>
        matchesTag(candidate, step),
      );
      for (const survivor of applyPredicates(withTag, step.predicates)) {
        matched.add(survivor);
      }
    }

    if (matched.size === 0) return [];
    frontier = [...matched];
  }

  return frontier as Element[];
}

/** True when the step's tag is the `*` wildcard or equals the element's `localName`. */
function matchesTag(element: Element, step: XPathStep): boolean {
  const { tag } = step;
  return tag === "*" || element.localName === tag;
}

/**
 * Collects shadow-DOM information for the current page.
 *
 * `getClosedRoot` wraps the `window.__stagehandV3__` backdoor lookup so that
 * exceptions and `undefined` both surface as `null`; it is `null` when the
 * backdoor has no such function. `hasShadow` is taken from the backdoor's
 * `stats()` counters when available, and otherwise from a walk of the
 * document looking for any element with an open `shadowRoot`. Failures in
 * either probe are ignored.
 */
function getShadowContext(): ShadowContext {
  const backdoor = window.__stagehandV3__;

  let getClosedRoot: ClosedRootGetter | null = null;
  if (backdoor && typeof backdoor.getClosedRoot === "function") {
    getClosedRoot = (host: Element): ShadowRoot | null => {
      try {
        return backdoor.getClosedRoot(host) ?? null;
      } catch {
        return null;
      }
    };
  }

  let hasShadow = false;

  try {
    if (backdoor && typeof backdoor.stats === "function") {
      const stats = backdoor.stats();
      const openCount = stats?.open ?? 0;
      const closedCount = stats?.closed ?? 0;
      hasShadow = openCount > 0 || closedCount > 0;
    }
  } catch {
    // ignore stats errors
  }

  if (hasShadow) return { getClosedRoot, hasShadow };

  try {
    const walker = document.createTreeWalker(document, NodeFilter.SHOW_ELEMENT);
    let found = false;
    while (!found && walker.nextNode()) {
      found = Boolean((walker.currentNode as Element).shadowRoot);
    }
    hasShadow = found;
  } catch {
    // ignore scan errors
  }

  return { getClosedRoot, hasShadow };
}

/**
 * Lists the element children of `node` in the composed tree.
 *
 * - `Document`: its `documentElement`, if any.
 * - `ShadowRoot` / `DocumentFragment`: its element children.
 * - `Element`: its light-DOM children, then the children of its open shadow
 *   root, then the children of the root returned by `getClosedRoot`.
 *
 * @param node - Root whose children should be listed; nullish yields `[]`.
 * @param getClosedRoot - Optional lookup for shadow roots not reachable via
 * `element.shadowRoot`.
 * @returns A new array of child elements.
 */
function composedChildren(
  node: Node | null | undefined,
  getClosedRoot: ClosedRootGetter | null,
): Element[] {
  const out: Element[] = [];
  if (!node) return out;

  if (node instanceof Document) {
    if (node.documentElement) out.push(node.documentElement);
    return out;
  }

  if (node instanceof ShadowRoot || node instanceof DocumentFragment) {
    out.push(...Array.from(node.children ?? []));
    return out;
  }

  if (node instanceof Element) {
    out.push(...Array.from(node.children ?? []));
    const open = node.shadowRoot;
    if (open) out.push(...Array.from(open.children ?? []));
    if (getClosedRoot) {
      const closed = getClosedRoot(node);
      // The lookup may hand back the very root already expanded through
      // `node.shadowRoot` (the piercer records open roots too). Expanding it
      // again would list those children twice and shift positional
      // predicates evaluated over this list.
      if (closed && closed !== open) {
        out.push(...Array.from(closed.children ?? []));
      }
    }
    return out;
  }

  return out;
}

/**
 * Lists every descendant element of `node` in the composed tree, visiting
 * each element once in depth-first pre-order (children are expanded with
 * `composedChildren`).
 */
function composedDescendants(
  node: Node | null | undefined,
  getClosedRoot: ClosedRootGetter | null,
): Element[] {
  const ordered: Element[] = [];
  const visited = new Set<Element>();
  // The stack is popped from the end, so children go on in reverse to keep
  // the first child on top.
  const pending = composedChildren(node, getClosedRoot).slice().reverse();

  while (pending.length > 0) {
    const element = pending.pop();
    if (!element || visited.has(element)) continue;

    visited.add(element);
    ordered.push(element);

    const reversedKids = composedChildren(element, getClosedRoot)
      .slice()
      .reverse();
    for (const kid of reversedKids) {
      pending.push(kid);
    }
  }

  return ordered;
}

/**
 * Evaluates `xp` with the browser's `document.evaluate` and returns the
 * snapshot item at `index`.
 *
 * @returns `{ value, error: false }` on success (value may be `null` when
 * the index is out of range) or `{ value: null, error: true }` when
 * evaluation throws.
 */
function resolveNativeAtIndexWithError(
  xp: string,
  index: number,
): { value: Element | null; error: boolean } {
  let value: Element | null;
  try {
    const snapshot = document.evaluate(
      xp,
      document,
      null,
      XPathResult.ORDERED_NODE_SNAPSHOT_TYPE,
      null,
    );
    value = snapshot.snapshotItem(index) as Element | null;
  } catch {
    return { value: null, error: true };
  }
  return { value, error: false };
}

/**
 * Evaluates `xp` with the browser's `document.evaluate` and reports how many
 * nodes the ordered snapshot contains.
 *
 * @returns `{ count, error: false }` on success, or `{ count: 0, error: true }`
 * when evaluation throws.
 */
function resolveNativeCountWithError(xp: string): {
  count: number;
  error: boolean;
} {
  let count: number;
  try {
    count = document.evaluate(
      xp,
      document,
      null,
      XPathResult.ORDERED_NODE_SNAPSHOT_TYPE,
      null,
    ).snapshotLength;
  } catch {
    return { count: 0, error: true };
  }
  return { count, error: false };
}


================================================
FILE: packages/core/lib/v3/dom/piercer.entry.ts
================================================
import { installV3ShadowPiercer } from "./piercer.runtime.js";

// Entry script: installs the shadow piercer as soon as this module is
// evaluated, without tagging shadow roots that already exist.
installV3ShadowPiercer({ debug: true, tagExisting: false });


================================================
FILE: packages/core/lib/v3/dom/piercer.runtime.ts
================================================
/** Options accepted by `installV3ShadowPiercer`. */
export interface V3ShadowPatchOptions {
  /** Verbose-logging flag supplied by the caller. */
  debug?: boolean;
  /** When true, open shadow roots already present in the document are recorded at install time. */
  tagExisting?: boolean;
}

/** Object exposed on `window.__stagehandV3__` for querying tracked shadow roots. */
export interface StagehandV3Backdoor {
  /** Closed shadow-root accessors */
  getClosedRoot(host: Element): ShadowRoot | undefined;
  /** Stats + quick health check */
  stats(): {
    installed: true;
    url: string;
    isTop: boolean;
    open: number;
    closed: number;
  };
}

/** State shared between the patched `attachShadow` and the backdoor. */
type V3InternalState = {
  /** Shadow root recorded for each host on which `attachShadow` was observed. */
  hostToRoot: WeakMap<Element, ShadowRoot>;
  /** Number of roots counted as open. */
  openCount: number;
  /** Number of roots counted as closed. */
  closedCount: number;
  /** Whether console diagnostics are emitted. */
  debug: boolean;
};

// Augment the global Window type with the properties the piercer sets.
declare global {
  interface Window {
    __stagehandV3Injected?: boolean;
    __stagehandV3__?: StagehandV3Backdoor;
  }
}

/**
 * Patches `Element.prototype.attachShadow` so every shadow root created
 * afterwards is recorded, and exposes the record via `window.__stagehandV3__`.
 *
 * The call is idempotent: if the prototype method is already the patched
 * function, its shared state is reused, the debug flag is refreshed and the
 * backdoor is rebound without creating a new `WeakMap`.
 *
 * @param opts - `debug` toggles console diagnostics (defaults to `true`);
 * `tagExisting` additionally records open shadow roots already present in the
 * document (closed ones cannot be discovered after the fact).
 */
export function installV3ShadowPiercer(opts: V3ShadowPatchOptions = {}): void {
  // Logging stays on by default, but an explicit `debug: false` is honoured
  // instead of being ignored.
  const debug = opts.debug ?? true;

  type PatchedFn = Element["attachShadow"] & {
    __v3Patched?: boolean;
    __v3State?: V3InternalState;
  };

  const bindBackdoor = (state: V3InternalState): void => {
    const { hostToRoot } = state;

    window.__stagehandV3__ = {
      getClosedRoot: (host: Element) => hostToRoot.get(host),
      stats: () => ({
        installed: true,
        url: location.href,
        isTop: window.top === window,
        open: state.openCount,
        closed: state.closedCount,
      }),
    } satisfies StagehandV3Backdoor;
  };

  // Look at the *current* function on the prototype. If it's already our patched
  // function, reuse its shared state and rebind the backdoor (no new WeakMap).
  const currentFn = Element.prototype.attachShadow as PatchedFn;
  if (currentFn.__v3Patched && currentFn.__v3State) {
    currentFn.__v3State.debug = debug; // keep debug toggle consistent
    bindBackdoor(currentFn.__v3State);
    // idempotent: do not log "installed" again
    return;
  }

  // First-time install: create shared state and replace the prototype method
  const state: V3InternalState = {
    hostToRoot: new WeakMap<Element, ShadowRoot>(),
    openCount: 0,
    closedCount: 0,
    debug,
  };

  const original = currentFn; // keep a reference to call through
  const patched: PatchedFn = function (
    this: Element,
    init: ShadowRootInit,
  ): ShadowRoot {
    const mode = init?.mode ?? "open";
    const root = original.call(this, init);
    try {
      // Bookkeeping is best-effort: it must never break the page's own
      // attachShadow call, so failures here are swallowed.
      state.hostToRoot.set(this, root);
      if (mode === "closed") state.closedCount++;
      else state.openCount++;
      if (state.debug) {
        console.info("[v3-piercer] attachShadow", {
          tag: (this as Element).tagName?.toLowerCase() ?? "",
          mode,
          url: location.href,
        });
      }
    } catch {
      //
    }
    return root;
  } as PatchedFn;

  // Mark the *patched* function with metadata so re-entry sees it
  patched.__v3Patched = true;
  patched.__v3State = state;

  Object.defineProperty(Element.prototype, "attachShadow", {
    configurable: true,
    writable: true,
    value: patched,
  });

  // Optionally tag existing open roots (closed cannot be discovered post-hoc)
  if (opts.tagExisting) {
    try {
      const walker = document.createTreeWalker(
        document,
        NodeFilter.SHOW_ELEMENT,
      );
      while (walker.nextNode()) {
        const el = walker.currentNode as Element;
        if (el.shadowRoot) {
          state.hostToRoot.set(el, el.shadowRoot);
          state.openCount++;
        }
      }
    } catch {
      //
    }
  }

  window.__stagehandV3Injected = true;
  bindBackdoor(state);

  if (state.debug) {
    console.info("[v3-piercer] installed", {
      url: location.href,
      isTop: window.top === window,
      readyState: document.readyState,
    });
  }
}


================================================
FILE: packages/core/lib/v3/dom/rerenderMissingShadows.entry.ts
================================================
import { rerenderMissingShadowHosts } from "./rerenderMissingShadows.runtime.js";

// Entry script: runs the re-render pass once, as soon as this module is evaluated.
rerenderMissingShadowHosts();


================================================
FILE: packages/core/lib/v3/dom/rerenderMissingShadows.runtime.ts
================================================
/**
 * Replaces registered custom elements that have no known shadow root with a
 * deep clone of themselves.
 *
 * An element qualifies when its lower-cased tag contains `-`, the tag is
 * registered in `customElements`, and neither `el.shadowRoot` nor the
 * piercer's `getClosedRoot(el)` yields a root. Does nothing when the piercer
 * backdoor is missing. Individual replacement failures are ignored; any
 * other error is logged via `console.info`.
 */
export function rerenderMissingShadowHosts(): void {
  try {
    const piercer = window.__stagehandV3__;
    if (!piercer || typeof piercer.getClosedRoot !== "function") return;

    const rootlessHosts: Element[] = [];
    const walker = document.createTreeWalker(document, NodeFilter.SHOW_ELEMENT);

    while (walker.nextNode()) {
      const candidate = walker.currentNode as Element;
      const tagName = candidate.tagName?.toLowerCase() ?? "";

      // Only hyphenated tags that are actually registered are custom elements.
      const isRegisteredCustomElement =
        tagName.includes("-") &&
        typeof customElements?.get === "function" &&
        Boolean(customElements.get(tagName));
      if (!isRegisteredCustomElement) continue;

      const openRootPresent = !!candidate.shadowRoot;
      const trackedRootPresent = !!piercer.getClosedRoot(candidate);
      if (!openRootPresent && !trackedRootPresent) {
        rootlessHosts.push(candidate);
      }
    }

    rootlessHosts.forEach((host) => {
      try {
        host.replaceWith(host.cloneNode(true));
      } catch {
        // ignore individual failures
      }
    });

    if (piercer.stats && rootlessHosts.length) {
      console.info("[v3-piercer] rerender", { count: rootlessHosts.length });
    }
  } catch (err) {
    console.info("[v3-piercer] rerender error", { message: String(err ?? "") });
  }
}


================================================
FILE: packages/core/lib/v3/dom/screenshotScripts/index.ts
================================================
export { resolveMaskRect } from "./resolveMaskRect.js";


================================================
FILE: packages/core/lib/v3/dom/screenshotScripts/resolveMaskRect.ts
================================================
/** Rectangle produced by `resolveMaskRect` for an element that should be masked. */
export type MaskRect = {
  /** Left offset, in page coordinates or relative to the top-layer root when `rootToken` refers to one. */
  x: number;
  /** Top offset, using the same reference frame as `x`. */
  y: number;
  /** Width of the element's bounding client rect. */
  width: number;
  /** Height of the element's bounding client rect. */
  height: number;
  /** Value of the `data-stagehand-mask-root` attribute on the containing top-layer root, or `null`. */
  rootToken?: string | null;
};

/**
 * Computes the rectangle to mask for the element bound as `this`.
 *
 * Returns `null` when there is no element, it cannot be measured, it is
 * hidden (`visibility: hidden` or `display: none`), or it has no area.
 *
 * If the element sits inside an open `<dialog>` or an open popover, the
 * rectangle is expressed relative to that root (accounting for its client
 * border offsets and scroll position). When `maskToken` is given, the root is
 * tagged with a `data-stagehand-mask-root` attribute whose value is returned
 * as `rootToken`; an existing value starting with `maskToken` is reused.
 * Otherwise the rectangle is in page coordinates (viewport position plus
 * window scroll) and `rootToken` is `null`.
 *
 * @param maskToken - Optional prefix used to tag the top-layer root.
 */
export function resolveMaskRect(
  this: Element | null,
  maskToken?: string,
): MaskRect | null {
  // `closest` / `matches` can throw on selectors the browser does not
  // support (e.g. `:popover-open`), so both lookups are guarded.
  const closestOrNull = (
    el: Element | null,
    selector: string,
  ): Element | null => {
    try {
      if (el && typeof el.closest === "function") return el.closest(selector);
      return null;
    } catch {
      return null;
    }
  };

  const matchesSafely = (el: Element | null, selector: string): boolean => {
    try {
      return !!el && typeof el.matches === "function" && el.matches(selector);
    } catch {
      return false;
    }
  };

  const topLayerRootOf = (el: Element | null): Element | null => {
    const openDialog = closestOrNull(el, "dialog[open]");
    if (openDialog) return openDialog;
    const popoverHost = closestOrNull(el, "[popover]");
    const popoverIsOpen =
      !!popoverHost && matchesSafely(popoverHost, ":popover-open");
    return popoverIsOpen ? popoverHost : null;
  };

  if (!this || typeof this.getBoundingClientRect !== "function") return null;

  const rect = this.getBoundingClientRect();
  if (!rect) return null;

  const style = window.getComputedStyle(this);
  if (!style) return null;

  const isHidden = style.visibility === "hidden" || style.display === "none";
  if (isHidden) return null;
  if (rect.width <= 0 || rect.height <= 0) return null;

  const root = topLayerRootOf(this);

  if (!root) {
    return {
      x: rect.left + window.scrollX,
      y: rect.top + window.scrollY,
      width: rect.width,
      height: rect.height,
      rootToken: null,
    };
  }

  const rootRect = root.getBoundingClientRect();
  if (!rootRect) return null;

  let rootToken: string | null = null;
  if (maskToken) {
    try {
      const current = root.getAttribute("data-stagehand-mask-root");
      if (current && current.startsWith(maskToken)) {
        rootToken = current;
      } else {
        const suffix = Math.random().toString(36).slice(2);
        rootToken = `${maskToken}_root_${suffix}`;
        root.setAttribute("data-stagehand-mask-root", rootToken);
      }
    } catch {
      rootToken = null;
    }
  }

  const x =
    rect.left - rootRect.left - (root.clientLeft || 0) + (root.scrollLeft || 0);
  const y =
    rect.top - rootRect.top - (root.clientTop || 0) + (root.scrollTop || 0);

  return { x, y, width: rect.width, height: rect.height, rootToken };
}


================================================
FILE: packages/core/lib/v3/external_clients/aisdk.ts
================================================
import {
  CoreAssistantMessage,
  ModelMessage,
  CoreSystemMessage,
  Tool,
  CoreUserMessage,
  generateObject,
  generateText,
  ImagePart,
  TextPart,
} from "ai";
import type { LanguageModelV2 } from "@ai-sdk/provider";
import { CreateChatCompletionOptions, LLMClient } from "../llm/LLMClient.js";
import { AvailableModel } from "../types/public/index.js";
import { ChatCompletion } from "openai/resources";

/**
 * `LLMClient` implementation backed by a Vercel AI SDK language model.
 *
 * Stagehand chat messages are converted to AI SDK `ModelMessage`s and sent
 * through `generateObject` (when a response schema is requested) or
 * `generateText` (otherwise).
 */
export class AISdkClient extends LLMClient {
  public type = "aisdk" as const;
  private model: LanguageModelV2;

  /**
   * @param model - AI SDK language model; its `modelId` is reported as the
   * client's model name.
   */
  constructor({ model }: { model: LanguageModelV2 }) {
    super(model.modelId as AvailableModel);
    this.model = model;
  }

  /**
   * Sends the conversation to the model and returns `{ data, usage }`.
   *
   * `data` is the parsed object when `options.response_model` is set and the
   * generated text otherwise. Token counts missing from the SDK response are
   * reported as 0.
   */
  async createChatCompletion<T = ChatCompletion>({
    options,
  }: CreateChatCompletionOptions): Promise<T> {
    const formattedMessages: ModelMessage[] = options.messages.map(
      (message) => {
        if (Array.isArray(message.content)) {
          if (message.role === "system") {
            // System messages carry plain text only: join the text parts and
            // drop anything else.
            const systemMessage: CoreSystemMessage = {
              role: "system",
              content: message.content
                .map((c) => ("text" in c ? c.text : ""))
                .join("\n"),
            };
            return systemMessage;
          }

          const contentParts = message.content.map((content) => {
            if ("image_url" in content) {
              const imageContent: ImagePart = {
                type: "image",
                image: content.image_url.url,
              };
              return imageContent;
            } else {
              const textContent: TextPart = {
                type: "text",
                text: content.text,
              };
              return textContent;
            }
          });

          if (message.role === "user") {
            const userMessage: CoreUserMessage = {
              role: "user",
              content: contentParts,
            };
            return userMessage;
          } else {
            // Assistant messages are sent as text only; images are replaced
            // by a placeholder.
            const textOnlyParts = contentParts.map((part) => ({
              type: "text" as const,
              text: part.type === "image" ? "[Image]" : part.text,
            }));
            const assistantMessage: CoreAssistantMessage = {
              role: "assistant",
              content: textOnlyParts,
            };
            return assistantMessage;
          }
        }

        return {
          role: message.role,
          content: message.content,
        };
      },
    );

    if (options.response_model) {
      const response = await generateObject({
        model: this.model,
        messages: formattedMessages,
        schema: options.response_model.schema,
      });

      return {
        data: response.object,
        usage: {
          prompt_tokens: response.usage.inputTokens ?? 0,
          completion_tokens: response.usage.outputTokens ?? 0,
          reasoning_tokens: response.usage.reasoningTokens ?? 0,
          cached_input_tokens: response.usage.cachedInputTokens ?? 0,
          total_tokens: response.usage.totalTokens ?? 0,
        },
      } as T;
    }

    const tools: Record<string, Tool> = {};

    // Callers may omit `tools`; treat that as "no tools" rather than
    // iterating `undefined`.
    for (const rawTool of options.tools ?? []) {
      tools[rawTool.name] = {
        description: rawTool.description,
        inputSchema: rawTool.parameters,
      } as Tool;
    }

    const response = await generateText({
      model: this.model,
      messages: formattedMessages,
      tools,
    });

    return {
      data: response.text,
      usage: {
        prompt_tokens: response.usage.inputTokens ?? 0,
        completion_tokens: response.usage.outputTokens ?? 0,
        reasoning_tokens: response.usage.reasoningTokens ?? 0,
        cached_input_tokens: response.usage.cachedInputTokens ?? 0,
        total_tokens: response.usage.totalTokens ?? 0,
      },
    } as T;
  }
}


================================================
FILE: packages/core/lib/v3/external_clients/customOpenAI.ts
================================================
/**
 * Welcome to the Stagehand custom OpenAI client!
 *
 * This is a client for models that are compatible with the OpenAI API, like Ollama, Gemini, etc.
 * You can just pass in an OpenAI instance to the client and it will work.
 */

import type { AvailableModel } from "../types/public/model.js";
import { CreateChatCompletionOptions, LLMClient } from "../llm/LLMClient.js";
import OpenAI from "openai";
import type {
  ChatCompletion,
  ChatCompletionAssistantMessageParam,
  ChatCompletionContentPartImage,
  ChatCompletionContentPartText,
  ChatCompletionCreateParamsNonStreaming,
  ChatCompletionMessageParam,
  ChatCompletionSystemMessageParam,
  ChatCompletionUserMessageParam,
} from "openai/resources/chat/completions";
import { toJsonSchema } from "../zodCompat.js";
import { validateZodSchema } from "../../utils.js";
import {
  CreateChatCompletionResponseError,
  ZodSchemaValidationError,
} from "../types/public/sdkErrors.js";

/**
 * `LLMClient` implementation that sends requests through a caller-supplied
 * OpenAI SDK instance, for any endpoint compatible with the OpenAI chat
 * completions API.
 */
export class CustomOpenAIClient extends LLMClient {
  public type = "openai" as const;
  private client: OpenAI;

  /**
   * @param modelName - Model identifier sent with every request.
   * @param client - OpenAI SDK instance used to issue requests.
   */
  constructor({ modelName, client }: { modelName: string; client: OpenAI }) {
    super(modelName as AvailableModel);
    this.client = client;
    this.modelName = modelName as AvailableModel;
  }

  /**
   * Issues one non-streaming chat completion and returns `{ data, usage }`.
   *
   * When `options.response_model` is set, JSON output is requested, the
   * schema is appended as a final user message, and the reply is parsed and
   * validated. A reply that fails parsing or validation is retried up to
   * `retries` times before a `CreateChatCompletionResponseError` is thrown.
   * Without a response model, `data` is the raw message content.
   */
  async createChatCompletion<T = ChatCompletion>({
    options,
    retries = 3,
    logger,
  }: CreateChatCompletionOptions): Promise<T> {
    const { image, requestId, ...loggableOptions } = options;

    // TODO: Implement vision support
    if (image) {
      console.warn(
        "Image provided. Vision is not currently supported for openai",
      );
    }

    logger({
      category: "openai",
      message: "creating chat completion",
      level: 1,
      auxiliary: {
        options: {
          value: JSON.stringify({ ...loggableOptions, requestId }),
          type: "object",
        },
        modelName: {
          value: this.modelName,
          type: "string",
        },
      },
    });

    /* eslint-disable */
    // `response_model` is split off only so it is not forwarded to the API.
    const { response_model, ...openaiOptions } = {
      ...loggableOptions,
      model: this.modelName,
    };

    logger({
      category: "openai",
      message: "creating chat completion",
      level: 1,
      auxiliary: {
        openaiOptions: {
          value: JSON.stringify(openaiOptions),
          type: "object",
        },
      },
    });

    const isTextPart = (
      part: ChatCompletionContentPartImage | ChatCompletionContentPartText,
    ): part is ChatCompletionContentPartText => part.type === "text";

    const formattedMessages: ChatCompletionMessageParam[] =
      options.messages.map((message) => {
        // Plain-string content needs no per-part conversion.
        if (!Array.isArray(message.content)) {
          return {
            ...message,
            content: message.content,
          } as ChatCompletionMessageParam;
        }

        const parts = message.content.map((part) => {
          if ("image_url" in part) {
            const imagePart: ChatCompletionContentPartImage = {
              image_url: {
                url: part.image_url.url,
              },
              type: "image_url",
            };
            return imagePart;
          }
          const textPart: ChatCompletionContentPartText = {
            text: part.text,
            type: "text",
          };
          return textPart;
        });

        switch (message.role) {
          case "system": {
            const systemMessage: ChatCompletionSystemMessageParam = {
              ...message,
              role: "system",
              content: parts.filter(isTextPart),
            };
            return systemMessage;
          }
          case "user": {
            const userMessage: ChatCompletionUserMessageParam = {
              ...message,
              role: "user",
              content: parts,
            };
            return userMessage;
          }
          default: {
            // Every other role is sent as an assistant message with text
            // parts only.
            const assistantMessage: ChatCompletionAssistantMessageParam = {
              ...message,
              role: "assistant",
              content: parts.filter(isTextPart),
            };
            return assistantMessage;
          }
        }
      });

    if (options.response_model) {
      const schemaJson = JSON.stringify(
        toJsonSchema(options.response_model.schema),
        null,
        2,
      );
      formattedMessages.push({
        role: "user",
        content: `Respond with valid JSON matching this schema:\n${schemaJson}\n\nDo not include any other text, formatting or markdown in your output. Do not include \`\`\` or \`\`\`json in your response. Only the JSON object itself.`,
      });
    }

    const responseFormat:
      | ChatCompletionCreateParamsNonStreaming["response_format"]
      | undefined = options.response_model
      ? { type: "json_object" }
      : undefined;

    const body: ChatCompletionCreateParamsNonStreaming = {
      ...openaiOptions,
      model: this.modelName,
      messages: formattedMessages,
      response_format: responseFormat,
      stream: false,
      tools: options.tools?.map((tool) => ({
        function: {
          name: tool.name,
          description: tool.description,
          parameters: tool.parameters,
        },
        type: "function",
      })),
    };

    const response = await this.client.chat.completions.create(body);

    logger({
      category: "openai",
      message: "response",
      level: 1,
      auxiliary: {
        response: {
          value: JSON.stringify(response),
          type: "object",
        },
        requestId: {
          value: requestId,
          type: "string",
        },
      },
    });

    // Built lazily at each return site; missing counters are reported as 0.
    const usageSummary = () => ({
      prompt_tokens: response.usage?.prompt_tokens ?? 0,
      completion_tokens: response.usage?.completion_tokens ?? 0,
      total_tokens: response.usage?.total_tokens ?? 0,
    });

    if (!options.response_model) {
      return {
        data: response.choices[0].message.content,
        usage: usageSummary(),
      } as T;
    }

    const rawContent = response.choices[0].message.content;
    if (!rawContent) {
      throw new CreateChatCompletionResponseError("No content in response");
    }

    let parsedData: unknown;
    try {
      parsedData = JSON.parse(rawContent);
      validateZodSchema(options.response_model.schema, parsedData);
    } catch (e) {
      const isParseError = e instanceof SyntaxError;
      logger({
        category: "openai",
        message: isParseError
          ? "Response is not valid JSON"
          : "Response failed Zod schema validation",
        level: 0,
      });

      // Retry the whole request while attempts remain.
      if (retries > 0) {
        return this.createChatCompletion({
          options,
          logger,
          retries: retries - 1,
        });
      }

      if (e instanceof ZodSchemaValidationError) {
        logger({
          category: "openai",
          message: `Error during chat completion: ${e.message}`,
          level: 0,
          auxiliary: {
            errorDetails: {
              value: `Message: ${e.message}${e.stack ? "\nStack: " + e.stack : ""}`,
              type: "string",
            },
            requestId: { value: requestId, type: "string" },
          },
        });
        throw new CreateChatCompletionResponseError(e.message);
      }

      let failureMessage: string;
      if (isParseError) {
        failureMessage = "Failed to parse model response as JSON";
      } else if (e instanceof Error) {
        failureMessage = e.message;
      } else {
        failureMessage = "Unknown error during response processing";
      }
      throw new CreateChatCompletionResponseError(failureMessage);
    }

    return {
      data: parsedData,
      usage: usageSummary(),
    } as T;
  }
}


================================================
FILE: packages/core/lib/v3/flowlogger/EventEmitter.ts
================================================
import { EventEmitter } from "node:events";

/** Listener signature used for `"*"` subscriptions. */
type WildcardEventListener = (...args: unknown[]) => void;

/**
 * `EventEmitter` that treats the event name `"*"` as a wildcard: listeners
 * registered for it through `on` are called on every `emit`, after the
 * listeners for the specific event, with the same arguments.
 */
export class EventEmitterWithWildcardSupport extends EventEmitter {
  private readonly wildcardListeners = new Set<WildcardEventListener>();

  /** Registers `listener`; `"*"` subscribes it to every event. */
  override on(
    eventName: string | symbol,
    listener: (...args: unknown[]) => void,
  ): this {
    if (eventName !== "*") {
      return super.on(eventName, listener);
    }
    this.wildcardListeners.add(listener);
    return this;
  }

  /** Removes `listener`; `"*"` removes it from the wildcard set. */
  override off(
    eventName: string | symbol,
    listener: (...args: unknown[]) => void,
  ): this {
    if (eventName !== "*") {
      return super.off(eventName, listener);
    }
    this.wildcardListeners.delete(listener);
    return this;
  }

  /**
   * Emits to the event's own listeners, then to all wildcard listeners.
   *
   * @returns True when either kind of listener exists.
   */
  override emit(eventName: string | symbol, ...args: unknown[]): boolean {
    const hadNamedListener = super.emit(eventName, ...args);

    this.wildcardListeners.forEach((notify) => {
      notify(...args);
    });

    return hadNamedListener || this.wildcardListeners.size > 0;
  }
}


================================================
FILE: packages/core/lib/v3/flowlogger/EventSink.ts
================================================
import fs from "node:fs";
import path from "node:path";
import { FlowEvent } from "./FlowLogger.js";
import type { EventStoreApi, EventStoreQuery } from "./EventStore.js";
import {
  prettifyColorStderrLine,
  prettifyEvent,
  prettifyIsCdpEvent,
  prettifySanitizeEvent,
} from "./prettify.js";

// =============================================================================
// Event Sink Contracts
// =============================================================================

/** Contract implemented by every destination that flow events can be sent to. */
export interface EventSink {
  /** Delivers one event to the sink. */
  emit(event: FlowEvent): Promise<void>;
  /** Returns the events selected by `query`. */
  query(query: EventStoreQuery): Promise<FlowEvent[]>;
  /** Tears the sink down. */
  destroy(): Promise<void>;
}

// Decides whether `event` satisfies every filter present on `query`. `sessionId` must match exactly; `eventId` matches the event itself or any event listing it in `eventParentIds`; `eventType` is matched against the whole type string, with `*` standing for any run of characters.
function matchesEventStoreQuery(
  event: FlowEvent,
  query: EventStoreQuery,
): boolean {
  const { sessionId, eventId, eventType } = query;

  if (sessionId && event.sessionId !== sessionId) return false;

  if (eventId) {
    const isSameEvent = event.eventId === eventId;
    if (!isSameEvent && !event.eventParentIds.includes(eventId)) {
      return false;
    }
  }

  if (eventType) {
    // Escape every regex metacharacter, then turn the escaped `*` back into a wildcard.
    const escaped = eventType.replace(/[.*+?^${}()|[\]\\]/g, "\\$&");
    const wildcarded = escaped.replace(/\\\*/g, ".*");
    const pattern = new RegExp(`^${wildcarded}$`);
    return pattern.test(event.eventType);
  }

  return true;
}

// =============================================================================
// File Sink Helpers
// =============================================================================

// Type guard for file sinks: narrows to a usable `fs.WriteStream` only when a stream exists, has not been destroyed, and still reports itself as writable.
function isWritable(stream: fs.WriteStream | null): stream is fs.WriteStream {
  if (!stream) {
    return false;
  }
  if (stream.destroyed) {
    return false;
  }
  return !!stream.writable;
}

// Appends `value` to `stream` and adapts the callback-style write to a promise:
// resolves when the write callback fires without an error, rejects when the
// callback reports an error or when `write()` itself throws.
function writeToStream(stream: fs.WriteStream, value: string): Promise<void> {
  return new Promise<void>((resolve, reject) => {
    const onWritten = (error?: Error | null): void => {
      if (error) {
        reject(error);
      } else {
        resolve();
      }
    };

    try {
      stream.write(value, onWritten);
    } catch (thrown) {
      reject(thrown);
    }
  });
}

// =============================================================================
// Event Sink Implementations
// =============================================================================

// Base class for sinks that append serialized events to a single file inside the session directory.
// Subclasses choose the on-disk line format by implementing `serialize()`.
// Everything here is best-effort: no failure (directory setup, file open, write) may surface to the caller.
abstract class FileEventSink implements EventSink {
  private readonly streamPromise: Promise<fs.WriteStream | null>; // Resolves to the one file stream owned by this sink, or null when no session directory is available. Never rejects.

  // Creates a best-effort file sink bound to a single session directory.
  // `sessionDirPromise` resolving to null (or rejecting) disables the sink.
  constructor(sessionDirPromise: Promise<string | null>, fileName: string) {
    this.streamPromise = sessionDirPromise
      .then((sessionDir) => {
        if (!sessionDir) {
          return null;
        }

        const stream = fs.createWriteStream(path.join(sessionDir, fileName), {
          flags: "a",
        });
        // A stream 'error' event with no listener is rethrown as an uncaught
        // exception. Swallow it here; `isWritable()` will report the stream as
        // unusable once it has been destroyed.
        stream.on("error", () => {
          // best effort only
        });
        return stream;
      })
      // If session directory setup failed, degrade to "no stream" instead of
      // leaving a rejected promise that nobody may be awaiting yet.
      .catch((): null => null);
  }

  // Converts an event into the exact text appended to the file; a null/empty result skips the event.
  protected abstract serialize(event: FlowEvent): Promise<string | null>;

  // Serializes and appends a single event. File sinks are intentionally best-effort and never allowed to affect library execution flow.
  async emit(event: FlowEvent): Promise<void> {
    try {
      const stream = await this.streamPromise;
      if (!isWritable(stream)) {
        return;
      }

      const serialized = await this.serialize(event);
      if (!serialized) {
        return;
      }

      await writeToStream(stream, serialized);
    } catch {
      // best effort only
    }
  }

  // File sinks are write-only and do not support query reads.
  async query(): Promise<FlowEvent[]> {
    return [];
  }

  // Closes the underlying file stream when the owning store shuts down.
  async destroy(): Promise<void> {
    const stream = await this.streamPromise;
    if (!isWritable(stream)) {
      return;
    }

    await new Promise<void>((resolve) => {
      stream.end(resolve);
    });
  }
}

// File sink that stores every event verbatim, one JSON document per line, in `session_events.jsonl`.
export class JsonlFileEventSink extends FileEventSink {
  // Binds the sink to `session_events.jsonl` inside the (eventually resolved) session directory.
  constructor(sessionDirPromise: Promise<string | null>) {
    super(sessionDirPromise, "session_events.jsonl");
  }

  // Produces one newline-terminated JSON line containing the complete event.
  protected async serialize(event: FlowEvent): Promise<string> {
    const json = JSON.stringify(event);
    return json + "\n";
  }
}

// File sink that writes one human-readable line per event to `session_events.log`.
export class PrettyLogFileEventSink extends FileEventSink {
  constructor(
    sessionDirPromise: Promise<string | null>,
    private readonly store: Pick<EventStoreApi, "query">, // Handed to `prettifyEvent` so it can query related events while rendering.
  ) {
    super(sessionDirPromise, "session_events.log");
  }

  // Sanitizes the event, renders it as a pretty line, and newline-terminates it.
  // Resolves to null when the prettifier produced nothing, which makes the base class skip the write.
  protected async serialize(event: FlowEvent): Promise<string | null> {
    const sanitized = prettifySanitizeEvent(event);
    const prettyLine = await prettifyEvent(this.store, sanitized);
    if (!prettyLine) {
      return null;
    }
    return `${prettyLine}\n`;
  }
}

// Sink that prints pretty, colorized lines to stderr for local debugging.
// Events recognised by `prettifyIsCdpEvent` are skipped so stderr stays high-signal.
export class PrettyStderrEventSink implements EventSink {
  constructor(private readonly store: Pick<EventStoreApi, "query">) {} // Handed to `prettifyEvent` so it can query related events while rendering.

  // Renders and prints one event. Any failure along the way is swallowed: this sink is best-effort only.
  async emit(event: FlowEvent): Promise<void> {
    // Promise adapter around the callback form of `process.stderr.write`.
    // A synchronous throw inside the executor rejects the promise as well.
    const writeToStderr = (text: string): Promise<void> =>
      new Promise<void>((resolve, reject) => {
        process.stderr.write(text, (error?: Error | null) => {
          if (error) {
            reject(error);
          } else {
            resolve();
          }
        });
      });

    try {
      if (prettifyIsCdpEvent(event)) {
        return;
      }

      const sanitized = prettifySanitizeEvent(event);
      const line = await prettifyEvent(this.store, sanitized);
      if (line) {
        await writeToStderr(`${prettifyColorStderrLine(line)}\n`);
      }
    } catch {
      // best effort only
    }
  }

  // Write-only sink: there is nothing to read back.
  async query(): Promise<FlowEvent[]> {
    return [];
  }

  // stderr is not owned by this sink, so there is nothing to tear down.
  async destroy(): Promise<void> {}
}

// Queryable sink that keeps events in an array, optionally capped at `limit` entries (oldest dropped first).
export class InMemoryEventSink implements EventSink {
  // `limit` defaults to Infinity, i.e. nothing is ever trimmed.
  constructor(protected readonly limit = Infinity) {}

  protected readonly events: FlowEvent[] = []; // Retained history in arrival order; appended by `emit()`, emptied by `destroy()`.

  // Hook that lets subclasses replace the event object that is actually retained. The base class keeps it as-is.
  protected storeEvent(event: FlowEvent): FlowEvent {
    return event;
  }

  // Appends the event, then drops as many of the oldest entries as needed to get back under `limit`.
  async emit(event: FlowEvent): Promise<void> {
    const retained = this.storeEvent(event);
    this.events.push(retained);

    const overflow = this.events.length - this.limit;
    if (overflow > 0) {
      this.events.splice(0, overflow);
    }
  }

  // Returns the retained events matching `query`, sorted by `eventCreatedAt` and then `eventId`.
  // A truthy `query.limit` keeps only the last `limit` entries of that ordering.
  async query(query: EventStoreQuery): Promise<FlowEvent[]> {
    const matches = this.events
      .filter((candidate) => matchesEventStoreQuery(candidate, query))
      .sort(
        (a, b) =>
          a.eventCreatedAt.localeCompare(b.eventCreatedAt) ||
          a.eventId.localeCompare(b.eventId),
      );

    if (!query.limit) {
      return matches;
    }
    return matches.slice(-query.limit);
  }

  // Drops all retained history when the owning store shuts down.
  async destroy(): Promise<void> {
    this.events.length = 0;
  }
}

// In-memory sink variant that retains identity and ancestry fields only.
// The payload is replaced with an empty object so long-running or verbose sessions do not keep large data (e.g. screenshots) alive.
export class ShallowInMemoryEventSink extends InMemoryEventSink {
  // Builds the stripped copy that is retained instead of the original event.
  protected override storeEvent(event: FlowEvent): FlowEvent {
    const { eventType, eventId, eventCreatedAt, sessionId, eventParentIds } =
      event;

    return new FlowEvent({
      eventType,
      eventId,
      eventCreatedAt,
      sessionId,
      eventParentIds: eventParentIds.slice(), // own copy, detached from the source event's array
      data: {},
    });
  }
}


================================================
FILE: packages/core/lib/v3/flowlogger/EventStore.ts
================================================
import fs from "node:fs";
import path from "node:path";
import type { V3Options } from "../types/public/index.js";
import {
  EventSink,
  JsonlFileEventSink,
  PrettyLogFileEventSink,
  PrettyStderrEventSink,
  ShallowInMemoryEventSink,
} from "./EventSink.js";
import { FlowEvent } from "./FlowLogger.js";

// Number of events the default shallow query sink retains per store before it starts dropping the oldest ones.
const DEFAULT_IN_MEMORY_EVENT_LIMIT = 500;
// Base directory for session metadata + file-backed flow logs. Read once at module load; an empty string means file sinks are disabled.
const CONFIG_DIR = process.env.BROWSERBASE_CONFIG_DIR || "";
// True only when BROWSERBASE_FLOW_LOGS is exactly "1"; the EventStore constructor then attaches the pretty stderr sink.
// NOTE(review): the original note says this force-enables the sink even when `verbose !== 2`; the verbose handling is not visible in this file, so confirm at the caller.
const FLOW_LOGS_ENABLED = process.env.BROWSERBASE_FLOW_LOGS === "1";
// Case-insensitive substring match on option keys; any matching key has its value redacted before session options are written to disk.
const SENSITIVE_KEYS =
  /key|secret|token|api-key|apikey|api_key|password|passwd|pwd|credential|auth/i;

// =============================================================================
// Public Contracts
// =============================================================================

// Filter accepted by `query()`. Every field is optional; unset fields do not restrict the result.
export interface EventStoreQuery {
  // Exact session id to match.
  sessionId?: string;
  // Matches the event with this id and every event listing it among its `eventParentIds`.
  eventId?: string;
  // Event type to match; `*` acts as a wildcard for any run of characters.
  eventType?: string;
  // When set (and non-zero), queryable sinks return only the last `limit` events of the sorted result.
  limit?: number;
}

// Surface of the per-session event store that sinks and callers depend on.
export interface EventStoreApi {
  // Session this store belongs to.
  readonly sessionId: string;
  // Forwards an event to the store's sinks.
  emit(event: FlowEvent): Promise<void>;
  // Looks up retained events matching `query`.
  query(query: EventStoreQuery): Promise<FlowEvent[]>;
  // Tears the store and its sinks down.
  destroy(): Promise<void>;
}

// =============================================================================
// Filesystem Helpers
// =============================================================================

// Returns a deep copy of `options` in which the value of every key matching SENSITIVE_KEYS is replaced by "******".
// Arrays are walked element by element, nested objects key by key; primitives and null pass through untouched.
// Used before session options are written to `session.json` inside a config-dir-backed session directory.
function sanitizeOptions(options: V3Options): Record<string, unknown> {
  const redact = (input: unknown): unknown => {
    if (input === null || typeof input !== "object") {
      return input;
    }
    if (Array.isArray(input)) {
      return input.map(redact);
    }

    return Object.entries(input).reduce<Record<string, unknown>>(
      (redacted, [key, entry]) => {
        redacted[key] = SENSITIVE_KEYS.test(key) ? "******" : redact(entry);
        return redacted;
      },
      {},
    );
  };

  return redact({ ...options }) as Record<string, unknown>;
}

// Returns the absolute path of the configured Browserbase config directory, or "" when none is configured.
export function getConfigDir(): string {
  if (!CONFIG_DIR) {
    return "";
  }
  return path.resolve(CONFIG_DIR);
}

// Creates `<configDir>/sessions/<sessionId>` for the file sinks and writes best-effort metadata next to it:
// the sanitized `session.json` and a `latest` symlink pointing at this session.
// Resolves to the session directory path, or to null when no config directory is configured or the
// directory cannot be created. Never rejects: flow-log files are optional and must not disturb the caller.
async function createSessionDir(
  sessionId: string,
  options?: V3Options,
): Promise<string | null> {
  const configDir = getConfigDir();
  if (!configDir) {
    return null;
  }

  const sessionsRoot = path.join(configDir, "sessions");
  const sessionDir = path.join(sessionsRoot, sessionId);
  try {
    await fs.promises.mkdir(sessionDir, { recursive: true });
  } catch {
    // Without the directory no file sink can work; report "no directory"
    // rather than rejecting a promise the sinks may not be awaiting yet.
    return null;
  }

  if (options) {
    try {
      await fs.promises.writeFile(
        path.join(sessionDir, "session.json"),
        JSON.stringify(sanitizeOptions(options), null, 2),
        "utf-8",
      );
    } catch {
      // session.json is metadata only; a serialization or write failure must
      // not disable the event log files that share this directory.
    }
  }

  const latestLink = path.join(sessionsRoot, "latest");
  try {
    await fs.promises.unlink(latestLink);
  } catch {
    // ignore missing link
  }
  try {
    // Relative target so the link keeps working if the config directory is moved.
    await fs.promises.symlink(sessionId, latestLink, "dir");
  } catch {
    // symlink best effort only
  }

  return sessionDir;
}

// =============================================================================
// Event Store
// =============================================================================

// Per-session manager for flow event sinks.
// It is deliberately not an event bus: V3 forwards FlowEvents that were already
// emitted elsewhere, and the store (1) fans each one out to its sinks,
// (2) answers `query()` from the single query sink chosen at construction, and
// (3) tears all sinks down when the session closes.
// Sinks are owned here rather than subscribed directly with
// `v3.bus.on("*", sink.emit)` because the pretty sinks need a shared query
// interface while rendering: a readable line often depends on looking up
// related parent/child events. Handing sinks to each other to share that state
// gets messy, so the store contains the circular dependency: every sink lives
// here, and a sink that needs history calls the one `EventStore.query()`
// entrypoint backed by this session's query sink.
export class EventStore implements EventStoreApi {
  private readonly sinks = new Set<EventSink>(); // Fanout targets; filled by the constructor, emptied by `destroy()`.
  private destroyed = false; // Set by `destroy()`; afterwards `emit()` and repeated `destroy()` calls do nothing.
  public query: (query: EventStoreQuery) => Promise<FlowEvent[]>; // Reads from the query sink captured at construction time.

  // Builds the store for exactly one session; events and queries for other session ids are ignored.
  constructor(
    // The store's own Stagehand session identifier. It usually equals `browserbaseSessionId` today, but the two may diverge.
    public readonly sessionId: string,
    options?: V3Options,
    querySink: EventSink = new ShallowInMemoryEventSink(
      DEFAULT_IN_MEMORY_EVENT_LIMIT,
    ),
  ) {
    const sessionDirPromise = createSessionDir(sessionId, options);

    // The query sink is registered first so it is first in the fanout order.
    this.registerSink(querySink);
    this.query = async (query) => {
      const targetsOtherSession =
        Boolean(query.sessionId) && query.sessionId !== this.sessionId;
      if (targetsOtherSession) {
        return [];
      }

      // Always pin the lookup to this store's session.
      const scopedQuery = { ...query, sessionId: this.sessionId };
      return querySink.query(scopedQuery);
    };

    // File-backed sinks only exist when a config directory is configured.
    if (getConfigDir()) {
      const jsonlSink = new JsonlFileEventSink(sessionDirPromise);
      this.registerSink(jsonlSink);
      const prettyLogSink = new PrettyLogFileEventSink(sessionDirPromise, this);
      this.registerSink(prettyLogSink);
    }

    if (FLOW_LOGS_ENABLED) {
      this.registerSink(new PrettyStderrEventSink(this));
    }
  }

  // Adds a sink to the set `emit()` fans out to.
  private registerSink(sink: EventSink): void {
    this.sinks.add(sink);
  }

  // Delivers an event to every sink. Silently ignores anything that is not a FlowEvent,
  // events for another session, and everything that arrives after `destroy()`.
  // A failing sink does not prevent delivery to the others.
  emit = async (event: FlowEvent): Promise<void> => {
    const accepted =
      event instanceof FlowEvent &&
      !this.destroyed &&
      event.sessionId === this.sessionId;
    if (!accepted) {
      return;
    }

    const deliveries = Array.from(this.sinks, (sink) => sink.emit(event));
    await Promise.allSettled(deliveries);
  };

  // Destroys every sink (ignoring individual failures) and forgets them. Safe to call more than once.
  async destroy(): Promise<void> {
    if (this.destroyed) {
      return;
    }
    this.destroyed = true;

    const teardowns = Array.from(this.sinks, (sink) => sink.destroy());
    // best effort cleanup: rejections are collected, never rethrown
    await Promise.allSettled(teardowns);
    this.sinks.clear();
  }
}


================================================
FILE: packages/core/lib/v3/flowlogger/FlowLogger.ts
================================================
import { AsyncLocalStorage } from "node:async_hooks";
import { v7 as uuidv7 } from "uuid";
import type { LanguageModelMiddleware } from "ai";
import { z } from "zod";
import { EventEmitterWithWildcardSupport } from "./EventEmitter.js";

// =============================================================================
// Flow Event Model
// =============================================================================

// Payload schema: an object with string keys and values of any type.
export const FlowEventDataSchema = z.record(z.string(), z.unknown());
// Schema of the input accepted when creating an event. Only `eventType` is required by the schema;
// the `FlowEvent` constructor fills defaults for the other fields and additionally requires `sessionId`.
export const FlowEventInputSchema = z.object({
  eventType: z.string(),
  eventId: z.string().optional(),
  eventParentIds: z.array(z.string()).optional(),
  eventCreatedAt: z.string().optional(),
  sessionId: z.string().optional(),
  data: FlowEventDataSchema.optional(),
});

// Static types derived from the schemas above.
export type FlowEventData = z.infer<typeof FlowEventDataSchema>;
export type FlowEventInput = z.input<typeof FlowEventInputSchema>;

// Same shape as FlowEventInput, but with every optional field made required.
// This is the shape a fully constructed FlowEvent exposes.
type FlowEventFields = Omit<
  FlowEventInput,
  "eventId" | "eventParentIds" | "eventCreatedAt" | "sessionId" | "data"
> & {
  eventId: string;
  eventParentIds: string[];
  eventCreatedAt: string;
  sessionId: string;
  data: FlowEventData;
};

// Normalized event record that flows through the event bus and every sink.
export class FlowEvent implements FlowEventFields {
  // Maps an event type to a single decimal digit derived from its leading word.
  // Example: "ModuleMethodSomethingEvent" -> leading word "Module" -> first four chars "Modu" -> "5".
  // Types that do not start with an uppercase letter fall back to their first four characters.
  private static deriveEventIdSuffix(eventType: string): string {
    const leadingWord = /^[A-Z][a-z0-9]*/.exec(eventType);
    const family = leadingWord ? leadingWord[0] : eventType.slice(0, 4);

    const digit = Array.from(family.slice(0, 4)).reduce(
      (acc, ch) => (acc * 31 + ch.charCodeAt(0)) % 10,
      0,
    );
    return String(digit); // always one of "0".."9"
  }

  // Generates a UUIDv7 and replaces its last character with the event-family digit,
  // so ids stay time-sortable while events of one family share a recognisable suffix.
  static createEventId(eventType: string): string {
    const uuid = uuidv7();
    const withoutLastChar = uuid.slice(0, -1);
    return withoutLastChar + FlowEvent.deriveEventIdSuffix(eventType);
  }

  // Fields present on every event:
  eventType: string;
  eventId: string;
  eventParentIds: string[];
  eventCreatedAt: string;
  // Generic Stagehand session identifier. It usually equals `browserbaseSessionId` today, but the two may diverge.
  sessionId: string;
  data: FlowEventData; // event payload (e.g. params, action, result, error, etc.)

  // Fills in defaults and normalizes the type name:
  // - throws when `sessionId` is missing or empty;
  // - appends "Event" to `eventType` unless it already ends with it;
  // - generates `eventId`, uses the current time for `eventCreatedAt`, and defaults
  //   `eventParentIds` / `data` to empty when they are not supplied.
  constructor(input: FlowEventInput) {
    const { sessionId, eventType } = input;
    if (!sessionId) {
      throw new Error("FlowEvent.sessionId is required.");
    }

    this.eventType = eventType.endsWith("Event")
      ? eventType
      : `${eventType}Event`;
    this.eventId = input.eventId ?? FlowEvent.createEventId(this.eventType);
    this.eventParentIds = input.eventParentIds ?? [];
    this.eventCreatedAt = input.eventCreatedAt ?? new Date().toISOString();
    this.sessionId = sessionId;
    this.data = input.data ?? {};
  }
}

// State carried along an async call-chain so emitted events know their session, bus, and parents.
export interface FlowLoggerContext {
  // Mirrors `FlowEvent.sessionId`; it is currently the Stagehand session id and often matches `browserbaseSessionId`, but callers should not rely on that.
  sessionId: string;
  eventBus: EventEmitterWithWildcardSupport; // Shared per-session bus; `emit()` writes to it and V3 forwards wildcard events into the instance-owned EventStore.
  parentEvents: FlowEvent[]; // Active parent stack for the current async chain; wrappers push/pop this as logged work starts and ends.
}

// Shape of an async function (optionally `this`-bound) that the logging wrappers can wrap.
type AsyncOriginalMethod<
  TArgs extends unknown[] = unknown[],
  TResult = unknown,
  TThis = unknown,
> = (this: TThis, ...args: TArgs) => Promise<TResult>;

// Event input plus an optional explicit context to log under.
type FlowLoggerLogOptions = FlowEventInput & {
  context?: FlowLoggerContext;
};

// AsyncLocalStorage is the authoritative source for the active flow parent stack inside a single async call-chain.
// `FlowLogger` reads it with `getStore()` and populates it with `enterWith()` / `run()`.
const loggerContext = new AsyncLocalStorage<FlowLoggerContext>();

// Estimates the size of an inline image/base64 payload for LLM prompt summaries:
// string length * 0.75 (three bytes per four base64 characters), expressed in kb with one decimal place.
function dataToKb(data: string): string {
  const approxBytes = data.length * 0.75;
  const kilobytes = approxBytes / 1024;
  return kilobytes.toFixed(1);
}

// =============================================================================
// Flow Logger Internals
// =============================================================================

// Kinds of CDP traffic that can be logged.
type CdpLogEventType = "call" | "response" | "responseError" | "message";

// Details recorded in a CDP event's `data`; only `method` is mandatory.
type CdpLogPayload = {
  method: string;
  params?: unknown;
  result?: unknown;
  error?: string;
  targetId?: string | null;
};

// Flow event type emitted for each kind of CDP traffic.
const CDP_EVENT_NAMES: Record<CdpLogEventType, string> = {
  call: "CdpCallEvent",
  response: "CdpResponseEvent",
  responseError: "CdpResponseErrorEvent",
  message: "CdpMessageEvent",
};

export class FlowLogger {
  // Produces an independent snapshot of a context before it is re-entered in a later async callback.
  // The parent stack and each parent's `eventParentIds` array are copied, so later pushes/pops on
  // either side cannot leak into the other. `sessionId` and `eventBus` are carried over as-is.
  private static cloneContext(ctx: FlowLoggerContext): FlowLoggerContext {
    const parentEvents = ctx.parentEvents.map((parent) => {
      const copy = { ...parent };
      copy.eventParentIds = [...parent.eventParentIds];
      return copy;
    });

    return { ...ctx, parentEvents };
  }

  // Picks which context to re-enter when the caller holds a stored context and ALS
  // may already contain one. Always returns a clone. Decision table:
  //   - ALS empty, or ALS belongs to another session  -> stored context
  //   - ALS parent chain starts with the stored chain -> ALS context (it is the richer view)
  //   - stored chain starts with the ALS chain        -> stored context (restores the missing parents)
  //   - the two chains diverge                        -> ALS context (reflects the work executing now)
  private static resolveReentryContext(
    context: FlowLoggerContext,
  ): FlowLoggerContext {
    const live = loggerContext.getStore() ?? null;
    if (!live || live.sessionId !== context.sessionId) {
      return FlowLogger.cloneContext(context);
    }

    const parentIdsOf = (ctx: FlowLoggerContext): string[] =>
      ctx.parentEvents.map((parent) => parent.eventId);
    // True when `chain` begins with every id of `prefix`, in order.
    const startsWith = (chain: string[], prefix: string[]): boolean =>
      prefix.every((eventId, position) => chain[position] === eventId);

    const storedIds = parentIdsOf(context);
    const liveIds = parentIdsOf(live);

    const liveCoversStored = startsWith(liveIds, storedIds);
    const storedCoversLive = startsWith(storedIds, liveIds);

    // The stored snapshot only wins when it strictly extends the live chain.
    const useStored = !liveCoversStored && storedCoversLive;
    return FlowLogger.cloneContext(useStored ? context : live);
  }

  // Lowest-level write path: builds one FlowEvent and publishes it on the bus of the active ALS context.
  // The session id always comes from the context; parent ids come from the input when given,
  // otherwise from the context's current parent stack. Throws (via `currentContext`) when no context is active.
  private static emit(event: FlowEventInput): FlowEvent | null {
    const { sessionId, parentEvents, eventBus } = FlowLogger.currentContext;

    const eventParentIds =
      event.eventParentIds ?? parentEvents.map((parent) => parent.eventId);
    const flowEvent = new FlowEvent({ ...event, eventParentIds, sessionId });

    // Published under its own type name; wildcard subscribers receive it as well.
    eventBus.emit(flowEvent.eventType, flowEvent);
    return flowEvent;
  }

  // Runs `originalMethod` surrounded by lifecycle events on the active context:
  //   1. emits the started event (`eventType`) and pushes it on the parent stack,
  //   2. on failure emits `<eventType>ErrorEvent` and rethrows the original error,
  //   3. on success emits `<eventType>CompletedEvent`.
  // Error/Completed events are parented under the started event and carry `durationMs`.
  // Returns whatever `originalMethod` resolves to.
  private static async runWithAutoStatusEventLogging<TResult>(
    options: FlowLoggerLogOptions,
    originalMethod: AsyncOriginalMethod<[], TResult>,
  ): Promise<TResult> {
    const ctx = FlowLogger.currentContext;
    const { data, eventParentIds, eventType } = options;
    // Failure is tracked with a flag instead of inspecting the thrown value:
    // JavaScript allows `throw null` / `throw 0` / `throw ""`, and a falsy value
    // would otherwise look like success and emit a Completed event after the Error event.
    let failed = false;

    // if eventParentIds is explicitly [], this is a root event, clear the parent events in context
    if (eventParentIds && eventParentIds.length === 0) {
      ctx.parentEvents = [];
    }

    const startedEvent = FlowLogger.emit({
      eventType,
      data,
      eventParentIds,
    });

    // Push after emitting so nested work sees this event as its direct parent
    // for the rest of the wrapped method's lifetime.
    ctx.parentEvents.push(startedEvent);

    // Error/Completed events hang directly under the started event.
    const lifecycleParentIds = (): string[] => [
      ...startedEvent.eventParentIds,
      startedEvent.eventId,
    ];
    const elapsedMs = (): number =>
      Date.now() - new Date(startedEvent.eventCreatedAt).getTime();

    try {
      return await originalMethod();
    } catch (error) {
      failed = true;
      // Emitted while the stack is still live, with explicit parent ids, so the
      // failure edge is explicit in the tree.
      FlowLogger.emit({
        eventType: `${eventType}ErrorEvent`,
        eventParentIds: lifecycleParentIds(),
        data: {
          error: error instanceof Error ? error.message : String(error),
          durationMs: elapsedMs(),
        },
      });
      throw error;
    } finally {
      // The top frame is popped unconditionally. The completed event is only
      // emitted when that frame was the one pushed above; if nested code has
      // mutated the stack unexpectedly we skip it rather than emit a misleading
      // lifecycle edge.
      const parentEvent = ctx.parentEvents.pop();
      if (parentEvent?.eventId === startedEvent.eventId && !failed) {
        FlowLogger.emit({
          eventType: `${eventType}CompletedEvent`,
          eventParentIds: lifecycleParentIds(),
          data: {
            durationMs: elapsedMs(),
          },
        });
      }
    }
  }

  // Emits one CDP event under a caller-supplied context. CDP transport code uses this
  // instead of `runWithLogging()` because request/response/message events are separate
  // lifecycle edges with explicit parent ids.
  // Returns null without emitting for `enable` / `*.enable` methods and for
  // "message" events whose method is listed in NOISY_CDP_EVENTS.
  private static logCdpEvent(
    context: FlowLoggerContext,
    eventType: CdpLogEventType,
    { method, params, result, error, targetId }: CdpLogPayload,
    eventParentIds?: string[],
  ): FlowEvent | null {
    const isEnableCall = method === "enable" || method.endsWith(".enable");
    const isNoisyMessage =
      eventType === "message" && FlowLogger.NOISY_CDP_EVENTS.has(method);
    if (isEnableCall || isNoisyMessage) {
      return null;
    }

    const cdpEvent: FlowEventInput = {
      eventType: CDP_EVENT_NAMES[eventType],
      eventParentIds,
      data: { method, params, result, error, targetId },
    };

    // Emit inside a cloned copy of the caller's context so the caller's stack is never touched.
    const isolatedContext = FlowLogger.cloneContext(context);
    return loggerContext.run(isolatedContext, () => FlowLogger.emit(cdpEvent));
  }

  // Best-effort emit for LLM request/response events: does nothing when no flow context
  // is active, so callers never fail just because they run outside a tracked async chain.
  private static emitLlmEvent(event: FlowEventInput): void {
    const activeContext = FlowLogger.resolveContext();
    if (activeContext) {
      loggerContext.run(activeContext, () => {
        FlowLogger.emit(event);
      });
    }
  }

  // Builds the one-line "<role>: <text> +{N tools}" summary used in LLM request events for AI SDK middleware calls.
  // The summary describes the last non-system message of the prompt:
  //   - no such message          -> "?: (no text) +{N tools}"
  //   - string content           -> the content itself
  //   - array with a tool-result -> role becomes "tool result: <toolName>()", text is the JSON or extracted output
  //   - any other array          -> text extracted by `extractLlmMessageSummary`
  //   - anything else            -> "(no text)"
  private static buildMiddlewarePromptSummary(params: {
    prompt?: unknown;
    tools?: unknown;
  }): string {
    const toolCount = Array.isArray(params.tools) ? params.tools.length : 0;
    const withToolCount = (text: unknown): string =>
      `${text} +{${toolCount} tools}`;

    const prompt = (params.prompt ?? []) as Array<{
      role?: string;
      content?: unknown;
    }>;
    const lastMsg = prompt.filter((entry) => entry.role !== "system").pop();
    if (!lastMsg) {
      return `?: ${withToolCount("(no text)")}`;
    }

    const role = lastMsg.role ?? "?";
    const { content } = lastMsg;

    if (typeof content === "string") {
      return `${role}: ${withToolCount(content)}`;
    }
    if (!Array.isArray(content)) {
      return `${role}: ${withToolCount("(no text)")}`;
    }

    const toolResult = (
      content as Array<{
        type?: string;
        toolName?: string;
        output?: { type?: string; value?: unknown };
      }>
    ).find((part) => part.type === "tool-result");

    if (!toolResult) {
      return `${role}: ${withToolCount(
        extractLlmMessageSummary({ content }) ?? "(no text)",
      )}`;
    }

    const output = toolResult.output;
    let text: unknown = "(no text)";
    if (output?.type === "json" && output.value) {
      text = JSON.stringify(output.value);
    } else if (Array.isArray(output?.value)) {
      text =
        extractLlmMessageSummary({
          content: output.value,
        }) ?? "(no text)";
    }

    return `tool result: ${toolResult.toolName}(): ${withToolCount(text)}`;
  }

  // Builds the one-line output summary used in LLM response events for AI SDK middleware calls.
  // Preference order: `result.text`, then `result.content` (a string as-is, an array rendered
  // part by part and joined with spaces), then "[N tool calls]", and finally "[empty]".
  private static buildMiddlewareOutputSummary(result: {
    text?: string;
    content?: unknown;
    toolCalls?: unknown[];
  }): string {
    // Renders one content part: its text when present, otherwise a marker for its type.
    const describePart = (part: {
      type?: string;
      text?: string;
      toolName?: string;
    }): string => {
      if (part.text) {
        return part.text;
      }
      return part.type === "tool-call"
        ? `tool call: ${part.toolName}()`
        : `[${part.type}]`;
    };

    let summary = result.text || "";
    if (!summary && result.content) {
      const { content } = result;
      if (typeof content === "string") {
        summary = content;
      } else if (Array.isArray(content)) {
        summary = (
          content as Array<{
            type?: string;
            text?: string;
            toolName?: string;
          }>
        )
          .map((part) => describePart(part))
          .join(" ");
      }
    }

    if (summary) {
      return summary;
    }
    return result.toolCalls?.length
      ? `[${result.toolCalls.length} tool calls]`
      : "[empty]";
  }

  // =============================================================================
  // Flow Logger Public Lifecycle API
  // =============================================================================

  // Starts a logging context for a session: creates a context with an empty parent stack,
  // installs it in AsyncLocalStorage for the current execution via `enterWith`, and returns it.
  // Call this at the start of a session.
  static init(
    sessionId: string,
    eventBus: EventEmitterWithWildcardSupport,
  ): FlowLoggerContext {
    const freshContext: FlowLoggerContext = {
      sessionId,
      eventBus,
      parentEvents: [],
    };
    loggerContext.enterWith(freshContext);

    return freshContext;
  }

  // Resets the parent stack of the given context (or, when none is given, of the current ALS context)
  // when a V3 instance shuts down. No event is emitted; a missing context is a no-op.
  static async close(context?: FlowLoggerContext | null): Promise<void> {
    const target = context ?? loggerContext.getStore();
    if (target) {
      target.parentEvents = [];
    }
  }

  // Strict accessor for the ALS-backed flow context: returns the live store object (not a clone)
  // and throws when called outside a tracked flow. Use `resolveContext()` for best-effort lookups.
  static get currentContext(): FlowLoggerContext {
    const active = loggerContext.getStore();
    if (active) {
      return active;
    }

    throw new Error("FlowLogger context is missing.");
  }

  // Non-throwing context lookup for callers that can continue without ALS.
  // Returns a clone of the current ALS context when one exists, otherwise a clone of
  // `fallbackContext`, otherwise null.
  static resolveContext(
    fallbackContext?: FlowLoggerContext | null,
  ): FlowLoggerContext | null {
    const source = loggerContext.getStore() ?? fallbackContext ?? null;
    return source ? FlowLogger.cloneContext(source) : null;
  }

  // Decorator-style wrapper used on class methods that should emit their own started/completed/error envelope.
  // It resolves the flow context from either the decorator options or `this.flowLoggerContext`,
  // then delegates the actual lifecycle handling to `runWithLogging()`.
  // Returns a function that takes the original method and returns a wrapper typed as that same method.
  static wrapWithLogging<TMethod extends AsyncOriginalMethod>(
    options: FlowLoggerLogOptions,
  ) {
    return function <
      TWrappedMethod extends AsyncOriginalMethod<
        Parameters<TMethod>,
        Awaited<ReturnType<TMethod>>,
        ThisParameterType<TMethod>
      >,
    >(originalMethod: TWrappedMethod): TWrappedMethod {
      // A `function` expression (not an arrow) so `this` is the instance the method is invoked on.
      const wrappedMethod = async function (
        this: ThisParameterType<TWrappedMethod>,
        ...args: Parameters<TWrappedMethod>
      ): Promise<Awaited<ReturnType<TWrappedMethod>>> {
        // An explicit context in the options wins; otherwise look for one on the receiver.
        let context = options.context;
        if (!context) {
          context = (
            this as { flowLoggerContext?: FlowLoggerContext } | null | undefined
          )?.flowLoggerContext;
        }

        // The call arguments are passed as the logged params and forwarded to the original method with the same `this`.
        return await FlowLogger.runWithLogging(
          {
            ...options,
            context,
          },
          (...boundArgs: Parameters<TWrappedMethod>) =>
            originalMethod.apply(this, boundArgs) as Promise<
              Awaited<ReturnType<TWrappedMethod>>
            >,
          args,
        );
      };

      // The wrapper has the same call shape as the original; the cast restores its exact type.
      return wrappedMethod as unknown as TWrappedMethod;
    };
  }

  // Imperative counterpart of `wrapWithLogging()`: runs an async function (or a
  // zero-arg closure) through `runWithAutoStatusEventLogging()` with the given
  // params recorded on the event data.
  // Standard overload: the logged params are exactly the tuple the method receives.
  static runWithLogging<TMethod extends AsyncOriginalMethod>(
    options: FlowLoggerLogOptions,
    originalMethod: TMethod,
    params: Readonly<Parameters<TMethod>>,
  ): Promise<Awaited<ReturnType<TMethod>>>;
  // Closure overload: an arbitrary params tuple is logged while a zero-arg closure executes.
  static runWithLogging<TResult>(
    options: FlowLoggerLogOptions,
    originalMethod: AsyncOriginalMethod<[], TResult>,
    params: ReadonlyArray<unknown>,
  ): Promise<Awaited<TResult>>;
  static runWithLogging(
    options: FlowLoggerLogOptions,
    originalMethod: AsyncOriginalMethod<unknown[], unknown>,
    params: ReadonlyArray<unknown>,
  ): Promise<unknown> {
    // Without an explicit context or an active async-local one there is
    // nothing to attach events to, so the method runs untouched rather than
    // fabricating a root event.
    if (!options.context && !loggerContext.getStore()) {
      return originalMethod(...params);
    }

    // Caller-supplied data plus a copy of the params tuple.
    const dataWithParams = {
      ...(options.data ?? {}),
      params: [...params],
    };

    const runLogged = (): Promise<unknown> =>
      FlowLogger.runWithAutoStatusEventLogging(
        { ...options, data: dataWithParams },
        () => originalMethod(...params),
      );

    if (!options.context) {
      // Already inside an active context; no re-entry needed.
      return runLogged();
    }

    // Re-enter the caller-owned context so wrapper events land under the same
    // session tree even when this code executes outside the original ALS chain.
    return loggerContext.run(
      FlowLogger.resolveReentryContext(options.context),
      runLogged,
    );
  }

  // Runs `fn` with async-local storage set to the re-entry form of `context`.
  // No wrapper events are emitted here; use this when the work already belongs
  // to a known parent and only the ambient context needs to be set manually.
  static withContext<T>(context: FlowLoggerContext, fn: () => T): T {
    const reentryContext = FlowLogger.resolveReentryContext(context);
    return loggerContext.run(reentryContext, fn);
  }

  // ===========================================================================
  // CDP Events
  // ===========================================================================

  // CDP method names classified as noisy (target/runtime bookkeeping, page
  // lifecycle, and per-request network traffic).
  // NOTE(review): the consumer is not visible in this part of the file;
  // presumably `logCdpEvent` uses this set to skip high-volume events — confirm.
  private static readonly NOISY_CDP_EVENTS = new Set([
    "Target.targetInfoChanged",
    "Runtime.executionContextCreated",
    "Runtime.executionContextDestroyed",
    "Runtime.executionContextsCleared",
    "Page.lifecycleEvent",
    "Network.dataReceived",
    "Network.loadingFinished",
    "Network.requestWillBeSentExtraInfo",
    "Network.responseReceivedExtraInfo",
    "Network.requestWillBeSent",
    "Network.responseReceived",
  ]);

  // Records an outgoing CDP command as a "call" event via `logCdpEvent()`.
  // The result (an event, or null) is handed back so the caller can later
  // attach the response or related messages to it.
  static logCdpCallEvent(
    context: FlowLoggerContext,
    data: {
      method: string;
      params?: object;
      targetId?: string | null;
    },
  ): FlowEvent | null {
    const callEvent = FlowLogger.logCdpEvent(context, "call", data);
    return callEvent;
  }

  // Records the reply to an earlier CDP call. The event kind is
  // "responseError" when `data.error` is set and "response" otherwise, and the
  // event is parented under the originating call's full ancestry.
  static logCdpResponseEvent(
    context: FlowLoggerContext,
    parentEvent: Pick<FlowEvent, "eventId" | "eventParentIds">,
    data: {
      method: string;
      result?: unknown;
      error?: string;
      targetId?: string | null;
    },
  ): void {
    const kind = data.error ? "responseError" : "response";
    // The call's own ancestors followed by the call itself.
    const ancestry = [...parentEvent.eventParentIds, parentEvent.eventId];
    FlowLogger.logCdpEvent(context, kind, data, ancestry);
  }

  // Records an unsolicited CDP message as a "message" event, parented under
  // the supplied event and that event's own ancestors.
  static logCdpMessageEvent(
    context: FlowLoggerContext,
    parentEvent: Pick<FlowEvent, "eventId" | "eventParentIds">,
    data: {
      method: string;
      params?: unknown;
      targetId?: string | null;
    },
  ): void {
    const ancestry = [...parentEvent.eventParentIds, parentEvent.eventId];
    FlowLogger.logCdpEvent(context, "message", data, ancestry);
  }

  // ===========================================================================
  // LLM Events
  // ===========================================================================

  // Forwards an `LlmRequestEvent` carrying the request id, model and optional
  // prompt summary to `emitLlmEvent()`.
  static logLlmRequest({
    requestId,
    model,
    prompt,
  }: {
    requestId: string;
    model: string;
    prompt?: string;
  }): void {
    const data = { requestId, model, prompt };
    FlowLogger.emitLlmEvent({ eventType: "LlmRequestEvent", data });
  }

  // Forwards an `LlmResponseEvent` carrying the request id, model, optional
  // output summary and optional token counts to `emitLlmEvent()`.
  static logLlmResponse({
    requestId,
    model,
    output,
    inputTokens,
    outputTokens,
  }: {
    requestId: string;
    model: string;
    output?: string;
    inputTokens?: number;
    outputTokens?: number;
  }): void {
    const data = { requestId, model, output, inputTokens, outputTokens };
    FlowLogger.emitLlmEvent({ eventType: "LlmResponseEvent", data });
  }

  // ===========================================================================
  // LLM Logging Middleware
  // ===========================================================================

  // Builds AI SDK middleware whose `wrapGenerate` hook logs an LLM request
  // event before calling `doGenerate()` and an LLM response event after it
  // resolves. The generate result itself is returned untouched.
  static createLlmLoggingMiddleware(
    modelId: string,
  ): Pick<LanguageModelMiddleware, "wrapGenerate"> {
    return {
      wrapGenerate: async ({ doGenerate, params }) => {
        // One id ties the request and response events together.
        const requestId = uuidv7();
        const prompt = FlowLogger.buildMiddlewarePromptSummary(params);
        FlowLogger.logLlmRequest({ requestId, model: modelId, prompt });

        const generated = await doGenerate();

        // Narrow view of the result fields the output summarizer reads.
        const summarizable = generated as {
          text?: string;
          content?: unknown;
          toolCalls?: unknown[];
        };
        const output = FlowLogger.buildMiddlewareOutputSummary(summarizable);

        FlowLogger.logLlmResponse({
          requestId,
          model: modelId,
          output,
          inputTokens: generated.usage?.inputTokens,
          outputTokens: generated.usage?.outputTokens,
        });

        return generated;
      },
    };
  }
}

// =============================================================================
// LLM Event Extraction Helpers
// =============================================================================

// Loose view of a single entry in an LLM message content array. Every field is
// optional because `extractLlmMessageContent` casts arbitrary provider parts
// to this shape and probes them defensively.
type ContentPart = {
  // Part discriminator; the extractor checks for "text", "image", "image_url" and "tool_result".
  type?: string;
  // Text carried by the part.
  text?: string;
  // Nested parts; recursed into when `type` is "tool_result".
  content?: unknown[];
  // Image payload (`source.data`), reported as a "kb image" marker.
  source?: { data?: string };
  // Image reference; sized only when the URL starts with "data:".
  image_url?: { url?: string };
  // Alternative image payload (`inlineData.data`), also reported as a "kb image" marker.
  inlineData?: { data?: string };
};

// Loose view of a provider message accepted by `extractLlmMessageSummary`.
// That function checks string `content` first, then string `text`, then a
// `parts` array, and finally an array-valued `content`.
type LlmMessageContent = {
  content?: unknown;
  text?: string;
  parts?: unknown[];
};

// Walks an LLM content array and collects two things: the first usable text
// and a list of image markers ("image" or "<size>kb image").
// `tool_result` parts are searched recursively. Shared by the summary helpers
// below so differently shaped provider messages render the same way.
function extractLlmMessageContent(content: unknown[]): {
  text?: string;
  extras: string[];
} {
  let text: string | undefined;
  const extras: string[] = [];
  const sizedImage = (data: string): string => `${dataToKb(data)}kb image`;

  for (const rawPart of content) {
    const part = rawPart as ContentPart;

    // Text: only parts typed "text" (or untyped) contribute; any other part
    // that happens to carry text leaves the slot empty for a later part.
    if (!text && part.text) {
      const isPlainText = part.type === "text" || !part.type;
      text = isPlainText ? part.text : undefined;
    }

    // Images arrive in several provider-specific shapes.
    const isImagePart = part.type === "image" || part.type === "image_url";
    if (isImagePart) {
      const url = part.image_url?.url;
      if (url?.startsWith("data:")) {
        extras.push(sizedImage(url));
      } else if (part.source?.data) {
        extras.push(sizedImage(part.source.data));
      } else {
        extras.push("image");
      }
    } else if (part.source?.data) {
      extras.push(sizedImage(part.source.data));
    } else if (part.inlineData?.data) {
      extras.push(sizedImage(part.inlineData.data));
    }

    // Tool results can nest another content array.
    if (part.type === "tool_result" && Array.isArray(part.content)) {
      const nested = extractLlmMessageContent(part.content);
      if (!text && nested.text) {
        text = nested.text;
      }
      extras.push(...nested.extras);
    }
  }

  return { text, extras };
}

// Collapses one provider-specific message into a single line of the form
// `text +{extra} +{extra}`. Returns undefined when there is neither text nor
// extras. Caller-supplied extras come first, followed by any image markers
// found in the message.
function extractLlmMessageSummary(
  input: LlmMessageContent,
  options?: {
    trimInstructionPrefix?: boolean;
    extras?: string[];
  },
): string | undefined {
  const extras = [...(options?.extras ?? [])];
  let text: string | undefined;

  if (typeof input.content === "string") {
    text = input.content;
  } else if (typeof input.text === "string") {
    text = input.text;
  } else {
    // `parts` takes precedence over an array-valued `content`.
    let parts: unknown[] | undefined;
    if (Array.isArray(input.parts)) {
      parts = input.parts;
    } else if (Array.isArray(input.content)) {
      parts = input.content;
    }

    if (parts) {
      const extracted = extractLlmMessageContent(parts);
      text = extracted.text;
      extras.push(...extracted.extras);
    }
  }

  if (options?.trimInstructionPrefix && text) {
    text = text.replace(/^[Ii]nstruction: /, "");
  }

  if (!text && extras.length === 0) return undefined;

  const pieces: string[] = [];
  if (text) {
    pieces.push(text);
  }
  if (extras.length > 0) {
    pieces.push(extras.map((e) => `+{${e}}`).join(" "));
  }

  return pieces.join(" ") || undefined;
}

// Summarizes the last message whose role is "user" into the one-line form used
// by standard LLM request logs, for example: `some text +{5.8kb image} +{schema}`.
// A leading "Instruction: " prefix is trimmed, and `schema` / `<n> tools`
// markers are added when the options ask for them. Any failure yields undefined.
export function extractLlmPromptSummary(
  messages: Array<{ role: string; content: unknown }>,
  options?: { toolCount?: number; hasSchema?: boolean },
): string | undefined {
  try {
    const userMessages = messages.filter((m) => m.role === "user");
    const lastUserMsg = userMessages[userMessages.length - 1];
    if (!lastUserMsg) return undefined;

    const extras: string[] = [];
    if (options?.hasSchema) {
      extras.push("schema");
    }
    if (options?.toolCount) {
      extras.push(`${options.toolCount} tools`);
    }

    return extractLlmMessageSummary(lastUserMsg, {
      trimInstructionPrefix: true,
      extras,
    });
  } catch {
    return undefined;
  }
}

// Summarizes the most recent CUA-style input message, meaning the last entry
// whose `role` is "user" or whose `type` is "tool_result". Accepts Anthropic,
// OpenAI, and Google-style payloads; any failure yields undefined.
export function extractLlmCuaPromptSummary(
  messages: unknown[],
): string | undefined {
  try {
    const candidates = messages.filter((entry) => {
      const { role, type } = entry as { role?: string; type?: string };
      return role === "user" || type === "tool_result";
    });
    const lastMsg = candidates[candidates.length - 1] as
      | { content?: unknown; parts?: unknown[]; text?: string }
      | undefined;

    return lastMsg ? extractLlmMessageSummary(lastMsg) : undefined;
  } catch {
    return undefined;
  }
}

// Renders the response side of a CUA exchange as one space-separated line.
// Items come from `candidates[0].content.parts` when present, otherwise from
// `output` itself when it is an array. Each item contributes its text, its
// function-call name, its tool_use name, or its type ("[item]" as a last
// resort). Any failure while reading the payload yields "[error]".
export function extractLlmCuaResponseSummary(output: unknown): string {
  type ResponseItem = {
    type?: string;
    text?: string;
    name?: string;
    functionCall?: { name?: string };
  };

  const describeItem = (item: unknown): string => {
    const entry = item as ResponseItem;
    if (entry.text) return entry.text;
    if (entry.functionCall?.name) return entry.functionCall.name;
    if (entry.type === "tool_use" && entry.name) return entry.name;
    return entry.type ?? "[item]";
  };

  try {
    const candidateParts = (
      output as { candidates?: [{ content?: { parts?: unknown[] } }] }
    )?.candidates?.[0]?.content?.parts;
    const items: unknown[] =
      candidateParts ?? (Array.isArray(output) ? output : []);

    return items.map((item) => describeItem(item)).join(" ");
  } catch {
    return "[error]";
  }
}


================================================
FILE: packages/core/lib/v3/flowlogger/prettify.ts
================================================
import { toTitleCase } from "../../utils.js";
import { FlowEvent } from "./FlowLogger.js";
import type { EventStoreApi } from "./EventStore.js";

const MAX_LINE_LENGTH = 160; // Maximum width for a prettified log line.

// =============================================================================
// Pretty Formatting
// =============================================================================

// All functions in this section intentionally share the `prettify` prefix so the formatting pipeline is easy to scan and reason about in one place.

// Recursively sanitizes a value for prettified output. Strings get their CDP
// ids shortened; arrays and plain objects are rebuilt with sanitized members;
// everything else passes through unchanged.
function prettifySanitizeValue(value: unknown): unknown {
  if (typeof value === "string") {
    return truncateCdpIds(value);
  }

  if (Array.isArray(value)) {
    return value.map((entry) => prettifySanitizeValue(entry));
  }

  if (value === null || typeof value !== "object") {
    return value;
  }

  const sanitizedEntries = Object.entries(value).map(
    ([key, entry]): [string, unknown] => [key, prettifySanitizeValue(entry)],
  );
  return Object.fromEntries(sanitizedEntries);
}

// Returns a copy of a Cdp* event with sanitized data, leaving the original
// untouched for sinks that serialize it verbatim. Events whose type does not
// start with "Cdp" are returned as-is.
export function prettifySanitizeEvent(event: FlowEvent): FlowEvent {
  const isCdpEvent = event.eventType.startsWith("Cdp");
  if (isCdpEvent) {
    const data = prettifySanitizeValue(event.data) as Record<string, unknown>;
    return { ...event, data };
  }

  return event;
}

// Collapses runs of newlines and tabs into single spaces, then truncates the
// result to at most `maxLen` characters. Truncated lines keep roughly the first
// 70% and the last 30% of the budget joined by "…", so trailing ids and result
// summaries stay visible.
//
// Narrow widths are handled explicitly: when the tail budget rounds down to
// zero, no tail is appended (`slice(-0)` would otherwise return the whole
// string), and a non-positive `maxLen` yields an empty string.
function prettifyTruncateLine(value: string, maxLen: number): string {
  const collapsed = value.replace(/[\r\n\t]+/g, " ");
  if (collapsed.length <= maxLen) {
    return collapsed;
  }

  if (maxLen <= 0) {
    return "";
  }

  const endLen = Math.floor(maxLen * 0.3);
  // One character of the budget is reserved for the ellipsis.
  const startLen = maxLen - endLen - 1;
  const tail = endLen > 0 ? collapsed.slice(-endLen) : "";
  return `${collapsed.slice(0, startLen)}…${tail}`;
}

// Renders a single value compactly for pretty logs: strings are wrapped in
// single quotes, primitives and nullish values go through `String()`, and
// objects are JSON-encoded ("[unserializable]" when encoding throws).
function prettifyFormatValue(value: unknown): string {
  if (typeof value === "string") {
    return `'${value}'`;
  }

  const isObject = typeof value === "object" && value !== null;
  if (!isObject) {
    return String(value);
  }

  try {
    return JSON.stringify(value);
  } catch {
    return "[unserializable]";
  }
}

// Renders one argument or an argument list as a comma-separated string.
// `undefined` entries and entries that render to an empty string are omitted.
function prettifyFormatArgs(args?: unknown | unknown[]): string {
  if (args === undefined) {
    return "";
  }

  const entries = Array.isArray(args) ? args : [args];
  const rendered: string[] = [];
  for (const entry of entries) {
    if (entry === undefined) {
      continue;
    }

    const text = prettifyFormatValue(entry);
    if (text.length > 0) {
      rendered.push(text);
    }
  }

  return rendered.join(", ");
}

// Last four characters of an id, used inside pretty tags; "-" when the id is
// missing or empty.
function shortId(id: string | null | undefined): string {
  if (!id) {
    return "-";
  }

  return id.slice(-4);
}

// Abbreviates 32-character uppercase-hex ids that follow an `id`/`Id` key to
// `first4…last4`, keeping pretty logs readable while leaving enough of the id
// to correlate related targets.
function truncateCdpIds(value: string): string {
  const idPattern = /([iI]d:?"?)([0-9A-F]{32})(?="?[,})\s]|$)/g;
  const abbreviate = (_match: string, prefix: string, id: string): string => {
    const head = id.slice(0, 4);
    const tail = id.slice(-4);
    return `${prefix}${head}…${tail}`;
  };

  return value.replace(idPattern, abbreviate);
}

// Module-wide counter appended to every formatted timestamp.
let nonce = 0;

// Formats a date as `YYYY-MM-DD HH:MM:SS.mmmNN` using the local-time getters.
// `NN` is the counter above modulo 100, so lines emitted within the same
// millisecond still get distinct suffixes (until the counter wraps).
function prettifyFormatTimestamp(date: Date): string {
  const pad = (value: number, width = 2) => String(value).padStart(width, "0");

  const day = [
    date.getFullYear(),
    pad(date.getMonth() + 1),
    pad(date.getDate()),
  ].join("-");
  const time = [
    pad(date.getHours()),
    pad(date.getMinutes()),
    pad(date.getSeconds()),
  ].join(":");
  const millis = pad(date.getMilliseconds(), 3);
  const suffix = pad(nonce++ % 100);

  return `${day} ${time}.${millis}${suffix}`;
}

// Strips single and double quotes from the final pretty line, keeping quotes
// that are escaped with a backslash, then trims surrounding whitespace.
//
// A lookbehind is used instead of consuming the preceding character, so
// back-to-back quotes (for example the `''` produced by an empty string
// argument, or `""` inside JSON) are both removed rather than leaving a stray
// quote behind.
function prettifyRemoveQuotes(value: string): string {
  return (
    value
      .replace(/(?<!\\)["']/g, "")
      // An escaped quote at either end of the line is still dropped.
      .replace(/^["']|["']$/g, "")
      .trim()
  );
}

// Removes the lifecycle suffixes (`CompletedEvent`, `ErrorEvent`, `Event`) so
// the started/completed/error variants of one operation share a logical name.
// The suffixes are stripped one after another, in that order.
function prettifyEventName(eventType: string): string {
  const lifecycleSuffixes = [/CompletedEvent$/, /ErrorEvent$/, /Event$/];
  return lifecycleSuffixes.reduce(
    (name, suffix) => name.replace(suffix, ""),
    eventType,
  );
}

// Reduces an event type to its bare operation name by first dropping the
// lifecycle suffix and then stripping the Agent / Stagehand / Understudy / Page
// prefixes, one after another in that order.
function prettifyEventAction(eventType: string): string {
  const ownerPrefixes = [/^Agent/, /^Stagehand/, /^Understudy/, /^Page/];

  let action = prettifyEventName(eventType);
  for (const prefix of ownerPrefixes) {
    action = action.replace(prefix, "");
  }

  return action;
}

// Renders `▷ Target.method(args)` with the method's first letter lower-cased.
// When the method portion is blank (for example for `StagehandEvent`) the
// `.method` member is omitted entirely.
function prettifyFormatMethodCall(
  target: string,
  method: string,
  args: unknown,
): string {
  let member = "";
  if (method) {
    member = `.${method.charAt(0).toLowerCase()}${method.substring(1)}`;
  }

  const renderedArgs = prettifyFormatEventArgs(args);
  return `▷ ${target}${member}(${renderedArgs})`;
}

// True when the event's logical name starts with "Agent"; used for the agent ancestry tag.
function prettifyIsAgentEvent(event: FlowEvent): boolean {
  const name = prettifyEventName(event.eventType);
  return name.startsWith("Agent");
}

// True when the event's logical name starts with "Stagehand"; used for the Stagehand ancestry tag.
function prettifyIsStagehandEvent(event: FlowEvent): boolean {
  const name = prettifyEventName(event.eventType);
  return name.startsWith("Stagehand");
}

// True when the event's logical name starts with "Page" or "Understudy"; used for the action tag.
function prettifyIsActionEvent(event: FlowEvent): boolean {
  const name = prettifyEventName(event.eventType);
  return name.startsWith("Page") || name.startsWith("Understudy");
}

// True when the event's logical name starts with "Cdp"; such events go to the CDP formatter.
export function prettifyIsCdpEvent(event: FlowEvent): boolean {
  const name = prettifyEventName(event.eventType);
  return name.startsWith("Cdp");
}

// True when the event's logical name starts with "Llm"; such events go to the LLM formatter.
function prettifyIsLlmEvent(event: FlowEvent): boolean {
  const name = prettifyEventName(event.eventType);
  return name.startsWith("Llm");
}

// True for `*CompletedEvent` types. These inherit their tags from the started operation.
function prettifyIsCompletedEvent(event: FlowEvent): boolean {
  const { eventType } = event;
  return eventType.endsWith("CompletedEvent");
}

// True for `*ErrorEvent` types. These inherit their tags from the started operation.
function prettifyIsErrorEvent(event: FlowEvent): boolean {
  const { eventType } = event;
  return eventType.endsWith("ErrorEvent");
}

// Renders one bracketed tag such as `[🆂 #7bf4 ACT]` for stderr/file pretty
// logs. Without an id there is nothing to reference, so the "⤑" placeholder is
// emitted instead.
function prettifyFormatTag(
  label: string | null | undefined,
  id: string | null | undefined,
  icon: string,
): string {
  if (!id) {
    return "⤑";
  }

  const labelSuffix = label ? ` ${label}` : "";
  return `[${icon} #${shortId(id)}${labelSuffix}]`;
}

// Converts a millisecond duration into seconds with two decimals (`1.50s`).
// Anything that is not a number yields null.
function prettifyFormatDuration(durationMs?: unknown): string | null {
  if (typeof durationMs !== "number") {
    return null;
  }

  const seconds = durationMs / 1000;
  return `${seconds.toFixed(2)}s`;
}

// Squeezes a prompt or output payload into a single display string capped at
// half the pretty line width. Strings are used as-is, other values are
// formatted first, and nullish payloads yield undefined.
function prettifySummarizePrompt(value: unknown): string | undefined {
  if (value == null) {
    return undefined;
  }

  const text = typeof value === "string" ? value : prettifyFormatValue(value);
  return prettifyTruncateLine(text, MAX_LINE_LENGTH / 2);
}

// Property names whose values are swapped for a `[Title]` placeholder instead
// of being stringified.
const PRETTIFY_PLACEHOLDER_KEYS: ReadonlySet<string> = new Set([
  "page",
  "frame",
  "locator",
  "conn",
  "mainSession",
  "sessions",
  "registry",
  "networkManager",
  "apiClient",
]);

// Recursively copies a value for pretty output. Properties named in the set
// above are replaced by placeholders so large live runtime objects never reach
// the stringifier. Primitives are returned unchanged.
function prettifyCompactValue(value: unknown): unknown {
  if (value === null || typeof value !== "object") {
    return value;
  }

  if (Array.isArray(value)) {
    return value.map((entry) => prettifyCompactValue(entry));
  }

  const compacted: Record<string, unknown> = {};
  for (const [key, entry] of Object.entries(value)) {
    compacted[key] = PRETTIFY_PLACEHOLDER_KEYS.has(key)
      ? `[${toTitleCase(key)}]`
      : prettifyCompactValue(entry);
  }

  return compacted;
}

// Compacts live object references out of the arguments, then renders them as a
// comma-separated argument string.
function prettifyFormatEventArgs(args?: unknown | unknown[]): string {
  const compacted = prettifyCompactValue(args) as unknown | unknown[];
  return prettifyFormatArgs(compacted);
}

// Looks for the closest event matching `predicate`: the event itself (unless
// `includeSelf` is false), then its parents from last to first in
// `eventParentIds`. Parents missing from `parentMap` are skipped. Pretty tags
// use this to recover agent/stagehand/action/llm ancestry.
function prettifyFindNearestEvent(
  event: FlowEvent,
  parentMap: Map<string, FlowEvent>,
  predicate: (candidate: FlowEvent) => boolean,
  options?: { includeSelf?: boolean },
): FlowEvent | null {
  const includeSelf = options?.includeSelf ?? true;
  if (includeSelf && predicate(event)) {
    return event;
  }

  const parentIdsFromLast = [...event.eventParentIds].reverse();
  for (const parentId of parentIdsFromLast) {
    const parent = parentMap.get(parentId);
    if (parent && predicate(parent)) {
      return parent;
    }
  }

  return null;
}

// Builds the semantic ancestry tags shown at the start of each pretty log line, e.g.
// 2026-03-16 22:04:15.45540 [🅰 #1083] [🆂 #7bf4 ACT] [🆄 #2125 CLICK] [🅲 #8B8B CDP] ⏴ Network.policyUpdated({})
// Which tags appear depends on the event family (agent, Stagehand, action, CDP, LLM).
// Unrecognized events fall back to a bare `[#id]` tag.
function prettifyBuildContextTags(
  event: FlowEvent,
  parentMap: Map<string, FlowEvent>,
): string[] {
  // Completed/error events look only at their ancestors, so the completion
  // line points back to the id of the operation that started.
  const includeSelf = !(
    prettifyIsCompletedEvent(event) || prettifyIsErrorEvent(event)
  );
  const nearest = (
    predicate: (candidate: FlowEvent) => boolean,
  ): FlowEvent | null =>
    prettifyFindNearestEvent(event, parentMap, predicate, { includeSelf });
  const upperAction = (eventType: string): string =>
    prettifyEventAction(eventType).toUpperCase();

  const agentEvent = nearest(prettifyIsAgentEvent);
  const stagehandEvent = nearest(prettifyIsStagehandEvent);
  const actionEvent = nearest(prettifyIsActionEvent);
  const llmEvent = nearest(prettifyIsLlmEvent);

  const stagehandLabel = stagehandEvent
    ? upperAction(stagehandEvent.eventType)
    : "";
  const actionLabel = actionEvent ? upperAction(actionEvent.eventType) : "";

  // Tags shared by several event families.
  const agentTag = (): string =>
    prettifyFormatTag("", agentEvent?.eventId, "🅰");
  const stagehandTag = (): string =>
    prettifyFormatTag(stagehandLabel, stagehandEvent?.eventId, "🆂");

  if (prettifyIsAgentEvent(event)) {
    return [agentTag()];
  }

  if (prettifyIsStagehandEvent(event)) {
    const ownLabel = upperAction(stagehandEvent?.eventType ?? event.eventType);
    return [
      agentTag(),
      prettifyFormatTag(ownLabel, stagehandEvent?.eventId, "🆂"),
    ];
  }

  if (prettifyIsActionEvent(event)) {
    const ownLabel = upperAction(actionEvent?.eventType ?? event.eventType);
    return [
      agentTag(),
      stagehandTag(),
      prettifyFormatTag(ownLabel, actionEvent?.eventId, "🆄"),
    ];
  }

  if (prettifyIsCdpEvent(event)) {
    // CDP lines are tagged with the target id carried in the event data.
    const targetId =
      typeof event.data.targetId === "string" ? event.data.targetId : null;
    return [
      agentTag(),
      stagehandTag(),
      prettifyFormatTag(actionLabel, actionEvent?.eventId, "🆄"),
      prettifyFormatTag("CDP", targetId, "🅲"),
    ];
  }

  if (prettifyIsLlmEvent(event)) {
    // Prefer the LLM request id; otherwise use the nearest LLM event's id.
    const requestId =
      typeof event.data.requestId === "string" ? event.data.requestId : null;
    return [
      agentTag(),
      stagehandTag(),
      prettifyFormatTag("LLM", requestId ?? llmEvent?.eventId, "🅻"),
    ];
  }

  return [`[#${shortId(event.eventId)}]`];
}

// Renders the details portion of a started/root event as a method call on its
// owner (Stagehand, Page, Understudy or Agent). Other event types fall back to
// `EventType(args)`.
function prettifyFormatStartedDetails(event: FlowEvent): string {
  const { params, target } = event.data as {
    params?: unknown[];
    target?: string;
  };
  const name = prettifyEventName(event.eventType);
  const method = prettifyEventAction(event.eventType);

  // Stagehand and Page share the plain `Owner.method(params)` form.
  for (const owner of ["Stagehand", "Page"]) {
    if (name.startsWith(owner)) {
      return prettifyFormatMethodCall(owner, method, params);
    }
  }

  if (name.startsWith("Understudy")) {
    // Understudy calls lead with the target, followed by the regular params.
    const paramList = Array.isArray(params) ? params : [];
    const args = [target, ...paramList].filter((entry) => entry !== undefined);
    return prettifyFormatMethodCall("Understudy", method, args);
  }

  if (name.startsWith("Agent")) {
    return `▷ Agent.execute(${prettifyFormatEventArgs(params)})`;
  }

  const fallbackArgs = prettifyFormatEventArgs(params ?? event.data);
  return `${event.eventType}(${fallbackArgs})`;
}

// Renders the details portion of a completed/error event: a ✓ or ✕ marker, the
// operation name, the duration when one is recorded, and the error text for
// error events that carry a string `error`.
function prettifyFormatCompletedDetails(event: FlowEvent): string {
  const failed = prettifyIsErrorEvent(event);
  const marker = failed ? "✕" : "✓";

  let subject = "Agent.execute()";
  if (!prettifyIsAgentEvent(event)) {
    // Fall back to the raw event type when no action name is left after stripping.
    subject =
      prettifyEventAction(event.eventType).toUpperCase() || event.eventType;
  }

  const duration = prettifyFormatDuration(event.data.durationMs);
  const durationText = duration ? ` in ${duration}` : "";
  const errorText =
    failed && typeof event.data.error === "string"
      ? ` ERROR ${event.data.error}`
      : "";

  return `${marker} ${subject} completed${durationText}${errorText}`;
}

// Renders CDP traffic as `⏵ Method(params)` for outgoing calls and
// `⏴ Method(payload)` for everything else. These are formatted separately from
// Stagehand lifecycle events because they are transport-level messages, not
// method envelopes. The payload is the params for calls and messages, the
// error when one is present on a non-call event, and the result otherwise.
function prettifyFormatCdpDetails(event: FlowEvent): string {
  const data = event.data as {
    method?: string;
    params?: unknown;
    result?: unknown;
    error?: string;
  };
  const isCall = event.eventType === "CdpCallEvent";
  const isMessage = event.eventType === "CdpMessageEvent";

  let payload: unknown;
  if (isCall || (!data.error && isMessage)) {
    payload = data.params;
  } else if (data.error) {
    payload = { error: data.error };
  } else {
    payload = data.result;
  }

  const arrow = isCall ? "⏵" : "⏴";
  const method = data.method ?? "unknown";
  return `${arrow} ${method}(${prettifyFormatEventArgs(payload)})`;
}

// Renders LLM traffic for pretty logs: `model ⏴ prompt` for requests and
// `model ↳ ꜛin ꜜout output` for every other LLM event. Token counts appear only
// when a positive count was recorded.
function prettifyFormatLlmDetails(event: FlowEvent): string {
  const data = event.data as {
    model?: string;
    prompt?: unknown;
    output?: unknown;
    inputTokens?: number;
    outputTokens?: number;
  };
  const model = data.model ?? "llm";

  if (event.eventType === "LlmRequestEvent") {
    const prompt = prettifySummarizePrompt(data.prompt);
    return prompt ? `${model} ⏴ ${prompt}` : `${model} ⏴`;
  }

  // First non-zero count decides whether the token block is shown.
  const reportedTokens = data.inputTokens || data.outputTokens;
  const hasTokens = (reportedTokens ?? 0) > 0;
  const tokenInfo = hasTokens
    ? ` ꜛ${data.inputTokens ?? 0} ꜜ${data.outputTokens ?? 0}`
    : "";

  const output = prettifySummarizePrompt(data.output);
  const head = `${model} ↳${tokenInfo}`;
  return output ? `${head} ${output}` : head;
}

// Converts a flow event into a single pretty log line made of a timestamp,
// ancestry tags and event details. Ancestry is recovered from the 500 most
// recent events returned by the store's query sink. Returns null when the
// selected formatter produces no details.
export async function prettifyEvent(
  store: Pick<EventStoreApi, "query">,
  event: FlowEvent,
): Promise<string | null> {
  const recentEvents = await store.query({ limit: 500 });
  const parentMap = new Map(
    recentEvents.map((recentEvent) => [recentEvent.eventId, recentEvent]),
  );
  const tags = prettifyBuildContextTags(event, parentMap);

  // Pick exactly one formatter. The started-details formatter is the fallback
  // and is no longer run for events whose details would be overwritten anyway.
  let details: string;
  if (prettifyIsCdpEvent(event)) {
    details = prettifyFormatCdpDetails(event);
  } else if (prettifyIsLlmEvent(event)) {
    details = prettifyFormatLlmDetails(event);
  } else if (prettifyIsCompletedEvent(event) || prettifyIsErrorEvent(event)) {
    details = prettifyFormatCompletedDetails(event);
  } else {
    details = prettifyFormatStartedDetails(event);
  }

  if (!details) {
    return null;
  }

  // Validate the creation time before formatting. An unparseable timestamp
  // falls back to "now", and the timestamp nonce is consumed only once per line.
  const createdAt = new Date(event.eventCreatedAt);
  const timestamp = prettifyFormatTimestamp(
    Number.isNaN(createdAt.getTime()) ? new Date() : createdAt,
  );

  const line = `${timestamp} ${tags.join(" ")} ${details}`;
  const cleaned = prettifyRemoveQuotes(line);
  // CDP ids can resurface in a matchable form once quotes are stripped.
  const processed = prettifyIsCdpEvent(event)
    ? truncateCdpIds(cleaned)
    : cleaned;
  return prettifyTruncateLine(processed, MAX_LINE_LENGTH);
}

// Adds subtle ANSI color to a pretty line destined for stderr; file sinks
// never call this. Coloring is skipped when NO_COLOR is set, when FORCE_COLOR
// is "0", or when FORCE_COLOR is unset and stderr is not a TTY or TERM is "dumb".
export function prettifyColorStderrLine(line: string): string {
  const { NO_COLOR, FORCE_COLOR, TERM } = process.env;

  if (NO_COLOR !== undefined || FORCE_COLOR === "0") {
    return line;
  }
  if (!FORCE_COLOR && (!process.stderr.isTTY || TERM === "dumb")) {
    return line;
  }

  const paint = (code: string, value: string): string =>
    `\u001B[${code}m${value}\u001B[0m`;

  // Tag colors by icon; any icon not listed here (🅲) uses the dim "90".
  const tagColors: Record<string, string> = {
    "🅰": "36",
    "🆂": "33",
    "🆄": "32",
    "🅻": "95",
  };

  // The replacements below run in this exact order.
  let colored = line;
  colored = colored.replace(
    /^(\d{4}-\d{2}-\d{2} \d{2}:\d{2}:\d{2}\.\d{5})/,
    (_, timestamp) => paint("2", timestamp),
  );
  colored = colored.replace(/\[([🅰🆂🆄🅻🅲])([^\]]*)\]/gu, (_, icon, rest) =>
    paint(tagColors[icon] ?? "90", `[${icon}${rest}]`),
  );
  colored = colored.replace(
    / in (\d+(?:\.\d+)?s)/g,
    (_, duration) => ` ${paint("2", "in")} ${paint("2", duration)}`,
  );
  colored = colored
    .replace(/▷/g, paint("96", "▷"))
    .replace(/⏴/g, paint("96", "⏴"))
    .replace(/↳/g, paint("95", "↳"))
    .replace(/ꜛ/g, paint("33", "ꜛ"))
    .replace(/ꜜ/g, paint("95", "ꜜ"))
    .replace(/…/g, paint("94", "…"));
  colored = colored.replace(/[(){}=]/g, (char) => paint("94", char));
  colored = colored.replace(
    /([A-Za-z])(\.)([A-Za-z])/g,
    (_, left, dot, right) => `${left}${paint("94", dot)}${right}`,
  );
  colored = colored
    .replace(/ ✓ /g, ` ${paint("32", "✓")} `)
    .replace(/ ✕ /g, ` ${paint("31", "✕")} `);

  return colored;
}


================================================
FILE: packages/core/lib/v3/handlers/actHandler.ts
================================================
// lib/v3/handlers/actHandler.ts
import { act as actInference } from "../../inference.js";
import { buildActPrompt, buildStepTwoPrompt } from "../../prompt.js";
import { trimTrailingTextNode } from "../../utils.js";
import { v3Logger } from "../logger.js";
import { ActHandlerParams } from "../types/private/handlers.js";
import { ActResult, Action, V3FunctionName } from "../types/public/methods.js";
import { ActTimeoutError } from "../types/public/sdkErrors.js";
import {
  captureHybridSnapshot,
  diffCombinedTrees,
} from "../understudy/a11y/snapshot/index.js";
import { LLMClient } from "../llm/LLMClient.js";
import { SupportedUnderstudyAction } from "../types/private/index.js";
import { EncodedId } from "../types/private/internal.js";
import {
  AvailableModel,
  ClientOptions,
  ModelConfiguration,
} from "../types/public/model.js";
import type { Variables } from "../types/public/agent.js";
import type { Page } from "../understudy/page.js";
import {
  performUnderstudyMethod,
  waitForDomNetworkQuiet,
} from "./handlerUtils/actHandlerUtils.js";
import { createTimeoutGuard } from "./handlerUtils/timeoutGuard.js";
import { resolveVariableValue } from "../agent/utils/variables.js";

/**
 * Shape of the `element` field of an act inference response, as consumed by
 * `normalizeActInferenceElement` before it is turned into an `Action`.
 */
type ActInferenceElement = {
  // Encoded element id; used as the lookup key into the snapshot's xpath map.
  elementId?: string;
  // Description of the element/action; copied onto the resulting Action.
  description: string;
  // Method to perform. The literal "not-supported" is treated as "no usable method".
  method?: string;
  // Arguments for the method (for dragAndDrop, the first one is a target element id).
  arguments?: string[];
};

// Resolved (awaited) return type of `actInference`, derived from the function itself.
type ActInferenceResponse = Awaited<ReturnType<typeof actInference>>;

/**
 * Handles `act` requests: asks the LLM which element and method satisfy an
 * instruction against a snapshot of the page, then performs that action.
 *
 * Supports an optional second step (when the inference response sets
 * `twoStep`) and an optional self-heal retry (when `selfHeal` is enabled)
 * that re-infers the selector after a failed action.
 */
export class ActHandler {
  private readonly llmClient: LLMClient;
  private readonly defaultModelName: AvailableModel;
  private readonly defaultClientOptions: ClientOptions;
  private readonly resolveLlmClient: (model?: ModelConfiguration) => LLMClient;
  private readonly systemPrompt: string;
  private readonly logInferenceToFile: boolean;
  private readonly selfHeal: boolean;
  private readonly onMetrics?: (
    functionName: V3FunctionName,
    promptTokens: number,
    completionTokens: number,
    reasoningTokens: number,
    cachedInputTokens: number,
    inferenceTimeMs: number,
  ) => void;
  private readonly defaultDomSettleTimeoutMs?: number;

  /**
   * @param llmClient - Fallback client used by `takeDeterministicAction` when no override is passed.
   * @param defaultModelName - Stored on the instance; not read by this class.
   * @param defaultClientOptions - Stored on the instance; not read by this class.
   * @param resolveLlmClient - Maps an optional per-call model configuration to a client.
   * @param systemPrompt - User-provided instructions forwarded to inference (defaults to "").
   * @param logInferenceToFile - Forwarded to inference (defaults to false).
   * @param selfHeal - When truthy, failed actions are retried once with a re-inferred selector.
   * @param onMetrics - Optional callback receiving token/latency metrics per inference call.
   * @param defaultDomSettleTimeoutMs - Default DOM settle timeout passed to page operations.
   */
  constructor(
    llmClient: LLMClient,
    defaultModelName: AvailableModel,
    defaultClientOptions: ClientOptions,
    resolveLlmClient: (model?: ModelConfiguration) => LLMClient,
    systemPrompt?: string,
    logInferenceToFile?: boolean,
    selfHeal?: boolean,
    onMetrics?: (
      functionName: V3FunctionName,
      promptTokens: number,
      completionTokens: number,
      reasoningTokens: number,
      cachedInputTokens: number,
      inferenceTimeMs: number,
    ) => void,
    defaultDomSettleTimeoutMs?: number,
  ) {
    this.llmClient = llmClient;
    this.defaultModelName = defaultModelName;
    this.defaultClientOptions = defaultClientOptions;
    this.resolveLlmClient = resolveLlmClient;
    this.systemPrompt = systemPrompt ?? "";
    this.logInferenceToFile = logInferenceToFile ?? false;
    this.selfHeal = !!selfHeal;
    this.onMetrics = onMetrics;
    this.defaultDomSettleTimeoutMs = defaultDomSettleTimeoutMs;
  }

  /** Reports the usage numbers of one act inference call; missing counters are reported as 0. */
  private recordActMetrics(response: ActInferenceResponse): void {
    this.onMetrics?.(
      V3FunctionName.ACT,
      response.prompt_tokens ?? 0,
      response.completion_tokens ?? 0,
      response.reasoning_tokens ?? 0,
      response.cached_input_tokens ?? 0,
      response.inference_time_ms ?? 0,
    );
  }

  /**
   * Runs act inference and converts the returned element into an `Action`.
   *
   * @returns The raw inference response, plus `action` when the element could
   *   be normalized (valid element id with a known xpath and, when
   *   `requireMethodAndArguments` is true, a supported method and an
   *   arguments array). `action` is omitted otherwise.
   */
  private async getActionFromLLM({
    instruction,
    domElements,
    xpathMap,
    llmClient,
    requireMethodAndArguments = true,
  }: {
    instruction: string;
    domElements: string;
    xpathMap: Record<string, string>;
    llmClient: LLMClient;
    requireMethodAndArguments?: boolean;
  }): Promise<{ action?: Action; response: ActInferenceResponse }> {
    const response = await actInference({
      instruction,
      domElements,
      llmClient,
      userProvidedInstructions: this.systemPrompt,
      logger: v3Logger,
      logInferenceToFile: this.logInferenceToFile,
    });

    // Metrics are recorded for every inference call, even if no action results.
    this.recordActMetrics(response);

    const normalized = normalizeActInferenceElement(
      response.element as ActInferenceElement | undefined,
      xpathMap,
      requireMethodAndArguments,
    );

    if (!normalized) {
      return { response };
    }

    return {
      action: { ...normalized } as Action,
      response,
    };
  }

  /**
   * Performs an instruction on the page.
   *
   * Flow: wait for the DOM/network to settle, snapshot the page, ask the LLM
   * for an action, and perform it. If the inference response has
   * `twoStep === true`, a second snapshot is taken, diffed against the first,
   * and the LLM is asked for a follow-up action which is then performed too.
   *
   * `ensureTimeRemaining` comes from `createTimeoutGuard` and is invoked
   * before each expensive step (presumably throwing `ActTimeoutError` once
   * `timeout` has elapsed — see `createTimeoutGuard`).
   *
   * @returns The result of the single action, or a combined result for the
   *   two-step flow. Returns a failed result (without throwing) when the LLM
   *   yields no usable action.
   */
  async act(params: ActHandlerParams): Promise<ActResult> {
    const { instruction, page, variables, timeout, model } = params;

    const llmClient = this.resolveLlmClient(model);
    const ensureTimeRemaining = createTimeoutGuard(
      timeout,
      (ms) => new ActTimeoutError(ms),
    );

    ensureTimeRemaining();
    await waitForDomNetworkQuiet(
      page.mainFrame(),
      this.defaultDomSettleTimeoutMs,
    );
    ensureTimeRemaining();
    const { combinedTree, combinedXpathMap } = await captureHybridSnapshot(
      page,
      { experimental: true },
    );

    const actInstruction = buildActPrompt(
      instruction,
      Object.values(SupportedUnderstudyAction),
      variables,
    );

    ensureTimeRemaining();
    const { action: firstAction, response: actInferenceResponse } =
      await this.getActionFromLLM({
        instruction: actInstruction,
        domElements: combinedTree,
        xpathMap: combinedXpathMap,
        llmClient,
      });

    if (!firstAction) {
      v3Logger({
        category: "action",
        message: "no actionable element returned by LLM",
        level: 1,
      });
      return {
        success: false,
        message: "Failed to perform act: No action found",
        actionDescription: instruction,
        actions: [],
      };
    }

    // First action (self-heal aware path)
    ensureTimeRemaining();
    const firstResult = await this.takeDeterministicAction(
      firstAction,
      page,
      this.defaultDomSettleTimeoutMs,
      llmClient,
      ensureTimeRemaining,
      variables,
    );

    // If not two-step, return the first action result
    if (actInferenceResponse?.twoStep !== true) {
      return firstResult;
    }

    // Take a new focused snapshot and observe again
    ensureTimeRemaining();
    const { combinedTree: combinedTree2, combinedXpathMap: combinedXpathMap2 } =
      await captureHybridSnapshot(page, {
        experimental: true,
      });

    let diffedTree = diffCombinedTrees(combinedTree, combinedTree2);
    if (!diffedTree.trim()) {
      // Fallback: if no diff detected, use the fresh tree to avoid empty context
      diffedTree = combinedTree2;
    }

    const previousAction = `method: ${firstAction.method}, description: ${firstAction.description}, arguments: ${firstAction.arguments}`;

    // The second step is offered every supported action except
    // SELECT_OPTION_FROM_DROPDOWN.
    const stepTwoInstructions = buildStepTwoPrompt(
      instruction,
      previousAction,
      Object.values(SupportedUnderstudyAction).filter(
        (
          action,
        ): action is Exclude<
          SupportedUnderstudyAction,
          SupportedUnderstudyAction.SELECT_OPTION_FROM_DROPDOWN
        > => action !== SupportedUnderstudyAction.SELECT_OPTION_FROM_DROPDOWN,
      ),
      variables,
    );

    ensureTimeRemaining();
    const { action: secondAction } = await this.getActionFromLLM({
      instruction: stepTwoInstructions,
      domElements: diffedTree,
      xpathMap: combinedXpathMap2,
      llmClient,
    });

    if (!secondAction) {
      // No second action found — return first result as-is
      return firstResult;
    }

    ensureTimeRemaining();
    const secondResult = await this.takeDeterministicAction(
      secondAction,
      page,
      this.defaultDomSettleTimeoutMs,
      llmClient,
      ensureTimeRemaining,
      variables,
    );

    // Combine results: both steps must succeed; messages are chained in order
    // regardless of the second step's outcome.
    return {
      success: firstResult.success && secondResult.success,
      message: `${firstResult.message} → ${secondResult.message}`,
      actionDescription: firstResult.actionDescription,
      actions: [
        ...(firstResult.actions || []),
        ...(secondResult.actions || []),
      ],
    };
  }

  /**
   * Performs an already-resolved action (method + selector + arguments).
   *
   * `%name%` placeholders in the arguments are substituted from `variables`
   * before the action runs, but the returned `actions` entries keep the
   * original, unsubstituted arguments.
   *
   * On failure, when self-heal is enabled, the page is re-snapshotted and the
   * LLM is asked for a fresh element; the original method and arguments are
   * then retried once against the new selector (falling back to the original
   * selector if the re-inferred element could not be normalized).
   *
   * @param action - Action to perform; its `method` must be a supported one.
   * @param page - Page to act on (the main frame is used as the starting frame).
   * @param domSettleTimeoutMs - Overrides the handler's default settle timeout.
   * @param llmClientOverride - Client for the self-heal inference; defaults to the handler's client.
   * @param ensureTimeRemaining - Optional timeout guard invoked before each step.
   * @param variables - Values for `%name%` placeholder substitution.
   * @returns A result object; failures are reported via `success: false`.
   * @throws ActTimeoutError - Rethrown as-is whenever it surfaces from a step.
   */
  async takeDeterministicAction(
    action: Action,
    page: Page,
    domSettleTimeoutMs?: number,
    llmClientOverride?: LLMClient,
    ensureTimeRemaining?: () => void,
    variables?: Variables,
  ): Promise<ActResult> {
    ensureTimeRemaining?.();
    const settleTimeout = domSettleTimeoutMs ?? this.defaultDomSettleTimeoutMs;
    const effectiveClient = llmClientOverride ?? this.llmClient;
    const method = action.method?.trim();
    if (!method || method === "not-supported") {
      v3Logger({
        category: "action",
        message: "action has no supported method",
        level: 0,
        auxiliary: {
          act: { value: JSON.stringify(action), type: "object" },
        },
      });
      return {
        success: false,
        message: `Unable to perform action: The method '${method ?? ""}' is not supported in Action. Please use a supported Playwright locator method.`,
        actionDescription:
          action.description || `Action (${method ?? "unknown"})`,
        actions: [],
      };
    }

    // Keep the placeholder form for the returned result; only the resolved
    // form is sent to the page.
    const placeholderArgs = Array.isArray(action.arguments)
      ? [...action.arguments]
      : [];
    const resolvedArgs =
      substituteVariablesInArguments(action.arguments, variables) ?? [];

    try {
      ensureTimeRemaining?.();
      await performUnderstudyMethod(
        page,
        page.mainFrame(),
        method,
        action.selector,
        resolvedArgs,
        settleTimeout,
      );
      return {
        success: true,
        message: `Action [${method}] performed successfully on selector: ${action.selector}`,
        actionDescription: action.description || `action (${method})`,
        actions: [
          {
            selector: action.selector,
            description: action.description || `action (${method})`,
            method,
            arguments: placeholderArgs,
          },
        ],
      };
    } catch (err) {
      // Timeouts are never converted into a failed result or retried.
      if (err instanceof ActTimeoutError) {
        throw err;
      }
      const msg = err instanceof Error ? err.message : String(err);

      // Attempt self-heal: rerun actInference and retry with updated selector
      if (this.selfHeal) {
        v3Logger({
          category: "action",
          message:
            "Error performing action. Reprocessing the page and trying again",
          level: 1,
          auxiliary: {
            error: { value: msg, type: "string" },
            action: {
              value: JSON.stringify(action),
              type: "object",
            },
          },
        });

        try {
          // Build an instruction combining method + description, avoiding duplication
          const actCommand = action.description
            ? action.description.toLowerCase().startsWith(method.toLowerCase())
              ? action.description
              : `${method} ${action.description}`
            : method;

          // Take a fresh snapshot and ask for a new actionable element
          ensureTimeRemaining?.();
          const { combinedTree, combinedXpathMap } =
            await captureHybridSnapshot(page, {
              experimental: true,
            });

          const instruction = buildActPrompt(
            actCommand,
            Object.values(SupportedUnderstudyAction),
            {},
          );

          // Only the selector is needed from this inference, so a missing
          // method/arguments must not discard the element.
          ensureTimeRemaining?.();
          const { action: fallbackAction, response: fallbackResponse } =
            await this.getActionFromLLM({
              instruction,
              domElements: combinedTree,
              xpathMap: combinedXpathMap,
              llmClient: effectiveClient,
              requireMethodAndArguments: false,
            });

          const fallbackElement = fallbackResponse.element;
          if (!fallbackElement) {
            return {
              success: false,
              message:
                "Failed to self-heal act: No observe results found for action",
              actionDescription: actCommand,
              actions: [],
            };
          }

          // Retry with original method/args but new selector from fallback
          let newSelector = action.selector;
          if (fallbackAction?.selector) {
            newSelector = fallbackAction.selector;
          }

          ensureTimeRemaining?.();
          await performUnderstudyMethod(
            page,
            page.mainFrame(),
            method,
            newSelector,
            resolvedArgs,
            settleTimeout,
          );

          return {
            success: true,
            message: `Action [${method}] performed successfully on selector: ${newSelector}`,
            actionDescription: action.description || `action (${method})`,
            actions: [
              {
                selector: newSelector,
                description: action.description || `action (${method})`,
                method,
                arguments: placeholderArgs,
              },
            ],
          };
        } catch (retryErr) {
          if (retryErr instanceof ActTimeoutError) {
            throw retryErr;
          }
          const retryMsg =
            retryErr instanceof Error ? retryErr.message : String(retryErr);
          return {
            success: false,
            message: `Failed to perform act after self-heal: ${retryMsg}`,
            actionDescription: action.description || `action (${method})`,
            actions: [],
          };
        }
      }

      return {
        success: false,
        message: `Failed to perform act: ${msg}`,
        actionDescription: action.description || `action (${method})`,
        actions: [],
      };
    }
  }
}

/**
 * Converts the element returned by act inference into an `Action`, or returns
 * `undefined` when the element cannot be acted upon.
 *
 * An element is rejected when:
 *  - it is missing;
 *  - `requireMethodAndArguments` is set and the method is absent, is
 *    "not-supported", or the arguments are not an array;
 *  - its id is not a string containing "-", or has no xpath in `xpathMap`;
 *  - it is a dragAndDrop whose first argument is not a resolvable element id.
 *
 * For dragAndDrop, the first argument (target element id) is rewritten to an
 * `xpath=` selector.
 */
function normalizeActInferenceElement(
  element: ActInferenceElement | undefined,
  xpathMap: Record<string, string>,
  requireMethodAndArguments = true,
): Action | undefined {
  if (!element) {
    return undefined;
  }

  const { elementId, description, method } = element;
  const argList = Array.isArray(element.arguments)
    ? element.arguments
    : undefined;

  if (requireMethodAndArguments) {
    const methodUsable = !!method && method !== "not-supported";
    if (!methodUsable || argList === undefined) {
      return undefined;
    }
  }

  const idLooksEncoded = typeof elementId === "string" && elementId.includes("-");
  if (!idLooksEncoded) {
    return undefined;
  }

  const sourceXpath = trimTrailingTextNode(xpathMap[elementId as EncodedId]);
  if (!sourceXpath) {
    return undefined;
  }

  let finalArgs = argList;

  // dragAndDrop carries the drop target as an element id (e.g. "1-67") in its
  // first argument; translate it to an xpath selector or drop the action.
  if (method === "dragAndDrop" && argList !== undefined && argList.length > 0) {
    const [dropTarget, ...remaining] = argList;

    if (typeof dropTarget !== "string" || !/^\d+-\d+$/.test(dropTarget)) {
      v3Logger({
        category: "action",
        message: "dragAndDrop target element invalid ID format",
        level: 0,
        auxiliary: {
          targetElementId: { value: String(dropTarget), type: "string" },
          sourceElementId: { value: elementId, type: "string" },
        },
      });
      return undefined;
    }

    const targetXpath = trimTrailingTextNode(xpathMap[dropTarget as EncodedId]);
    if (!targetXpath) {
      // Target element lookup failed, filter out this action
      v3Logger({
        category: "action",
        message: "dragAndDrop target element lookup failed",
        level: 1,
        auxiliary: {
          targetElementId: { value: dropTarget, type: "string" },
          sourceElementId: { value: elementId, type: "string" },
        },
      });
      return undefined;
    }

    finalArgs = [`xpath=${targetXpath}`, ...remaining];
  }

  return {
    description,
    method,
    arguments: finalArgs,
    selector: `xpath=${sourceXpath}`,
  } as Action;
}

/**
 * Replaces every `%name%` placeholder in each argument with the resolved
 * value of the matching variable.
 *
 * Variables are applied one after another in `Object.entries` order. When
 * `variables` is missing or `args` is not an array, `args` is returned
 * untouched (same reference); otherwise a new array is returned.
 */
function substituteVariablesInArguments(
  args: string[] | undefined,
  variables?: Variables,
): string[] | undefined {
  const canSubstitute = !!variables && Array.isArray(args);
  if (!canSubstitute) {
    return args;
  }

  const entries = Object.entries(variables);
  return args.map((arg: string) =>
    entries.reduce(
      // split/join replaces all occurrences literally (no regex or `$` semantics).
      (text, [name, value]) =>
        text.split(`%${name}%`).join(resolveVariableValue(value)),
      arg,
    ),
  );
}


================================================
FILE: packages/core/lib/v3/handlers/extractHandler.ts
================================================
// lib/v3/handlers/extractHandler.ts
import { extract as runExtract } from "../../inference.js";
import {
  getZFactory,
  getZodType,
  injectUrls,
  transformSchema,
} from "../../utils.js";
import { v3Logger } from "../logger.js";
import { V3FunctionName } from "../types/public/methods.js";
import { captureHybridSnapshot } from "../understudy/a11y/snapshot/index.js";
import type { ZodTypeAny } from "zod";
import { LLMClient } from "../llm/LLMClient.js";
import { ExtractHandlerParams } from "../types/private/handlers.js";
import { EncodedId, ZodPathSegments } from "../types/private/internal.js";
import {
  defaultExtractSchema,
  pageTextSchema,
} from "../types/public/methods.js";
import {
  AvailableModel,
  ClientOptions,
  ModelConfiguration,
} from "../types/public/model.js";
import {
  StagehandInvalidArgumentError,
  ExtractTimeoutError,
} from "../types/public/sdkErrors.js";
import { createTimeoutGuard } from "./handlerUtils/timeoutGuard.js";
import type {
  InferStagehandSchema,
  StagehandZodObject,
  StagehandZodSchema,
} from "../zodCompat.js";

/**
 * Rewrites a Zod schema so that its `z.string().url()` fields become
 * `z.number()` fields, by delegating to `transformSchema` starting from an
 * empty path.
 *
 * @param schema - The Zod schema to transform.
 * @returns A two-element tuple:
 *   1. the transformed schema (or the original one when nothing had to change);
 *   2. the {@link ZodPathSegments} of every URL field that was replaced, each
 *      describing where in the schema the replacement happened.
 */
export function transformUrlStringsToNumericIds<T extends StagehandZodSchema>(
  schema: T,
): [StagehandZodSchema, ZodPathSegments[]] {
  const transformed = transformSchema(schema, []);
  return [transformed[0], transformed[1]];
}

/**
 * Bookkeeping fields that accompany the extracted data in the response of the
 * extract inference call. `ExtractHandler.extract` strips these off before
 * returning the remaining fields as the extraction output.
 */
interface ExtractionResponseBase {
  // `completed` selects which completion message is logged after extraction.
  metadata: { completed: boolean };
  prompt_tokens: number;
  completion_tokens: number;
  reasoning_tokens: number;
  // Optional; treated as 0 by the handler when absent.
  cached_input_tokens?: number;
  inference_time_ms: number;
}

// Full extract inference response: the bookkeeping fields plus the data
// fields inferred from the object schema `T`.
type ExtractionResponse<T extends StagehandZodObject> = ExtractionResponseBase &
  InferStagehandSchema<T>;

/**
 * Handles `extract` requests: snapshots the page and either returns the raw
 * page text or asks the LLM to extract data matching a schema.
 */
export class ExtractHandler {
  private readonly llmClient: LLMClient;
  private readonly defaultModelName: AvailableModel;
  private readonly defaultClientOptions: ClientOptions;
  private readonly resolveLlmClient: (model?: ModelConfiguration) => LLMClient;
  private readonly systemPrompt: string;
  private readonly logInferenceToFile: boolean;
  private readonly experimental: boolean;
  private readonly onMetrics?: (
    functionName: V3FunctionName,
    promptTokens: number,
    completionTokens: number,
    reasoningTokens: number,
    cachedInputTokens: number,
    inferenceTimeMs: number,
  ) => void;

  /**
   * @param llmClient - Stored on the instance; not read by this class.
   * @param defaultModelName - Stored on the instance; not read by this class.
   * @param defaultClientOptions - Stored on the instance; not read by this class.
   * @param resolveLlmClient - Maps an optional per-call model configuration to a client.
   * @param systemPrompt - User-provided instructions forwarded to inference (defaults to "").
   * @param logInferenceToFile - Forwarded to inference (defaults to false).
   * @param experimental - Forwarded to snapshot capture (defaults to false).
   * @param onMetrics - Optional callback receiving token/latency metrics per inference call.
   */
  constructor(
    llmClient: LLMClient,
    defaultModelName: AvailableModel,
    defaultClientOptions: ClientOptions,
    resolveLlmClient: (model?: ModelConfiguration) => LLMClient,
    systemPrompt?: string,
    logInferenceToFile?: boolean,
    experimental?: boolean,
    onMetrics?: (
      functionName: V3FunctionName,
      promptTokens: number,
      completionTokens: number,
      reasoningTokens: number,
      cachedInputTokens: number,
      inferenceTimeMs: number,
    ) => void,
  ) {
    this.llmClient = llmClient;
    this.defaultModelName = defaultModelName;
    this.defaultClientOptions = defaultClientOptions;
    this.resolveLlmClient = resolveLlmClient;
    this.systemPrompt = systemPrompt ?? "";
    this.logInferenceToFile = logInferenceToFile ?? false;
    this.experimental = experimental ?? false;
    this.onMetrics = onMetrics;
  }

  /**
   * Extracts data from the page.
   *
   * - With neither `instruction` nor `schema`: returns `{ pageText }` holding
   *   the snapshot's combined tree.
   * - With an `instruction` (and optionally a `schema`): runs LLM extraction.
   *   Without a schema, `defaultExtractSchema` is used. Non-object schemas are
   *   wrapped in an object under the key "value" for inference and unwrapped
   *   again before returning. URL fields are swapped for numeric ids during
   *   inference and re-injected from the snapshot's URL map afterwards.
   *
   * An optional `selector` (with or without an `xpath=` prefix, matched
   * case-insensitively) limits the snapshot to that element.
   *
   * @throws StagehandInvalidArgumentError - When a schema is given without an instruction.
   * @throws ExtractTimeoutError - Created by the timeout guard built from `timeout`
   *   (presumably thrown once the budget is exhausted — see `createTimeoutGuard`).
   */
  async extract<T extends StagehandZodSchema>(
    params: ExtractHandlerParams<T>,
  ): Promise<InferStagehandSchema<T> | { pageText: string }> {
    const { instruction, schema, page, selector, timeout, model } = params;

    const llmClient = this.resolveLlmClient(model);

    const ensureTimeRemaining = createTimeoutGuard(
      timeout,
      (ms) => new ExtractTimeoutError(ms),
    );

    // Strip the optional "xpath=" prefix once, case-insensitively, so both the
    // page-text path and the inference path treat selectors identically.
    const focusSelector = selector?.replace(/^xpath=/i, "") ?? "";

    // No-args → page text (parity with v2)
    const noArgs = !instruction && !schema;
    if (noArgs) {
      ensureTimeRemaining();
      const snap = await captureHybridSnapshot(page, {
        experimental: this.experimental,
        focusSelector: focusSelector || undefined,
      });
      ensureTimeRemaining();

      const result = { pageText: snap.combinedTree };
      // Validate via the same schema used in v2
      return pageTextSchema.parse(result);
    }

    if (!instruction && schema) {
      throw new StagehandInvalidArgumentError(
        "extract() requires an instruction when a schema is provided.",
      );
    }

    // Build the hybrid snapshot (includes combinedTree; combinedUrlMap optional)
    ensureTimeRemaining();
    const { combinedTree, combinedUrlMap } = await captureHybridSnapshot(page, {
      experimental: this.experimental,
      focusSelector: focusSelector,
    });

    v3Logger({
      category: "extraction",
      message: "Starting extraction using a11y snapshot",
      level: 1,
      auxiliary: instruction
        ? { instruction: { value: instruction, type: "string" } }
        : undefined,
    });

    // Normalize schema: if instruction provided without schema, use defaultExtractSchema
    const baseSchema: StagehandZodSchema = (schema ??
      defaultExtractSchema) as StagehandZodSchema;
    // Ensure we pass an object schema into inference; wrap non-object schemas
    const isObjectSchema = getZodType(baseSchema) === "object";
    const WRAP_KEY = "value" as const;
    const factory = getZFactory(baseSchema);
    const objectSchema: StagehandZodObject = isObjectSchema
      ? (baseSchema as StagehandZodObject)
      : (factory.object({
          [WRAP_KEY]: baseSchema as ZodTypeAny,
        }) as StagehandZodObject);

    const [transformedSchema, urlFieldPaths] =
      transformUrlStringsToNumericIds(objectSchema);

    ensureTimeRemaining();
    const extractionResponse: ExtractionResponse<StagehandZodObject> =
      await runExtract<StagehandZodObject>({
        instruction,
        domElements: combinedTree,
        schema: transformedSchema as StagehandZodObject,
        llmClient,
        userProvidedInstructions: this.systemPrompt,
        logger: v3Logger,
        logInferenceToFile: this.logInferenceToFile,
      });

    // Separate the bookkeeping fields from the extracted data (`rest`).
    const {
      metadata: { completed },
      prompt_tokens,
      completion_tokens,
      reasoning_tokens = 0,
      cached_input_tokens = 0,
      inference_time_ms,
      ...rest
    } = extractionResponse;
    let output = rest as InferStagehandSchema<StagehandZodObject>;

    // Update EXTRACT metrics from the LLM calls
    this.onMetrics?.(
      V3FunctionName.EXTRACT,
      prompt_tokens,
      completion_tokens,
      reasoning_tokens,
      cached_input_tokens,
      inference_time_ms,
    );

    // Re-inject URLs for any url() fields we temporarily converted to number()
    const idToUrl: Record<EncodedId, string> = (combinedUrlMap ?? {}) as Record<
      EncodedId,
      string
    >;
    for (const { segments } of urlFieldPaths) {
      injectUrls(
        output as Record<string, unknown>,
        segments,
        idToUrl as unknown as Record<string, string>,
      );
    }
    // If we wrapped a non-object schema, unwrap the value
    if (!isObjectSchema && output && typeof output === "object") {
      output = (output as Record<string, unknown>)[WRAP_KEY];
    }

    // Log only a bounded preview of the result to keep log lines short.
    const resultPreviewLength = 200;
    const resultString = JSON.stringify(output) ?? "undefined";
    const resultPreview =
      resultString.length > resultPreviewLength
        ? resultString.slice(0, resultPreviewLength) + "..."
        : resultString;

    v3Logger({
      category: "extraction",
      message: completed
        ? "Extraction completed successfully"
        : "Extraction incomplete after processing all data",
      level: 1,
      auxiliary: {
        prompt_tokens: { value: String(prompt_tokens), type: "string" },
        completion_tokens: { value: String(completion_tokens), type: "string" },
        inference_time_ms: {
          value: String(inference_time_ms),
          type: "string",
        },
        result: { value: resultPreview, type: "string" },
      },
    });

    return output as InferStagehandSchema<T>;
  }
}


================================================
FILE: packages/core/lib/v3/handlers/handlerUtils/actHandlerUtils.ts
================================================
// lib/v3/handlers/handlerUtils/actHandlerUtils.ts
import { Protocol } from "devtools-protocol";
import { Frame } from "../../understudy/frame.js";
import { Locator } from "../../understudy/locator.js";
import { MouseButton } from "../../types/public/locator.js";
import { resolveLocatorWithHops } from "../../understudy/deepLocator.js";
import type { Page } from "../../understudy/page.js";
import { v3Logger } from "../../logger.js";
import { FlowLogger } from "../../flowlogger/FlowLogger.js";
import { toTitleCase } from "../../../utils.js";
import {
  StagehandClickError,
  UnderstudyCommandException,
} from "../../types/public/sdkErrors.js";

/**
 * Everything a method handler receives from `performUnderstudyMethod` for a
 * single action invocation.
 */
export interface UnderstudyMethodHandlerContext {
  // Name of the method being performed (the key used to pick the handler).
  method: string;
  // Locator resolved from the selector via `resolveLocatorWithHops`.
  locator: Locator;
  // The selector after root normalization ("/" → "/html"); used mainly for logging.
  xpath: string;
  // Action arguments, stringified; null/undefined entries become "".
  args: ReadonlyArray<string>;
  // Frame the action was started from.
  frame: Frame;
  page: Page;
  // URL of `frame` captured before the handler runs.
  initialUrl: string;
  // Optional DOM settle timeout passed through from the caller.
  domSettleTimeoutMs?: number;
}

/**
 * Maps a selector that addresses the bare document root to the `<html>`
 * element: "/" becomes "/html" and "xpath=/" (any letter case) becomes
 * "xpath=/html". Any other selector is returned trimmed; null/undefined
 * input yields "".
 */
function normalizeRootXPath(input: string): string {
  const trimmed = String(input ?? "").trim();
  if (trimmed === "/") {
    return "/html";
  }
  return /^xpath=\/$/i.test(trimmed) ? "xpath=/html" : trimmed;
}

/**
 * Resolves a selector to a locator and runs the handler registered for
 * `method` against it, inside a `FlowLogger.runWithLogging` scope.
 *
 * @param page - Page the action belongs to.
 * @param frame - Frame to start resolving the selector from.
 * @param method - Handler name; must be an own key of `METHOD_HANDLER_MAP`.
 * @param rawXPath - Selector; a bare root ("/" or "xpath=/") is normalized to `<html>`.
 * @param args - Action arguments; stringified before reaching the handler
 *   (null/undefined become "").
 * @param domSettleTimeoutMs - Optional settle timeout made available to the handler.
 * @throws UnderstudyCommandException - For unknown methods and for any error
 *   raised while resolving the locator or running the handler (errors that
 *   are already `UnderstudyCommandException` are rethrown unchanged).
 */
export async function performUnderstudyMethod(
  page: Page,
  frame: Frame,
  method: string,
  rawXPath: string,
  args: ReadonlyArray<unknown>,
  domSettleTimeoutMs?: number,
): Promise<void> {
  const selectorRaw = normalizeRootXPath(rawXPath);

  try {
    await FlowLogger.runWithLogging(
      {
        eventType: `Understudy${toTitleCase(method)}`, // e.g. "UnderstudyClick"
        data: {
          target: selectorRaw,
        },
      },
      async () => {
        // Unified resolver: supports '>>' hops and XPath across iframes.
        const locator: Locator = await resolveLocatorWithHops(
          page,
          frame,
          selectorRaw,
        );
        const initialUrl = await getFrameUrl(frame);

        v3Logger({
          category: "action",
          message: "performing understudy method",
          level: 2,
          auxiliary: {
            xpath: { value: selectorRaw, type: "string" },
            method: { value: method, type: "string" },
            url: { value: initialUrl, type: "string" },
          },
        });

        const ctx: UnderstudyMethodHandlerContext = {
          method,
          locator,
          xpath: selectorRaw,
          args: args.map((a) => (a == null ? "" : String(a))),
          frame,
          page,
          initialUrl,
          domSettleTimeoutMs,
        };

        // Only accept handlers registered directly on the map. A plain index
        // lookup would also find inherited Object.prototype members (e.g.
        // "toString", "constructor"), which would then be invoked as if they
        // were handlers and make an unsupported method appear to succeed.
        const handler = Object.prototype.hasOwnProperty.call(
          METHOD_HANDLER_MAP,
          method,
        )
          ? METHOD_HANDLER_MAP[method]
          : undefined;

        if (handler) {
          await handler(ctx);
          return;
        }

        v3Logger({
          category: "action",
          message: "chosen method is invalid",
          level: 1,
          auxiliary: { method: { value: method, type: "string" } },
        });
        throw new UnderstudyCommandException(`Method ${method} not supported`);
      },
      args,
    );
  } catch (e) {
    const msg = e instanceof Error ? e.message : String(e);
    const stack = e instanceof Error ? e.stack : undefined;
    v3Logger({
      category: "action",
      message: "error performing method",
      level: 1,
      auxiliary: {
        error: { value: msg, type: "string" },
        trace: { value: stack ?? "", type: "string" },
        method: { value: method, type: "string" },
        xpath: { value: selectorRaw, type: "string" },
        args: { value: JSON.stringify(args), type: "object" },
      },
    });
    // Preserve already-wrapped errors; wrap everything else with its cause.
    if (e instanceof UnderstudyCommandException) {
      throw e;
    }
    throw new UnderstudyCommandException(msg, e);
  }
}

/* ===================== Handlers & Map ===================== */

/**
 * Dispatch table from method name to the handler that performs it. Several
 * names are aliases that share one handler.
 */
const METHOD_HANDLER_MAP: Record<
  string,
  (ctx: UnderstudyMethodHandlerContext) => Promise<void>
> = {
  // Scrolling
  scrollIntoView: scrollIntoView,
  scrollByPixelOffset: scrollByPixelOffset,
  scrollTo: scrollElementToPercentage,
  scroll: scrollElementToPercentage,
  "mouse.wheel": wheelScroll,
  nextChunk: scrollToNextChunk,
  prevChunk: scrollToPreviousChunk,

  // Keyboard / text input
  fill: fillOrType,
  type: typeText,
  press: pressKey,

  // Pointer
  click: clickElement,
  doubleClick: doubleClick,
  dragAndDrop: dragAndDrop,
  hover: hover,

  // Dropdowns
  selectOptionFromDropdown: selectOption,
  selectOption: selectOption,
};

/**
 * Selects an option on the located element, using the first argument as the
 * option text (empty string when absent).
 *
 * @throws UnderstudyCommandException - Wrapping any error raised while selecting.
 */
export async function selectOption(ctx: UnderstudyMethodHandlerContext) {
  try {
    const optionText = ctx.args[0]?.toString() || "";
    await ctx.locator.selectOption(optionText);
  } catch (cause) {
    const isError = cause instanceof Error;
    const reason = isError ? cause.message : String(cause);
    const trace = isError ? cause.stack : undefined;
    v3Logger({
      category: "action",
      message: "error selecting option",
      level: 0,
      auxiliary: {
        error: { value: reason, type: "string" },
        trace: { value: trace ?? "", type: "string" },
        xpath: { value: ctx.xpath, type: "string" },
      },
    });
    throw new UnderstudyCommandException(reason, cause);
  }
}

/**
 * Scrolls the located element into view via the CDP
 * `DOM.scrollIntoViewIfNeeded` command, sent on the session of the frame that
 * owns the locator.
 *
 * The remote object handle obtained from `resolveNode()` is released
 * afterwards whether or not the scroll command succeeds; a failure to
 * release is deliberately ignored (best-effort cleanup).
 */
async function scrollIntoView(
  ctx: UnderstudyMethodHandlerContext,
): Promise<void> {
  const { locator, xpath } = ctx;
  v3Logger({
    category: "action",
    message: "scrolling element into view",
    level: 2,
    auxiliary: { xpath: { value: xpath, type: "string" } },
  });
  const { objectId } = await locator.resolveNode();
  const ownerSession = locator.getFrame().session;
  try {
    await ownerSession.send("DOM.scrollIntoViewIfNeeded", { objectId });
  } finally {
    // Release in `finally` so a failed scroll does not leak the handle.
    await ownerSession
      .send("Runtime.releaseObject", { objectId })
      .catch(() => {});
  }
}

/**
 * Scrolls the located element to the position given by the first argument,
 * falling back to "0%" when no argument was supplied.
 */
async function scrollElementToPercentage(
  ctx: UnderstudyMethodHandlerContext,
): Promise<void> {
  v3Logger({
    category: "action",
    message: "scrolling element vertically to specified percentage",
    level: 2,
    auxiliary: {
      xpath: { value: ctx.xpath, type: "string" },
      coordinate: { value: JSON.stringify(ctx.args), type: "string" },
    },
  });

  const requested = ctx.args[0];
  const target = requested === undefined ? "0%" : requested;
  await ctx.locator.scrollTo(target);
}

/**
 * Scrolls by a pixel offset, anchored at the centroid of the located element.
 * The first two arguments are the horizontal and vertical deltas (each
 * defaults to 0 when absent).
 *
 * @throws UnderstudyCommandException - Wrapping any error from locating or scrolling.
 */
async function scrollByPixelOffset(
  ctx: UnderstudyMethodHandlerContext,
): Promise<void> {
  const deltaX = Number(ctx.args[0] ?? 0);
  const deltaY = Number(ctx.args[1] ?? 0);

  try {
    const center = await ctx.locator.centroid();
    await ctx.page.scroll(center.x, center.y, deltaX, deltaY);
  } catch (cause) {
    const reason = cause instanceof Error ? cause.message : String(cause);
    throw new UnderstudyCommandException(reason, cause);
  }
}

/**
 * Dispatches a vertical mouse-wheel event at viewport position (0, 0) on the
 * frame's session. The first argument is the vertical delta (200 when absent).
 */
async function wheelScroll(ctx: UnderstudyMethodHandlerContext): Promise<void> {
  const verticalDelta = Number(ctx.args[0] ?? 200);

  v3Logger({
    category: "action",
    message: "dispatching mouse wheel",
    level: 2,
    auxiliary: { deltaY: { value: String(verticalDelta), type: "string" } },
  });

  const wheelEvent = {
    type: "mouseWheel",
    x: 0,
    y: 0,
    deltaY: verticalDelta,
    deltaX: 0,
  } as Protocol.Input.DispatchMouseEventRequest;
  await ctx.frame.session.send<never>("Input.dispatchMouseEvent", wheelEvent);
}

/**
 * Clears the located element and then fills it with the first argument
 * (empty string when absent).
 *
 * @throws UnderstudyCommandException - Wrapping any error raised while filling.
 */
async function fillOrType(ctx: UnderstudyMethodHandlerContext): Promise<void> {
  try {
    // Clear any existing content first, then write the new value.
    await ctx.locator.fill("");
    await ctx.locator.fill(ctx.args[0] ?? "");
  } catch (cause) {
    const reason = cause instanceof Error ? cause.message : String(cause);
    v3Logger({
      category: "action",
      message: "error filling element",
      level: 1,
      auxiliary: {
        error: { value: reason, type: "string" },
        xpath: { value: ctx.xpath, type: "string" },
      },
    });
    throw new UnderstudyCommandException(reason, cause);
  }
}

/**
 * Types the first argument (empty string when absent) into the located
 * element.
 *
 * @throws UnderstudyCommandException - Wrapping any error raised while typing.
 */
async function typeText(ctx: UnderstudyMethodHandlerContext): Promise<void> {
  try {
    const text = ctx.args[0] ?? "";
    await ctx.locator.type(text);
  } catch (cause) {
    const reason = cause instanceof Error ? cause.message : String(cause);
    v3Logger({
      category: "action",
      message: "error typing into element",
      level: 1,
      auxiliary: {
        error: { value: reason, type: "string" },
        xpath: { value: ctx.xpath, type: "string" },
      },
    });
    throw new UnderstudyCommandException(reason, cause);
  }
}

/**
 * Presses the key named by `args[0]` (empty string when absent) through
 * `page.keyPress`. The key press is issued at page level; the xpath is only
 * used for logging.
 *
 * On failure the error is logged and rethrown as an
 * `UnderstudyCommandException`.
 */
async function pressKey(ctx: UnderstudyMethodHandlerContext): Promise<void> {
  const { args, xpath, page } = ctx;
  const requestedKey = args[0] ?? "";

  try {
    v3Logger({
      category: "action",
      message: "pressing key",
      level: 1,
      auxiliary: {
        key: { value: requestedKey, type: "string" },
        xpath: { value: xpath, type: "string" },
      },
    });
    await page.keyPress(requestedKey);
  } catch (err) {
    const reason = err instanceof Error ? err.message : String(err);
    v3Logger({
      category: "action",
      message: "error pressing key",
      level: 1,
      auxiliary: {
        error: { value: reason, type: "string" },
        key: { value: requestedKey, type: "string" },
        xpath: { value: xpath, type: "string" },
      },
    });
    throw new UnderstudyCommandException(reason, err);
  }
}

/**
 * Clicks the target element. `args[0]`, when non-empty, selects the mouse
 * button; otherwise the button is left undefined so the locator's default
 * applies.
 *
 * On failure the error is logged and a `StagehandClickError` is thrown with
 * the element's xpath and the failure message.
 */
async function clickElement(
  ctx: UnderstudyMethodHandlerContext,
): Promise<void> {
  const { locator, xpath, args } = ctx;
  try {
    const button = (args[0] as MouseButton) || undefined;
    await locator.click({ button });
  } catch (err) {
    const reason = err instanceof Error ? err.message : String(err);
    v3Logger({
      category: "action",
      message: "error performing click",
      level: 0,
      auxiliary: {
        error: { value: reason, type: "string" },
        xpath: { value: xpath, type: "string" },
      },
    });
    throw new StagehandClickError(xpath, reason);
  }
}

/**
 * Double-clicks the target element by issuing a click with `clickCount: 2`.
 *
 * On failure the error is logged with the element's xpath and rethrown as an
 * `UnderstudyCommandException`.
 */
async function doubleClick(ctx: UnderstudyMethodHandlerContext): Promise<void> {
  const { locator, xpath } = ctx;
  const doubleClickOptions = { clickCount: 2 };

  try {
    await locator.click(doubleClickOptions);
  } catch (err) {
    const reason = err instanceof Error ? err.message : String(err);
    v3Logger({
      category: "action",
      message: "error performing doubleClick",
      level: 0,
      auxiliary: {
        error: { value: reason, type: "string" },
        xpath: { value: xpath, type: "string" },
      },
    });
    throw new UnderstudyCommandException(reason, err);
  }
}

/**
 * Drags from the centre of the context's element to the centre of the element
 * addressed by `args[0]` (an XPath, resolved with `resolveLocatorWithHops`).
 *
 * Both centres are first obtained from each locator's `centroid()`, then
 * translated inside the owning frame into coordinates relative to the top
 * window by accumulating the offsets of every enclosing frame element. The
 * drag itself is performed through `page.dragAndDrop` in 10 steps with a
 * delay of 5.
 *
 * Throws `UnderstudyCommandException` when no target XPath is supplied or when
 * any step of the drag fails (the failure is logged first).
 */
async function dragAndDrop(ctx: UnderstudyMethodHandlerContext): Promise<void> {
  const { page, frame, locator: sourceLocator, args, xpath } = ctx;

  const toXPath = String(args[0] ?? "").trim();
  if (toXPath.length === 0) {
    throw new UnderstudyCommandException(
      "dragAndDrop requires a target XPath arg",
    );
  }

  const targetLocator = await resolveLocatorWithHops(page, frame, toXPath);

  type Point = { x: number; y: number };

  // Executed inside the owning frame, so it must stay self-contained: walks up
  // the window chain adding each host frame element's top-left offset.
  const localToMainViewport = ({ x, y }: Point): Point => {
    let absX = x;
    let absY = y;
    let win: Window = window;
    while (win !== win.top) {
      const host = win.frameElement as HTMLElement | null;
      if (!host) break;
      const rect = host.getBoundingClientRect();
      absX += rect.left;
      absY += rect.top;
      win = win.parent as Window;
    }
    return { x: Math.round(absX), y: Math.round(absY) };
  };

  try {
    // Element centres, each relative to its own frame's viewport.
    const sourceCentre = await sourceLocator.centroid();
    const targetCentre = await targetLocator.centroid();

    // Same points, expressed relative to the top-level viewport.
    const fromAbs = await sourceLocator
      .getFrame()
      .evaluate<Point, Point>(localToMainViewport, {
        x: sourceCentre.x,
        y: sourceCentre.y,
      });
    const toAbs = await targetLocator
      .getFrame()
      .evaluate<Point, Point>(localToMainViewport, {
        x: targetCentre.x,
        y: targetCentre.y,
      });

    // The drag gesture itself is driven from the page.
    const dragOptions = { steps: 10, delay: 5 };
    await page.dragAndDrop(fromAbs.x, fromAbs.y, toAbs.x, toAbs.y, dragOptions);
  } catch (err) {
    const reason = err instanceof Error ? err.message : String(err);
    v3Logger({
      category: "action",
      message: "error performing dragAndDrop",
      level: 0,
      auxiliary: {
        error: { value: reason, type: "string" },
        from: { value: xpath, type: "string" },
        to: { value: toXPath, type: "string" },
      },
    });
    throw new UnderstudyCommandException(reason, err);
  }
}

/** Scrolls the target one chunk forward (direction `1`). */
async function scrollToNextChunk(
  ctx: UnderstudyMethodHandlerContext,
): Promise<void> {
  const forward = 1;
  return scrollByElementHeight(ctx, forward);
}

/** Scrolls the target one chunk backward (direction `-1`). */
async function scrollToPreviousChunk(
  ctx: UnderstudyMethodHandlerContext,
): Promise<void> {
  const backward = -1;
  return scrollByElementHeight(ctx, backward);
}

/**
 * Smooth-scrolls the target by one "chunk" in the given direction.
 *
 * The scroll runs inside the page via `Runtime.callFunctionOn` against the
 * resolved node: for `<html>`/`<body>` the window is scrolled by the visual
 * viewport height (falling back to `innerHeight`); for any other element the
 * element is scrolled by its own bounding-box height. The injected function
 * resolves once `scrollTop` reads the same value on two consecutive animation
 * frames. The remote object handle is always released afterwards, and release
 * failures are ignored.
 *
 * @param direction `1` for the next chunk, `-1` for the previous one.
 */
async function scrollByElementHeight(
  ctx: UnderstudyMethodHandlerContext,
  direction: 1 | -1,
): Promise<void> {
  const { locator, xpath } = ctx;

  let logMessage: string;
  if (direction > 0) {
    logMessage = "scrolling to next chunk";
  } else {
    logMessage = "scrolling to previous chunk";
  }
  v3Logger({
    category: "action",
    message: logMessage,
    level: 2,
    auxiliary: { xpath: { value: xpath, type: "string" } },
  });

  const { objectId } = await locator.resolveNode();
  try {
    const session = locator.getFrame().session;
    await session.send<Protocol.Runtime.CallFunctionOnResponse>(
      "Runtime.callFunctionOn",
      {
        objectId,
        functionDeclaration: `
          function(dir) {
            const waitForScrollEnd = (el) => new Promise((resolve) => {
              let last = el.scrollTop ?? 0;
              const check = () => {
                const cur = el.scrollTop ?? 0;
                if (cur === last) return resolve();
                last = cur;
                requestAnimationFrame(check);
              };
              requestAnimationFrame(check);
            });

            const tag = this.tagName?.toLowerCase();
            if (tag === "html" || tag === "body") {
              const h = window.visualViewport?.height ?? window.innerHeight;
              window.scrollBy({ top: h * dir, left: 0, behavior: "smooth" });
              const root = document.scrollingElement ?? document.documentElement;
              return waitForScrollEnd(root);
            }
            const h = this.getBoundingClientRect().height;
            this.scrollBy({ top: h * dir, left: 0, behavior: "smooth" });
            return waitForScrollEnd(this);
          }
        `,
        arguments: [{ value: direction }],
        awaitPromise: true,
        returnByValue: true,
      },
    );
  } finally {
    // Release the remote handle whether or not the scroll succeeded.
    const releaseSession = locator.getFrame().session;
    await releaseSession
      .send("Runtime.releaseObject", { objectId })
      .catch(() => {});
  }
}

/**
 * Hovers over the target element via `locator.hover`.
 *
 * On failure the message, stack trace (empty string when unavailable) and
 * xpath are logged, and the error is rethrown as an
 * `UnderstudyCommandException`.
 */
export async function hover(ctx: UnderstudyMethodHandlerContext) {
  const { locator, xpath } = ctx;
  try {
    await locator.hover();
  } catch (err) {
    const isError = err instanceof Error;
    const reason = isError ? err.message : String(err);
    const trace = isError ? (err.stack ?? "") : "";
    v3Logger({
      category: "action",
      message: "error attempting to hover",
      level: 0,
      auxiliary: {
        error: { value: reason, type: "string" },
        trace: { value: trace, type: "string" },
        xpath: { value: xpath, type: "string" },
      },
    });
    throw new UnderstudyCommandException(reason, err);
  }
}

/* ===================== Helpers ===================== */

/** Returns the frame's current URL by evaluating `location.href` in it. */
async function getFrameUrl(frame: Frame): Promise<string> {
  return frame.evaluate<string>("location.href");
}

/**
 * Waits until the frame's document is available and its network activity has
 * gone quiet, using CDP Network and Page events on the frame's session.
 *
 * "Quiet" means no tracked requests have been in flight for 500 ms. Requests
 * of type WebSocket and EventSource are not tracked, and any tracked request
 * older than 2 s is dropped by a periodic sweep so it cannot block settling.
 * If quiet is not reached within the budget, the promise still resolves (a
 * warning is logged when requests are pending); timing out is not an error.
 *
 * @param frame     Frame whose session is observed.
 * @param timeoutMs Overall budget in milliseconds. Defaults to 5000 when
 *                  omitted or not a finite number; negative values clamp to 0.
 */
export async function waitForDomNetworkQuiet(
  frame: Frame,
  timeoutMs?: number,
): Promise<void> {
  const overallTimeout =
    typeof timeoutMs === "number" && Number.isFinite(timeoutMs)
      ? Math.max(0, timeoutMs)
      : 5_000;
  const client = frame.session;
  const settleStart = Date.now();

  // Ensure a document exists; if not, wait for DOMContentLoaded on this frame.
  // A failed evaluate is treated the same as "no document yet".
  let hasDoc: boolean;
  try {
    const rs = await frame.evaluate<string>("document.readyState");
    hasDoc = rs === "interactive" || rs === "complete";
  } catch {
    hasDoc = false;
  }
  if (!hasDoc && overallTimeout > 0) {
    await frame
      .waitForLoadState("domcontentloaded", overallTimeout)
      .catch(() => {});
  }

  // Whatever the document wait consumed is subtracted from the budget; with
  // nothing left there is no point in attaching network listeners.
  const elapsed = Date.now() - settleStart;
  const remainingBudget = Math.max(0, overallTimeout - elapsed);
  if (remainingBudget === 0) {
    return;
  }

  // Domain enables are best-effort: failures are ignored.
  await client.send("Network.enable").catch(() => {});
  await client.send("Page.enable").catch(() => {});
  // Best-effort; some sessions may not support Target.setAutoAttach here.
  await client
    .send("Target.setAutoAttach", {
      autoAttach: true,
      waitForDebuggerOnStart: false,
      flatten: true,
      filter: [
        { type: "worker", exclude: true },
        { type: "shared_worker", exclude: true },
      ],
    })
    .catch(() => {});

  return new Promise<void>((resolve) => {
    // inflight:   ids of requests currently being tracked
    // meta:       per-request URL and start time (used by the stall sweep)
    // docByFrame: frameId -> requestId of that frame's Document request
    const inflight = new Set<string>();
    const meta = new Map<string, { url: string; start: number }>();
    const docByFrame = new Map<string, string>();

    let quietTimer: NodeJS.Timeout | null = null;
    let stalledRequestSweepTimer: NodeJS.Timeout | null = null;

    // Cancels a pending quiet countdown, if any.
    const clearQuiet = () => {
      if (quietTimer) {
        clearTimeout(quietTimer);
        quietTimer = null;
      }
    };

    // Starts the 500 ms quiet countdown when nothing is in flight and no
    // countdown is already running.
    const maybeQuiet = () => {
      if (inflight.size === 0 && !quietTimer)
        quietTimer = setTimeout(() => resolveDone(), 500);
    };

    // Marks a tracked request as done; unknown ids are ignored. Any running
    // quiet countdown is restarted so the 500 ms window begins from now.
    const finishReq = (id: string) => {
      if (!inflight.delete(id)) return;
      meta.delete(id);
      for (const [fid, rid] of docByFrame)
        if (rid === id) docByFrame.delete(fid);
      clearQuiet();
      maybeQuiet();
    };

    const onRequest = (p: Protocol.Network.RequestWillBeSentEvent) => {
      // Ignore long-lived streams
      // ResourceType includes: Document, XHR, Fetch, WebSocket, EventSource, etc.
      if (p.type === "WebSocket" || p.type === "EventSource") return;

      inflight.add(p.requestId);
      meta.set(p.requestId, { url: p.request.url, start: Date.now() });

      // Remember which request is loading each frame's document so that
      // Page.frameStoppedLoading can complete it.
      if (p.type === "Document" && p.frameId)
        docByFrame.set(p.frameId, p.requestId);

      // New activity cancels any quiet countdown in progress.
      clearQuiet();
    };

    const onFinish = (p: { requestId: string }) => finishReq(p.requestId);
    const onCached = (p: { requestId: string }) => finishReq(p.requestId);
    // data: URLs are completed as soon as their response is received.
    const onDataUrl = (p: Protocol.Network.ResponseReceivedEvent) => {
      if (p.response.url?.startsWith("data:")) finishReq(p.requestId);
    };

    // A frame that stopped loading completes its recorded Document request.
    const onFrameStop = (f: Protocol.Page.FrameStoppedLoadingEvent) => {
      const id = docByFrame.get(f.frameId);
      if (id) finishReq(id);
    };

    client.on("Network.requestWillBeSent", onRequest);
    client.on("Network.loadingFinished", onFinish);
    client.on("Network.loadingFailed", onFinish);
    client.on("Network.requestServedFromCache", onCached);
    client.on("Network.responseReceived", onDataUrl);
    client.on("Page.frameStoppedLoading", onFrameStop);

    // Every 500 ms, stop tracking any request that has been in flight for
    // more than 2 s, then re-check whether the quiet countdown can start.
    // Note the sweep applies to every tracked request, not only documents,
    // and does not touch docByFrame.
    stalledRequestSweepTimer = setInterval(() => {
      const now = Date.now();
      for (const [id, m] of meta) {
        if (now - m.start > 2_000) {
          inflight.delete(id);
          meta.delete(id);
          v3Logger({
            category: "dom",
            message: "⏳ forcing completion of stalled iframe document",
            level: 1,
            auxiliary: {
              url: { value: (m.url ?? "").slice(0, 120), type: "string" },
            },
          });
        }
      }
      maybeQuiet();
    }, 500);

    // Nothing is in flight yet, so this starts the initial quiet countdown.
    maybeQuiet();

    // Hard stop: once the remaining budget elapses, resolve regardless of
    // pending requests (logging how many were still in flight).
    const guard = setTimeout(() => {
      if (inflight.size) {
        v3Logger({
          category: "dom",
          message:
            "⚠️ DOM-settle timeout reached – network requests still pending",
          level: 1,
          auxiliary: {
            count: { value: String(inflight.size), type: "integer" },
          },
        });
      }
      resolveDone();
    }, remainingBudget);

    // Single exit path: detach every listener, cancel all timers, resolve.
    // It is only ever invoked from timer callbacks, i.e. after this const has
    // been initialised.
    const resolveDone = () => {
      client.off("Network.requestWillBeSent", onRequest);
      client.off("Network.loadingFinished", onFinish);
      client.off("Network.loadingFailed", onFinish);
      client.off("Network.requestServedFromCache", onCached);
      client.off("Network.responseReceived", onDataUrl);
      client.off("Page.frameStoppedLoading", onFrameStop);
      if (quietTimer) clearTimeout(quietTimer);
      if (stalledRequestSweepTimer) clearInterval(stalledRequestSweepTimer);
      clearTimeout(guard);
      resolve();
    };
  });
}


================================================
FILE: packages/core/lib/v3/handlers/handlerUtils/timeoutGuard.ts
================================================
import { TimeoutError } from "../../types/public/sdkErrors.js";

/** A check that throws once the guarded operation has run out of time. */
export type TimeoutGuard = () => void;

/**
 * Builds a guard that can be called at checkpoints of a long operation.
 *
 * The clock starts when the guard is created. Each call compares the elapsed
 * time with `timeoutMs` and throws once it has been reached. The guard never
 * interrupts work in progress; it only fails at the points where it is called.
 *
 * @param timeoutMs    Budget in milliseconds. When missing, zero, negative or
 *                     NaN the returned guard is a no-op.
 * @param errorFactory Optional producer of the error to throw; it receives
 *                     `timeoutMs`. When omitted (or when it returns a nullish
 *                     value) a `TimeoutError("operation", timeoutMs)` is thrown.
 */
export function createTimeoutGuard(
  timeoutMs?: number,
  errorFactory?: (timeoutMs: number) => Error,
): TimeoutGuard {
  if (timeoutMs === undefined || !(timeoutMs > 0)) {
    return () => {};
  }

  const limitMs = timeoutMs;
  const startedAt = Date.now();

  return () => {
    const elapsedMs = Date.now() - startedAt;
    if (elapsedMs < limitMs) {
      return;
    }
    throw errorFactory?.(limitMs) ?? new TimeoutError("operation", limitMs);
  };
}


================================================
FILE: packages/core/lib/v3/handlers/observeHandler.ts
================================================
// lib/v3/handlers/observeHandler.ts
import { observe as runObserve } from "../../inference.js";
import { trimTrailingTextNode } from "../../utils.js";
import { v3Logger } from "../logger.js";
import { V3FunctionName } from "../types/public/methods.js";
import { captureHybridSnapshot } from "../understudy/a11y/snapshot/index.js";
import { LLMClient } from "../llm/LLMClient.js";
import {
  ObserveHandlerParams,
  SupportedUnderstudyAction,
} from "../types/private/handlers.js";
import { EncodedId } from "../types/private/internal.js";
import { Action } from "../types/public/methods.js";
import {
  AvailableModel,
  ClientOptions,
  ModelConfiguration,
} from "../types/public/model.js";
import { ObserveTimeoutError } from "../types/public/sdkErrors.js";
import { createTimeoutGuard } from "./handlerUtils/timeoutGuard.js";

/** Hook invoked with token usage and latency after the observe LLM call. */
type ObserveMetricsCallback = (
  functionName: V3FunctionName,
  promptTokens: number,
  completionTokens: number,
  reasoningTokens: number,
  cachedInputTokens: number,
  inferenceTimeMs: number,
) => void;

/** Instruction used when the caller does not provide one. */
const DEFAULT_OBSERVE_INSTRUCTION =
  "Find elements that can be used for any future actions in the page. These may be navigation links, related pages, section/subsection links, buttons, or other interactive elements. Be comprehensive: if there are multiple elements that may be relevant for future actions, return all of them.";

/**
 * Implements `observe`: captures a hybrid snapshot of the page, asks the LLM
 * which elements match an instruction, and maps the returned element ids to
 * XPath selectors.
 */
export class ObserveHandler {
  private readonly llmClient: LLMClient;
  private readonly defaultModelName: AvailableModel;
  private readonly defaultClientOptions: ClientOptions;
  private readonly resolveLlmClient: (model?: ModelConfiguration) => LLMClient;
  private readonly systemPrompt: string;
  private readonly logInferenceToFile: boolean;
  private readonly experimental: boolean;
  private readonly onMetrics?: ObserveMetricsCallback;

  /**
   * @param llmClient            Default LLM client (stored on the handler).
   * @param defaultModelName     Default model name (stored on the handler).
   * @param defaultClientOptions Default client options (stored on the handler).
   * @param resolveLlmClient     Resolves the client to use for a given
   *                             per-call model configuration.
   * @param systemPrompt         User-provided instructions forwarded to the
   *                             LLM; defaults to "".
   * @param logInferenceToFile   Forwarded to the inference call; defaults to
   *                             false.
   * @param experimental         Forwarded to snapshot capture; defaults to
   *                             false.
   * @param onMetrics            Optional hook receiving usage metrics.
   */
  constructor(
    llmClient: LLMClient,
    defaultModelName: AvailableModel,
    defaultClientOptions: ClientOptions,
    resolveLlmClient: (model?: ModelConfiguration) => LLMClient,
    systemPrompt?: string,
    logInferenceToFile?: boolean,
    experimental?: boolean,
    onMetrics?: ObserveMetricsCallback,
  ) {
    // Required collaborators.
    this.llmClient = llmClient;
    this.resolveLlmClient = resolveLlmClient;
    this.defaultModelName = defaultModelName;
    this.defaultClientOptions = defaultClientOptions;

    // Optional settings with their defaults.
    this.systemPrompt = systemPrompt ?? "";
    this.logInferenceToFile = logInferenceToFile ?? false;
    this.experimental = experimental ?? false;
    this.onMetrics = onMetrics;
  }

  /**
   * Finds elements on the page that match `params.instruction` (or a generic
   * "find actionable elements" instruction when none is given).
   *
   * The timeout, when set, is checked before the snapshot is captured and
   * before the LLM is called; an `ObserveTimeoutError` is thrown at whichever
   * checkpoint finds the budget exhausted.
   *
   * Elements whose id cannot be mapped to an XPath are dropped. For
   * `dragAndDrop` suggestions the first argument is expected to be the target
   * element id and is rewritten to an `xpath=` selector; suggestions whose
   * target is malformed or unknown are dropped as well. Element ids without a
   * "-" produce a "not-supported" placeholder entry.
   */
  async observe(params: ObserveHandlerParams): Promise<Action[]> {
    const { instruction, page, timeout, selector, model } = params;

    const llmClient = this.resolveLlmClient(model);

    const ensureTimeRemaining = createTimeoutGuard(
      timeout,
      (ms) => new ObserveTimeoutError(ms),
    );

    const effectiveInstruction = instruction ?? DEFAULT_OBSERVE_INSTRUCTION;

    v3Logger({
      category: "observation",
      message: "starting observation",
      level: 1,
      auxiliary: {
        instruction: {
          value: effectiveInstruction,
          type: "string",
        },
      },
    });

    // Snapshot: a11y-centric text tree plus the id -> xpath lookup map.
    const focusSelector = selector?.replace(/^xpath=/i, "") ?? "";
    ensureTimeRemaining();
    const snapshot = await captureHybridSnapshot(page, {
      experimental: this.experimental,
      focusSelector: focusSelector || undefined,
    });

    const { combinedTree } = snapshot;
    const combinedXpathMap = snapshot.combinedXpathMap ?? {};

    v3Logger({
      category: "observation",
      message: "Got accessibility tree data",
      level: 1,
    });

    // Ask the model which elements are relevant.
    ensureTimeRemaining();
    const observationResponse = await runObserve({
      instruction: effectiveInstruction,
      domElements: combinedTree,
      llmClient,
      userProvidedInstructions: this.systemPrompt,
      logger: v3Logger,
      logInferenceToFile: this.logInferenceToFile,
      supportedActions: Object.values(SupportedUnderstudyAction),
    });

    // Report usage for this call; missing counters count as 0.
    const {
      prompt_tokens: promptTokens = 0,
      completion_tokens: completionTokens = 0,
      reasoning_tokens: reasoningTokens = 0,
      cached_input_tokens: cachedInputTokens = 0,
      inference_time_ms: inferenceTimeMs = 0,
    } = observationResponse;

    this.onMetrics?.(
      V3FunctionName.OBSERVE,
      promptTokens,
      completionTokens,
      reasoningTokens,
      cachedInputTokens,
      inferenceTimeMs,
    );

    // Translate each suggested element id into a selector.
    const resolved = await Promise.all(
      observationResponse.elements.map(async (element) => {
        const { elementId, ...rest } = element; // rest may or may not have method/arguments

        // Ids that are not of the encoded "x-y" form get the shadow-root fallback.
        if (typeof elementId !== "string" || !elementId.includes("-")) {
          return {
            description: "an element inside a shadow DOM",
            method: "not-supported",
            arguments: [],
            selector: "not-supported",
          };
        }

        const sourceXpath = trimTrailingTextNode(
          combinedXpathMap[elementId as EncodedId],
        );
        if (!sourceXpath) return undefined;

        // dragAndDrop carries the target element id as its first argument;
        // swap it for the target's xpath.
        let resolvedArgs = rest.arguments;
        if (
          rest.method === "dragAndDrop" &&
          Array.isArray(rest.arguments) &&
          rest.arguments.length > 0
        ) {
          const targetArg = rest.arguments[0];

          // Anything that does not look like an element id (e.g. "1-67") is rejected.
          if (typeof targetArg !== "string" || !/^\d+-\d+$/.test(targetArg)) {
            v3Logger({
              category: "observation",
              message: "dragAndDrop target element invalid ID format",
              level: 0,
              auxiliary: {
                targetElementId: { value: targetArg, type: "string" },
                sourceElementId: { value: elementId, type: "string" },
              },
            });
            return undefined;
          }

          const targetXpath = trimTrailingTextNode(
            combinedXpathMap[targetArg as EncodedId],
          );
          if (!targetXpath) {
            // Unknown target: drop the whole suggestion.
            v3Logger({
              category: "observation",
              message: "dragAndDrop target element lookup failed",
              level: 0,
              auxiliary: {
                targetElementId: { value: targetArg, type: "string" },
                sourceElementId: { value: elementId, type: "string" },
              },
            });
            return undefined;
          }

          resolvedArgs = [`xpath=${targetXpath}`, ...rest.arguments.slice(1)];
        }

        return {
          ...rest,
          arguments: resolvedArgs,
          selector: `xpath=${sourceXpath}`,
        } as {
          description: string;
          method?: string;
          arguments?: string[];
          selector: string;
        };
      }),
    );

    const elementsWithSelectors = resolved.filter(
      <T>(candidate: T | undefined): candidate is T => candidate !== undefined,
    );

    v3Logger({
      category: "observation",
      message: "found elements",
      level: 1,
      auxiliary: {
        elements: {
          value: JSON.stringify(elementsWithSelectors),
          type: "object",
        },
      },
    });

    return elementsWithSelectors;
  }
}


================================================
FILE: packages/core/lib/v3/handlers/v3AgentHandler.ts
================================================
import { createAgentTools } from "../agent/tools/index.js";
import { buildAgentSystemPrompt } from "../agent/prompts/agentSystemPrompt.js";
import { LogLine } from "../types/public/logs.js";
import { V3 } from "../v3.js";
import {
  ModelMessage,
  ToolSet,
  wrapLanguageModel,
  stepCountIs,
  LanguageModel,
  type LanguageModelUsage,
  type StepResult,
  type GenerateTextOnStepFinishCallback,
  type StreamTextOnStepFinishCallback,
  type PrepareStepFunction,
} from "ai";
import { StagehandZodObject } from "../zodCompat.js";
import { processMessages } from "../agent/utils/messageProcessing.js";
import { LLMClient } from "../llm/LLMClient.js";
import { FlowLogger } from "../flowlogger/FlowLogger.js";
import {
  AgentExecuteOptions,
  AgentStreamExecuteOptions,
  AgentExecuteOptionsBase,
  AgentResult,
  AgentContext,
  AgentState,
  AgentStreamResult,
  AgentStreamCallbacks,
  AgentToolMode,
  AgentModelConfig,
  Variables,
} from "../types/public/agent.js";
import { V3FunctionName } from "../types/public/methods.js";
import { mapToolResultToActions } from "../agent/utils/actionMapping.js";
import {
  MissingLLMConfigurationError,
  MissingEnvironmentVariableError,
  StreamingCallbacksInNonStreamingModeError,
  AgentAbortError,
} from "../types/public/sdkErrors.js";
import { handleDoneToolCall } from "../agent/utils/handleDoneToolCall.js";
import {
  CaptchaSolver,
  CAPTCHA_SOLVED_MSG,
  CAPTCHA_ERRORED_MSG,
} from "../agent/utils/captchaSolver.js";

/**
 * Extracts a printable message from a caught value: the `message` of an
 * `Error`, otherwise the value's string conversion.
 */
function getErrorMessage(error: unknown): string {
  if (error instanceof Error) {
    return error.message;
  }
  return String(error);
}

/**
 * Returns a new message list that starts with a system message holding
 * `systemPrompt`, followed by `messages` in their original order. The input
 * array is not modified.
 *
 * The system message carries Anthropic `cacheControl: ephemeral` provider
 * options; these are used by Anthropic and ignored by other providers.
 */
function prependSystemMessage(
  systemPrompt: string,
  messages: ModelMessage[],
): ModelMessage[] {
  const systemMessage: ModelMessage = {
    role: "system",
    content: systemPrompt,
    providerOptions: {
      anthropic: {
        cacheControl: { type: "ephemeral" },
      },
    },
  };
  return [systemMessage, ...messages];
}

export class V3AgentHandler {
  private v3: V3;
  private logger: (message: LogLine) => void;
  private llmClient: LLMClient;
  private executionModel?: string | AgentModelConfig;
  private systemInstructions?: string;
  private mcpTools?: ToolSet;
  private mode: AgentToolMode;
  private captchaAutoSolveEnabled: boolean;

  /**
   * @param v3                      Owning V3 instance.
   * @param logger                  Sink for agent log lines.
   * @param llmClient               Client used to run the agent's model.
   * @param executionModel          Optional execution model (name or config).
   * @param systemInstructions      Optional extra system instructions.
   * @param mcpTools                Optional additional tools merged into the
   *                                agent's tool set.
   * @param mode                    Tool mode; defaults to "dom".
   * @param captchaAutoSolveEnabled Whether a captcha solver is set up for
   *                                runs; defaults to false.
   */
  constructor(
    v3: V3,
    logger: (message: LogLine) => void,
    llmClient: LLMClient,
    executionModel?: string | AgentModelConfig,
    systemInstructions?: string,
    mcpTools?: ToolSet,
    mode?: AgentToolMode,
    captchaAutoSolveEnabled?: boolean,
  ) {
    // Required collaborators.
    this.v3 = v3;
    this.llmClient = llmClient;
    this.logger = logger;

    // Optional configuration, stored as given.
    this.executionModel = executionModel;
    this.mcpTools = mcpTools;
    this.systemInstructions = systemInstructions;

    // Optional configuration with defaults.
    this.captchaAutoSolveEnabled = captchaAutoSolveEnabled ?? false;
    this.mode = mode ?? "dom";
  }

  /**
   * Assembles everything a run needs before the model is invoked: normalised
   * options, step limit (20 when unset or 0), system prompt, merged tool set,
   * initial messages, the logging-wrapped model and the starting page URL.
   *
   * Throws `MissingEnvironmentVariableError` when `useSearch` is requested
   * without a Browserbase API key, and `MissingLLMConfigurationError` when the
   * LLM client cannot provide a language model. Any failure is logged before
   * being rethrown unchanged.
   */
  private async prepareAgent(
    instructionOrOptions: string | AgentExecuteOptionsBase,
  ): Promise<AgentContext> {
    try {
      // A bare string is shorthand for `{ instruction }`.
      const options =
        typeof instructionOrOptions === "string"
          ? { instruction: instructionOrOptions }
          : instructionOrOptions;

      const maxSteps = options.maxSteps || 20;

      // The system prompt embeds the URL the agent starts from.
      const activePage = await this.v3.context.awaitActivePage();
      const initialPageUrl = activePage.url();

      const systemPrompt = buildAgentSystemPrompt({
        url: initialPageUrl,
        executionInstruction: options.instruction,
        mode: this.mode,
        systemInstructions: this.systemInstructions,
        captchasAutoSolve: this.v3.isCaptchaAutoSolveEnabled,
        excludeTools: options.excludeTools,
        variables: options.variables,
        useSearch: options.useSearch,
      });

      // Search needs a Browserbase API key.
      if (options.useSearch && !this.v3.browserbaseApiKey) {
        throw new MissingEnvironmentVariableError(
          "BROWSERBASE_API_KEY",
          "agent search (useSearch: true)",
        );
      }

      // Built-in tools first; MCP tools with the same name take precedence.
      const builtInTools = this.createTools(
        options.excludeTools,
        options.variables,
        options.toolTimeout,
        options.useSearch,
      );
      const allTools: ToolSet = { ...builtInTools, ...this.mcpTools };

      // Continue a prior conversation when messages were supplied, otherwise
      // start fresh; either way the instruction is the last user message.
      const instructionMessage: ModelMessage = {
        role: "user",
        content: options.instruction,
      };
      const messages: ModelMessage[] = options.messages?.length
        ? [...options.messages, instructionMessage]
        : [instructionMessage];

      if (!this.llmClient?.getLanguageModel) {
        throw new MissingLLMConfigurationError();
      }
      const baseModel = this.llmClient.getLanguageModel();
      //to do - we likely do not need middleware anymore
      const wrappedModel = wrapLanguageModel({
        model: baseModel,
        middleware: {
          ...FlowLogger.createLlmLoggingMiddleware(baseModel.modelId),
        },
      });

      // Hybrid mode: warn for models other than the recommended families.
      if (this.mode === "hybrid") {
        const isRecommendedForHybrid =
          baseModel.modelId.includes("gemini-3-flash") ||
          baseModel.modelId.includes("claude");
        if (!isRecommendedForHybrid) {
          this.logger({
            category: "agent",
            message: `Warning: "${baseModel.modelId}" may not perform well in hybrid mode. See recommended models: https://docs.stagehand.dev/v3/basics/agent#hybrid-mode`,
            level: 0,
          });
        }
      }

      return {
        options,
        maxSteps,
        systemPrompt,
        allTools,
        messages,
        wrappedModel,
        initialPageUrl,
      };
    } catch (error) {
      this.logger({
        category: "agent",
        message: `failed to prepare agent: ${error}`,
        level: 0,
      });
      throw error;
    }
  }
  /**
   * Builds the `prepareStep` hook that runs before each model step.
   *
   * The hook first runs `processMessages` on the step's messages. When a
   * captcha solver is supplied it then waits for any in-progress solve and,
   * depending on the outcome, appends a "solved" and/or "errored" user message
   * so the model is told what happened. Finally it delegates to the user's
   * callback when one is provided, otherwise it returns the options it
   * received.
   */
  private createPrepareStep(
    userCallback?: PrepareStepFunction<ToolSet>,
    captchaSolver?: CaptchaSolver,
  ): PrepareStepFunction<ToolSet> {
    // Appends a user-role notice for the model and logs that it was injected.
    const injectNotice = (
      messages: ModelMessage[],
      content: string,
      logMessage: string,
    ): void => {
      messages.push({ role: "user", content });
      this.logger({ category: "agent", message: logMessage, level: 1 });
    };

    return async (options) => {
      processMessages(options.messages);

      if (captchaSolver) {
        if (captchaSolver.isSolving()) {
          this.logger({
            category: "agent",
            message:
              "Captcha detected — waiting for Browserbase to solve it before continuing",
            level: 1,
          });
        }
        await captchaSolver.waitIfSolving();

        const outcome = captchaSolver.consumeSolveResult();
        if (outcome.solved) {
          injectNotice(
            options.messages,
            CAPTCHA_SOLVED_MSG,
            "Captcha solved — injected notification into agent message stream",
          );
        }
        if (outcome.errored) {
          injectNotice(
            options.messages,
            CAPTCHA_ERRORED_MSG,
            "Captcha solver failed — injected error notification into agent message stream",
          );
        }
      }

      if (!userCallback) {
        return options;
      }
      return userCallback(options);
    };
  }

  /**
   * Builds the `onStepFinish` handler that folds each finished step into the
   * shared agent `state`.
   *
   * For a step that contains tool calls the handler:
   *  - records the step's text once as reasoning (and logs it),
   *  - marks the run completed when the "done" tool was called, deriving
   *    `finalMessage` from the collected reasoning when `taskComplete` is set,
   *  - maps every tool call/result pair to actions, stamping each with the
   *    page URL recorded before the step and the current time,
   *  - refreshes `state.currentPageUrl` from the active page.
   *
   * The user's callback, when provided, is awaited last with the same event.
   *
   * @param state        Mutable run state updated in place.
   * @param userCallback Optional caller-supplied step callback.
   */
  private createStepHandler(
    state: AgentState,
    userCallback?:
      | GenerateTextOnStepFinishCallback<ToolSet>
      | StreamTextOnStepFinishCallback<ToolSet>,
  ) {
    return async (event: StepResult<ToolSet>) => {
      this.logger({
        category: "agent",
        message: `Step finished: ${event.finishReason}`,
        level: 2,
      });

      if (event.toolCalls && event.toolCalls.length > 0) {
        // The text belongs to the step, not to an individual tool call, so it
        // is recorded once per step. Recording it inside the loop below would
        // duplicate it for every parallel tool call and repeat it in
        // `finalMessage`.
        if (event.text && event.text.length > 0) {
          state.collectedReasoning.push(event.text);
          this.logger({
            category: "agent",
            message: `reasoning: ${event.text}`,
            level: 1,
          });
        }

        for (let i = 0; i < event.toolCalls.length; i++) {
          const toolCall = event.toolCalls[i];
          const args = toolCall.input;
          const toolResult = event.toolResults?.[i];

          if (toolCall.toolName === "done") {
            state.completed = true;
            if (args?.taskComplete) {
              const doneReasoning = args.reasoning;
              const allReasoning = state.collectedReasoning.join(" ");
              state.finalMessage = doneReasoning
                ? `${allReasoning} ${doneReasoning}`.trim()
                : allReasoning || "Task completed successfully";
            }
          }

          const mappedActions = mapToolResultToActions({
            toolCallName: toolCall.toolName,
            toolResult,
            args,
            reasoning: event.text || undefined,
          });

          // Actions are attributed to the page the step started on; the URL is
          // only refreshed after all of the step's tool calls are processed.
          for (const action of mappedActions) {
            action.pageUrl = state.currentPageUrl;
            action.timestamp = Date.now();
            state.actions.push(action);
          }
        }
        state.currentPageUrl = (await this.v3.context.awaitActivePage()).url();
      }

      if (userCallback) {
        await userCallback(event);
      }
    };
  }

  /**
   * Runs the agent to completion in non-streaming mode.
   *
   * Validation errors and aborts are thrown to the caller; every other
   * failure is logged and reported as an unsuccessful `AgentResult`.
   *
   * @param instructionOrOptions - Instruction text, or an options object.
   * @returns The consolidated result, or a failure result for non-abort errors.
   * @throws StreamingCallbacksInNonStreamingModeError when streaming-only
   *   callbacks (`onChunk`, `onFinish`, `onError`, `onAbort`) are supplied.
   * @throws MissingEnvironmentVariableError re-thrown unchanged.
   * @throws AgentAbortError when the caller's signal is aborted at the time an
   *   error surfaces.
   */
  public async execute(
    instructionOrOptions: string | AgentExecuteOptions,
  ): Promise<AgentResult> {
    const startTime = Date.now();
    const rawOptions =
      typeof instructionOrOptions === "object" ? instructionOrOptions : null;
    const signal = rawOptions?.signal;

    // An explicit highlightCursor wins; otherwise it is on only in hybrid mode.
    const shouldHighlightCursor =
      rawOptions?.highlightCursor ?? this.mode === "hybrid";

    const state: AgentState = {
      collectedReasoning: [],
      actions: [],
      finalMessage: "",
      completed: false,
      currentPageUrl: "",
    };

    // Declared outside the try so the catch/finally blocks can reach them.
    let messages: ModelMessage[] = [];
    let captchaSolver: CaptchaSolver | undefined;

    try {
      const prepared = await this.prepareAgent(instructionOrOptions);
      const { maxSteps, systemPrompt, allTools, wrappedModel } = prepared;
      const preparedOptions = prepared.options;

      // The cursor overlay only applies to hybrid (coordinate-based) mode and
      // is best-effort: failures to enable it are ignored.
      if (shouldHighlightCursor && this.mode === "hybrid") {
        const activePage = await this.v3.context.awaitActivePage();
        await activePage.enableCursorOverlay().catch(() => {});
      }

      // Captcha auto-solving is only wired up when enabled for this handler.
      if (this.captchaAutoSolveEnabled) {
        captchaSolver = new CaptchaSolver();
        captchaSolver.init(() => this.v3.context.awaitActivePage());
      }

      messages = prepared.messages;
      state.currentPageUrl = prepared.initialPageUrl;

      const { callbacks } = instructionOrOptions as AgentExecuteOptions;

      // Streaming-only callbacks make no sense here; reject them up front.
      if (callbacks) {
        const streamingOnly = ["onChunk", "onFinish", "onError", "onAbort"];
        const offending: string[] = [];
        for (const name of streamingOnly) {
          if (callbacks[name as keyof typeof callbacks] != null) {
            offending.push(name);
          }
        }
        if (offending.length > 0) {
          throw new StreamingCallbacksInNonStreamingModeError(offending);
        }
      }

      const llmMessages = prependSystemMessage(systemPrompt, messages);
      const prepareStep = this.createPrepareStep(
        callbacks?.prepareStep,
        captchaSolver,
      );
      const onStepFinish = this.createStepHandler(
        state,
        callbacks?.onStepFinish,
      );

      const result = await this.llmClient.generateText({
        model: wrappedModel,
        messages: llmMessages,
        tools: allTools,
        stopWhen: (stepState) => this.handleStop(stepState, maxSteps),
        temperature: 1,
        toolChoice: "auto",

        prepareStep,
        onStepFinish,
        abortSignal: preparedOptions.signal,
        providerOptions: {
          google: { mediaResolution: "MEDIA_RESOLUTION_HIGH" },
          openai: { store: false },
        },
      });

      // Make sure a "done" verdict exists even if the model never called it.
      const conversation = [...messages, ...(result.response?.messages || [])];
      const doneResult = await this.ensureDone(
        state,
        wrappedModel,
        conversation,
        preparedOptions.instruction,
        preparedOptions.output,
        this.logger,
      );

      return this.consolidateMetricsAndResult(
        startTime,
        state,
        doneResult.messages,
        result,
        maxSteps,
        doneResult.output,
      );
    } catch (error) {
      // Validation errors must reach the caller untouched.
      const mustPropagate =
        error instanceof StreamingCallbacksInNonStreamingModeError ||
        error instanceof MissingEnvironmentVariableError;
      if (mustPropagate) {
        throw error;
      }

      // Aborts are normalised to AgentAbortError for consistent error typing.
      if (signal?.aborted) {
        throw new AgentAbortError(
          signal.reason ? String(signal.reason) : "aborted",
        );
      }

      const errorMessage = getErrorMessage(error);
      this.logger({
        category: "agent",
        message: `Error executing agent task: ${errorMessage}`,
        level: 0,
      });

      // Anything else is reported as a failed result rather than thrown.
      const failure: AgentResult = {
        success: false,
        actions: state.actions,
        message: `Failed to execute task: ${errorMessage}`,
        completed: false,
        messages,
      };
      return failure;
    } finally {
      captchaSolver?.dispose();
    }
  }

  /**
   * Starts the agent in streaming mode.
   *
   * The returned object is the LLM client's stream result with an extra
   * `result` promise attached. That promise resolves with the consolidated
   * `AgentResult` once the stream finishes and the "done" step has been
   * ensured, and rejects when the stream errors, is aborted, or the
   * post-stream finalisation itself fails.
   *
   * @param instructionOrOptions - Instruction text, or a streaming options object.
   * @returns The stream result augmented with a `result` promise.
   * @throws Whatever `prepareAgent` or the synchronous part of `streamText`
   *   throws; the captcha solver is disposed before re-throwing the latter.
   */
  public async stream(
    instructionOrOptions: string | AgentStreamExecuteOptions,
  ): Promise<AgentStreamResult> {
    const streamOptions =
      typeof instructionOrOptions === "object" ? instructionOrOptions : null;

    // Highlight cursor defaults to true for hybrid mode, can be overridden
    const shouldHighlightCursor =
      streamOptions?.highlightCursor ?? this.mode === "hybrid";

    const {
      options,
      maxSteps,
      systemPrompt,
      allTools,
      messages,
      wrappedModel,
      initialPageUrl,
    } = await this.prepareAgent(instructionOrOptions);

    // Enable cursor overlay for hybrid mode (coordinate-based interactions)
    if (shouldHighlightCursor && this.mode === "hybrid") {
      const page = await this.v3.context.awaitActivePage();
      await page.enableCursorOverlay().catch(() => {});
    }

    // Set up captcha solver for Browserbase environments
    let captchaSolver: CaptchaSolver | undefined;
    if (this.captchaAutoSolveEnabled) {
      captchaSolver = new CaptchaSolver();
      captchaSolver.init(() => this.v3.context.awaitActivePage());
    }

    const callbacks = (instructionOrOptions as AgentStreamExecuteOptions)
      .callbacks as AgentStreamCallbacks | undefined;

    const state: AgentState = {
      collectedReasoning: [],
      actions: [],
      finalMessage: "",
      completed: false,
      currentPageUrl: initialPageUrl,
    };
    const startTime = Date.now();

    // The result promise is settled from the stream callbacks below.
    let resolveResult: (value: AgentResult | PromiseLike<AgentResult>) => void;
    let rejectResult: (reason: unknown) => void;
    const resultPromise = new Promise<AgentResult>((resolve, reject) => {
      resolveResult = resolve;
      rejectResult = reject;
    });

    // Logs the failure and rejects the result promise with the original error.
    const handleError = (error: unknown) => {
      const errorMessage =
        error instanceof Error ? error.message : String(error);
      this.logger({
        category: "agent",
        message: `Error during streaming: ${errorMessage}`,
        level: 0,
      });
      rejectResult(error);
    };

    let streamResult: ReturnType<typeof this.llmClient.streamText>;
    try {
      streamResult = this.llmClient.streamText({
        model: wrappedModel,
        messages: prependSystemMessage(systemPrompt, messages),
        tools: allTools,
        stopWhen: (result) => this.handleStop(result, maxSteps),
        temperature: 1,
        toolChoice: "auto",
        prepareStep: this.createPrepareStep(
          callbacks?.prepareStep,
          captchaSolver,
        ),
        onStepFinish: this.createStepHandler(state, callbacks?.onStepFinish),
        onError: (event) => {
          captchaSolver?.dispose();
          if (callbacks?.onError) {
            callbacks.onError(event);
          }
          handleError(event.error);
        },
        onChunk: callbacks?.onChunk,
        onFinish: (event) => {
          captchaSolver?.dispose();
          if (callbacks?.onFinish) {
            callbacks.onFinish(event);
          }

          const allMessages = [
            ...messages,
            ...(event.response?.messages || []),
          ];
          this.ensureDone(
            state,
            wrappedModel,
            allMessages,
            options.instruction,
            options.output,
            this.logger,
          )
            .then((doneResult) => {
              const result = this.consolidateMetricsAndResult(
                startTime,
                state,
                doneResult.messages,
                event,
                maxSteps,
                doneResult.output,
              );
              resolveResult(result);
            })
            // Without this handler a failure while ensuring "done" or while
            // consolidating would leave the result promise pending forever
            // and surface only as an unhandled rejection.
            .catch(handleError);
        },
        onAbort: (event) => {
          captchaSolver?.dispose();
          if (callbacks?.onAbort) {
            callbacks.onAbort(event);
          }
          // Reject the result promise with AgentAbortError when stream is aborted
          const reason = options.signal?.reason
            ? String(options.signal.reason)
            : "Stream was aborted";
          rejectResult(new AgentAbortError(reason));
        },
        abortSignal: options.signal,
        providerOptions: {
          google: { mediaResolution: "MEDIA_RESOLUTION_HIGH" },
          openai: { store: false },
        },
      });
    } catch (error) {
      // streamText failed synchronously: no callback will ever run, so the
      // solver has to be released here.
      captchaSolver?.dispose();
      throw error;
    }

    const agentStreamResult = streamResult as AgentStreamResult;
    agentStreamResult.result = resultPromise;
    return agentStreamResult;
  }

  /**
   * Builds the final `AgentResult` and reports token usage to the V3 metrics.
   *
   * When no final message has been recorded yet, one is derived: a
   * "maximum steps" notice if the run stopped on the step limit without
   * completing, otherwise the collected reasoning, the model text, or "".
   *
   * @param startTime - Epoch milliseconds at which the run started.
   * @param state - Mutable run state; `finalMessage` may be filled in here.
   * @param inputMessages - Messages returned on the result as `messages`.
   * @param result - Text, usage, response and steps reported by the LLM call.
   * @param maxSteps - Step limit used to detect a step-limit stop.
   * @param output - Structured output passed through to the result.
   * @returns The consolidated agent result.
   */
  private consolidateMetricsAndResult(
    startTime: number,
    state: AgentState,
    inputMessages: ModelMessage[],
    result: {
      text?: string;
      totalUsage?: LanguageModelUsage;
      response?: { messages?: ModelMessage[] };
      steps?: StepResult<ToolSet>[];
    },
    maxSteps?: number,
    output?: Record<string, unknown>,
  ): AgentResult {
    if (!state.finalMessage) {
      const hitStepLimit =
        !state.completed && maxSteps && result.steps?.length >= maxSteps;

      if (hitStepLimit) {
        const limitMessage = `Agent stopped: reached maximum steps (${maxSteps})`;
        this.logger({
          category: "agent",
          message: limitMessage,
          level: 1,
        });
        state.finalMessage = limitMessage;
      } else {
        const joinedReasoning = state.collectedReasoning.join(" ").trim();
        state.finalMessage = joinedReasoning || result.text || "";
      }
    }

    const inferenceTimeMs = Date.now() - startTime;
    const totals = result.totalUsage;

    // Usage is only reported (and returned) when the LLM call provided it.
    let usage: AgentResult["usage"];
    if (totals) {
      const inputTokens = totals.inputTokens || 0;
      const outputTokens = totals.outputTokens || 0;
      const reasoningTokens = totals.reasoningTokens || 0;
      const cachedInputTokens = totals.cachedInputTokens || 0;

      this.v3.updateMetrics(
        V3FunctionName.AGENT,
        inputTokens,
        outputTokens,
        reasoningTokens,
        cachedInputTokens,
        inferenceTimeMs,
      );

      usage = {
        input_tokens: inputTokens,
        output_tokens: outputTokens,
        reasoning_tokens: reasoningTokens,
        cached_input_tokens: cachedInputTokens,
        inference_time_ms: inferenceTimeMs,
      };
    }

    return {
      success: state.completed,
      message: state.finalMessage || "Task execution completed",
      actions: state.actions,
      completed: state.completed,
      output,
      usage,
      messages: inputMessages,
    };
  }

  /**
   * Creates the agent tool set for this handler via `createAgentTools`.
   *
   * @param excludeTools - Tool names forwarded as `excludeTools`.
   * @param variables - Variables forwarded to the tools.
   * @param toolTimeout - Timeout forwarded as `toolTimeout`.
   * @param useSearch - Forwarded as `useSearch`; the Browserbase API key is
   *   only passed along when this is truthy.
   * @returns Whatever `createAgentTools` returns.
   */
  private createTools(
    excludeTools?: string[],
    variables?: Variables,
    toolTimeout?: number,
    useSearch?: boolean,
  ) {
    const languageModel = this.llmClient?.getLanguageModel?.();
    const provider = languageModel?.provider;

    let browserbaseApiKey = undefined;
    if (useSearch) {
      browserbaseApiKey = this.v3.browserbaseApiKey;
    }

    return createAgentTools(this.v3, {
      executionModel: this.executionModel,
      logger: this.logger,
      mode: this.mode,
      provider,
      excludeTools,
      variables,
      toolTimeout,
      useSearch,
      browserbaseApiKey,
    });
  }

  /**
   * Stop condition for the LLM loop: stop as soon as the most recent step
   * called the "done" tool, otherwise defer to the step-count limit.
   *
   * @param result - Step state supplied by the LLM loop.
   * @param maxSteps - Maximum number of steps before stopping.
   * @returns `true` (or a promise of it) when the loop should stop.
   */
  private handleStop(
    result: Parameters<ReturnType<typeof stepCountIs>>[0],
    maxSteps: number,
  ): boolean | PromiseLike<boolean> {
    const { steps } = result;
    const finalStep = steps[steps.length - 1];
    const calledDone = finalStep?.toolCalls?.some(
      ({ toolName }) => toolName === "done",
    );
    return calledDone ? true : stepCountIs(maxSteps)(result);
  }

  /**
   * Guarantees that a "done" verdict exists at the end of a run.
   *
   * If the run is already marked completed the messages are returned as-is.
   * Otherwise `handleDoneToolCall` is invoked, its verdict is written to
   * `state`, and the resulting "done" action(s) are appended to the action log.
   *
   * @param state - Mutable run state (`completed`, `finalMessage`, `actions`).
   * @param model - Language model passed to `handleDoneToolCall`.
   * @param messages - Conversation so far.
   * @param instruction - The original task instruction.
   * @param outputSchema - Optional schema for structured output.
   * @param logger - Optional logger passed through to the done call.
   * @returns The (possibly extended) messages and any extracted output.
   */
  private async ensureDone(
    state: AgentState,
    model: LanguageModel,
    messages: ModelMessage[],
    instruction: string,
    outputSchema?: StagehandZodObject,
    logger?: (message: LogLine) => void,
  ): Promise<{ messages: ModelMessage[]; output?: Record<string, unknown> }> {
    if (state.completed) {
      return { messages };
    }

    const {
      taskComplete,
      reasoning,
      output,
      messages: doneMessages,
    } = await handleDoneToolCall({
      model,
      inputMessages: messages,
      instruction,
      outputSchema,
      logger,
    });

    state.completed = taskComplete;
    state.finalMessage = reasoning;

    // Record the done call in the action log like any other tool call.
    const doneActions = mapToolResultToActions({
      toolCallName: "done",
      toolResult: { success: true, reasoning, taskComplete },
      args: { reasoning, taskComplete },
      reasoning,
    });

    for (const entry of doneActions) {
      entry.pageUrl = state.currentPageUrl;
      entry.timestamp = Date.now();
      state.actions.push(entry);
    }

    return {
      messages: [...messages, ...doneMessages],
      output,
    };
  }
}


================================================
FILE: packages/core/lib/v3/handlers/v3CuaAgentHandler.ts
================================================
import { computeActiveElementXpath } from "../understudy/a11y/snapshot/index.js";
import { V3 } from "../v3.js";
import { ToolSet } from "ai";
import { AgentClient } from "../agent/AgentClient.js";
import { AgentProvider } from "../agent/AgentProvider.js";
import { GoogleCUAClient } from "../agent/GoogleCUAClient.js";
import { OpenAICUAClient } from "../agent/OpenAICUAClient.js";
import { mapKeyToPlaywright } from "../agent/utils/cuaKeyMapping.js";
import { ensureXPath } from "../agent/utils/xpath.js";
import {
  ActionExecutionResult,
  AgentAction,
  AgentExecuteOptions,
  AgentHandlerOptions,
  AgentResult,
  SafetyConfirmationHandler,
} from "../types/public/agent.js";
import { LogLine } from "../types/public/logs.js";
import { type Action, V3FunctionName } from "../types/public/methods.js";
import { FlowLogger } from "../flowlogger/FlowLogger.js";
import { toTitleCase } from "../../utils.js";
import { StagehandClosedError } from "../types/public/sdkErrors.js";
import {
  CaptchaSolver,
  CAPTCHA_SOLVED_MSG,
  CAPTCHA_ERRORED_MSG,
} from "../agent/utils/captchaSolver.js";

export class V3CuaAgentHandler {
  // Owning V3 instance; used for page access, metrics and replay recording.
  private v3: V3;
  // Client used to run the task; the constructor assigns it the same object
  // as `agentClient`.
  private agent: AgentClient;
  // Factory that builds the client for the configured model.
  private provider: AgentProvider;
  private logger: (message: LogLine) => void;
  // Client that receives the screenshot provider, action handler and hooks.
  private agentClient: AgentClient;
  private options: AgentHandlerOptions;
  // Set at the start of each execute() call; true unless the caller passed
  // `highlightCursor: false`.
  private highlightCursor: boolean;
  // Non-null only while execute() is running with captcha auto-solve enabled.
  private captchaSolver: CaptchaSolver | null = null;
  // Decremented each time an interaction with an already-solved captcha is
  // skipped. NOTE(review): where it is armed is outside this view — presumably
  // when a solve result is handled; confirm.
  private captchaClickGuardRemaining = 0;
  // Instruction of the current execute() call; quoted in captcha context notes.
  private currentInstruction = "";

  /**
   * Builds the handler: creates the provider, obtains the agent client for
   * the configured model and wires the client up to the browser.
   *
   * @param v3 - Owning V3 instance.
   * @param logger - Log sink used by the handler and the provider.
   * @param options - Handler options (model name, client options, instructions).
   * @param tools - Optional tool set passed to the client.
   */
  constructor(
    v3: V3,
    logger: (message: LogLine) => void,
    options: AgentHandlerOptions,
    tools?: ToolSet,
  ) {
    this.v3 = v3;
    this.logger = logger;
    this.options = options;

    this.provider = new AgentProvider(logger);

    const { modelName, clientOptions, userProvidedInstructions } = options;
    this.agentClient = this.provider.getClient(
      modelName,
      clientOptions || {},
      userProvidedInstructions,
      tools,
    );

    // The client must be assigned before it is wired up.
    this.setupAgentClient();
    this.agent = this.agentClient;
  }

  /**
   * Guards against use after close: the V3 context must still be present.
   *
   * @throws StagehandClosedError when `this.v3.context` is falsy.
   */
  private ensureNotClosed(): void {
    const contextAlive = Boolean(this.v3.context);
    if (contextAlive) {
      return;
    }
    throw new StagehandClosedError();
  }

  /**
   * Wires the agent client to the browser.
   *
   * Registers a screenshot provider and an action handler on the client, then
   * kicks off (without awaiting) an initial viewport and URL sync.
   *
   * The action handler, for each action:
   *  1. waits for any in-progress captcha solve and processes its outcome,
   *  2. stamps the action with the active page URL,
   *  3. skips interactions aimed at an already-solved captcha,
   *  4. executes the action (with flow logging, except for screenshots),
   *  5. waits `clientOptions.waitBetweenActions` ms (default 500) and sends a
   *     fresh screenshot to the client.
   * Execution errors are logged and re-thrown; screenshot failures after a
   * successful action are only logged.
   */
  private setupAgentClient(): void {
    // Provide screenshots to the agent client
    this.agentClient.setScreenshotProvider(async () => {
      this.ensureNotClosed();
      const page = await this.v3.context.awaitActivePage();
      const screenshotBuffer = await page.screenshot({ fullPage: false });
      return screenshotBuffer.toString("base64"); // base64 png
    });

    // Provide action executor
    this.agentClient.setActionHandler(async (action) => {
      this.ensureNotClosed();

      // Wait for captcha solver to finish before executing action
      if (this.captchaSolver) {
        if (this.captchaSolver.isSolving()) {
          this.logger({
            category: "agent",
            message:
              "Captcha detected — waiting for Browserbase to solve it before continuing",
            level: 1,
          });
        }
        await this.captchaSolver.waitIfSolving();
        this.handleCaptchaSolveResult(this.captchaSolver.consumeSolveResult());
      }

      action.pageUrl = (await this.v3.context.awaitActivePage()).url();
      if (await this.shouldSkipSolvedCaptchaInteraction(action)) {
        // Consume one unit of the guard (never below zero) and steer the
        // model back to the task instead of executing the action.
        this.captchaClickGuardRemaining = Math.max(
          0,
          this.captchaClickGuardRemaining - 1,
        );
        this.agentClient.addContextNote(
          `The captcha has already been solved automatically. Do not click the captcha checkbox, widget, or challenge again. Continue with the original task outside the captcha area. Original task: ${this.currentInstruction}`,
        );
        this.logger({
          category: "agent",
          message:
            "Skipped click on solved captcha widget — injected follow-up guidance",
          level: 1,
        });
        return;
      }

      const defaultDelay = 500;
      const configuredDelay = this.options.clientOptions
        ?.waitBetweenActions as number;
      // An explicit 0 means "no delay"; a bare `||` would silently replace it
      // with the default. Every other value behaves exactly as before.
      const waitBetween =
        configuredDelay === 0 ? 0 : configuredDelay || defaultDelay;
      try {
        // Try to inject cursor before each action if enabled
        if (this.highlightCursor) {
          try {
            await this.injectCursor();
          } catch {
            // Ignore cursor injection failures
          }
        }
        await new Promise((r) => setTimeout(r, 300));
        // Skip logging for screenshot actions - they're no-ops, the actual
        // Page.screenshot in captureAndSendScreenshot() is logged separately
        const shouldLog = action.type !== "screenshot";
        if (shouldLog) {
          await FlowLogger.runWithLogging(
            {
              eventType: `V3Cua${toTitleCase(action.type)}`, // e.g. "V3CuaClick"
              data: {
                target: this.computePointerTarget(action),
              },
            },
            async (loggedAction: typeof action) =>
              await this.executeAction(loggedAction),
            [action],
          );
        } else {
          await this.executeAction(action);
        }

        action.timestamp = Date.now();

        await new Promise((r) => setTimeout(r, waitBetween));
        try {
          await this.captureAndSendScreenshot();
        } catch (e) {
          this.logger({
            category: "agent",
            message: `Warning: Failed to take screenshot after action: ${String(
              (e as Error)?.message ?? e,
            )}`,
            level: 1,
          });
        }
      } catch (error) {
        const msg = (error as Error)?.message ?? String(error);
        this.logger({
          category: "agent",
          message: `Error executing action ${action.type}: ${msg}`,
          level: 0,
        });
        throw error;
      }
    });

    // Fire-and-forget: both helpers swallow their own errors.
    void this.updateClientViewport();
    void this.updateClientUrl();
  }

  /**
   * Forwards a safety-confirmation handler to the agent client when the
   * client is a Google or OpenAI CUA client; other clients are left untouched.
   *
   * @param handler - Handler to install, or undefined.
   */
  setSafetyConfirmationHandler(handler?: SafetyConfirmationHandler): void {
    const client = this.agentClient;
    if (
      !(client instanceof GoogleCUAClient) &&
      !(client instanceof OpenAICUAClient)
    ) {
      return;
    }
    client.setSafetyConfirmationHandler(handler);
  }

  /**
   * Runs a computer-use agent task.
   *
   * Prepares the page (navigating away from a blank page), optionally sets up
   * captcha handling and the cursor overlay, delegates to the agent client and
   * finally reports token usage to the V3 metrics.
   *
   * @param optionsOrInstruction - Options object, or just the instruction text.
   * @returns The result produced by the agent client.
   */
  async execute(
    optionsOrInstruction: AgentExecuteOptions | string,
  ): Promise<AgentResult> {
    const options =
      typeof optionsOrInstruction !== "string"
        ? optionsOrInstruction
        : { instruction: optionsOrInstruction };

    this.setSafetyConfirmationHandler(options.callbacks?.onSafetyConfirmation);

    // Cursor highlighting is on unless explicitly disabled.
    this.highlightCursor = options.highlightCursor !== false;
    this.currentInstruction = options.instruction;

    // A blank page gives the agent nothing to look at; start from Google.
    const activePage = await this.v3.context.awaitActivePage();
    const startUrl = activePage.url();
    const pageIsBlank = !startUrl || startUrl === "about:blank";
    if (pageIsBlank) {
      this.logger({
        category: "agent",
        message: `Page URL is empty. Navigating to https://www.google.com ...`,
        level: 1,
      });
      await activePage.goto("https://www.google.com", { waitUntil: "load" });
    }

    // Captcha auto-solve: create the solver and pause the agent loop before
    // each step while a solve is in progress.
    if (this.v3.isCaptchaAutoSolveEnabled) {
      this.captchaSolver = new CaptchaSolver();
      this.captchaSolver.init(() => this.v3.context.awaitActivePage());

      this.agentClient.setPreStepHook(async () => {
        if (this.captchaSolver?.isSolving()) {
          this.logger({
            category: "agent",
            message:
              "Captcha detected — waiting for Browserbase to solve it before continuing",
            level: 1,
          });
        }
        await this.captchaSolver?.waitIfSolving();
        this.handleCaptchaSolveResult(this.captchaSolver?.consumeSolveResult());
      });
    }

    // Cursor injection is best-effort: a failure is logged, never fatal.
    if (this.highlightCursor) {
      try {
        await this.injectCursor();
      } catch (error) {
        const reason = error instanceof Error ? error.message : String(error);
        this.logger({
          category: "agent",
          message: `Warning: Failed to inject cursor: ${reason}. Continuing with execution.`,
          level: 1,
        });
      }
    }

    const startedAt = Date.now();
    let result: AgentResult;
    try {
      result = await this.agent.execute({ options, logger: this.logger });
    } finally {
      // Always release the solver, whether the run succeeded or threw.
      this.captchaSolver?.dispose();
      this.captchaSolver = null;
    }
    const inferenceTimeMs = Date.now() - startedAt;

    const { usage } = result;
    if (usage) {
      this.v3.updateMetrics(
        V3FunctionName.AGENT,
        usage.input_tokens,
        usage.output_tokens,
        usage.reasoning_tokens ?? 0,
        usage.cached_input_tokens ?? 0,
        inferenceTimeMs,
      );
    }
    return result;
  }

  /**
   * Executes a single agent action against the active page.
   *
   * Dispatches on `action.type`. When agent replay recording is active
   * (`this.v3.isAgentReplayActive()`), pointer/keyboard actions additionally
   * resolve the affected element's XPath and record an equivalent replay step;
   * navigation and wait actions record their own step types.
   *
   * @param action - The action to perform; fields are read per action type.
   * @returns `{ success: true }` for every recognised type, or
   *   `{ success: false, error }` for an unknown type. Errors thrown by the
   *   page calls are not caught here.
   */
  private async executeAction(
    action: AgentAction,
  ): Promise<ActionExecutionResult> {
    const page = await this.v3.context.awaitActivePage();
    const recording = this.v3.isAgentReplayActive();
    switch (action.type) {
      case "click": {
        const { x, y, button = "left", clickCount } = action;
        if (recording) {
          // Ask the page for the clicked element's XPath so the click can be
          // replayed by selector rather than by coordinates.
          const xpath = await page.click(x as number, y as number, {
            button: (button as "left" | "right" | "middle") ?? "left",
            clickCount: (clickCount as number) ?? 1,
            returnXpath: true,
          });
          const normalized = ensureXPath(xpath);
          // Nothing is recorded when no usable XPath came back.
          if (normalized) {
            const stagehandAction: Action = {
              selector: normalized,
              description: this.describePointerAction("click", x, y),
              method: "click",
              arguments: [],
            };
            this.recordCuaActStep(
              action,
              [stagehandAction],
              stagehandAction.description,
            );
          }
        } else {
          await page.click(x as number, y as number, {
            button: (button as "left" | "right" | "middle") ?? "left",
            clickCount: (clickCount as number) ?? 1,
          });
        }
        return { success: true };
      }
      // Both spellings of the double-click action type are accepted.
      case "double_click":
      case "doubleClick": {
        const { x, y } = action;
        if (recording) {
          const xpath = await page.click(x as number, y as number, {
            button: "left",
            clickCount: 2,
            returnXpath: true,
          });
          const normalized = ensureXPath(xpath);
          if (normalized) {
            const stagehandAction: Action = {
              selector: normalized,
              description: this.describePointerAction("double click", x, y),
              method: "doubleClick",
              arguments: [],
            };
            this.recordCuaActStep(
              action,
              [stagehandAction],
              stagehandAction.description,
            );
          }
        } else {
          await page.click(x as number, y as number, {
            button: "left",
            clickCount: 2,
          });
        }
        return { success: true };
      }
      case "tripleClick": {
        const { x, y } = action;
        if (recording) {
          const xpath = await page.click(x as number, y as number, {
            button: "left",
            clickCount: 3,
            returnXpath: true,
          });
          const normalized = ensureXPath(xpath);
          if (normalized) {
            const stagehandAction: Action = {
              selector: normalized,
              description: this.describePointerAction("triple click", x, y),
              method: "tripleClick",
              arguments: [],
            };
            this.recordCuaActStep(
              action,
              [stagehandAction],
              stagehandAction.description,
            );
          }
        } else {
          // NOTE(review): unlike the recording path, no `button` is passed
          // here — presumably the page default is "left"; confirm.
          await page.click(x as number, y as number, {
            clickCount: 3,
          });
        }
        return { success: true };
      }
      case "type": {
        const { text } = action;
        await page.type(String(text ?? ""));
        if (recording) {
          // The typed-into element is identified after the fact via the
          // currently active element.
          const xpath = await computeActiveElementXpath(page);
          const normalized = ensureXPath(xpath);
          if (normalized) {
            const stagehandAction: Action = {
              selector: normalized,
              description: this.describeTypeAction(String(text ?? "")),
              method: "type",
              arguments: [String(text ?? "")],
            };
            this.recordCuaActStep(
              action,
              [stagehandAction],
              stagehandAction.description,
            );
          }
        }
        return { success: true };
      }
      case "keypress": {
        const { keys } = action;
        // Accept either a single key or a list of keys.
        const keyList = Array.isArray(keys) ? keys : [keys];
        const stagehandActions: Action[] = [];
        for (const rawKey of keyList) {
          const mapped = mapKeyToPlaywright(String(rawKey ?? ""));
          await page.keyPress(mapped);
          if (recording) {
            // Key presses are recorded against the document root.
            stagehandActions.push({
              selector: "xpath=/html",
              description: `press ${mapped}`,
              method: "press",
              arguments: [mapped],
            });
          }
        }
        if (recording && stagehandActions.length > 0) {
          // All keys of one keypress action are recorded as a single step.
          this.recordCuaActStep(
            action,
            stagehandActions,
            stagehandActions
              .map((a) => a.description)
              .filter(Boolean)
              .join(", ") || "keypress",
          );
        }
        return { success: true };
      }
      case "scroll": {
        const { x, y, scroll_x = 0, scroll_y = 0 } = action;
        await page.scroll(
          (x as number) ?? 0,
          (y as number) ?? 0,
          (scroll_x as number) ?? 0,
          (scroll_y as number) ?? 0,
        );
        // NOTE(review): this is the only case that records without checking
        // `recording` first — confirm recordAgentReplayStep is a no-op when
        // replay recording is inactive.
        this.v3.recordAgentReplayStep({
          type: "scroll",
          deltaX: Number(scroll_x ?? 0),
          deltaY: Number(scroll_y ?? 0),
          anchor:
            typeof x === "number" && typeof y === "number"
              ? { x: Math.round(x), y: Math.round(y) }
              : undefined,
        });
        return { success: true };
      }
      case "drag": {
        const { path } = action;
        // Only the first and last points of the path are used; a path with
        // fewer than two points is silently treated as a successful no-op.
        if (Array.isArray(path) && path.length >= 2) {
          const start = path[0];
          const end = path[path.length - 1];
          if (recording) {
            const xps = await page.dragAndDrop(start.x, start.y, end.x, end.y, {
              // Step count follows the path length, clamped to [5, 20].
              steps: Math.min(20, Math.max(5, path.length)),
              delay: 10,
              returnXpath: true,
            });
            const [fromXpath, toXpath] = (xps as [string, string]) || ["", ""];
            const from = ensureXPath(fromXpath);
            const to = ensureXPath(toXpath);
            // Both endpoints must resolve for the drag to be recorded.
            if (from && to) {
              const stagehandAction: Action = {
                selector: from,
                description: this.describeDragAction(),
                method: "dragAndDrop",
                arguments: [to],
              };
              this.recordCuaActStep(
                action,
                [stagehandAction],
                stagehandAction.description,
              );
            }
          } else {
            await page.dragAndDrop(start.x, start.y, end.x, end.y, {
              steps: Math.min(20, Math.max(5, path.length)),
              delay: 10,
            });
          }
        }
        return { success: true };
      }
      case "move": {
        const { x, y } = action;
        // Non-numeric coordinates make this a successful no-op.
        if (typeof x === "number" && typeof y === "number") {
          if (recording) {
            const xpath = await page.hover(x, y, { returnXpath: true });
            const normalized = ensureXPath(xpath);
            if (normalized) {
              const stagehandAction: Action = {
                selector: normalized,
                description: this.describePointerAction("hover", x, y),
                method: "hover",
                arguments: [],
              };
              this.recordCuaActStep(
                action,
                [stagehandAction],
                stagehandAction.description,
              );
            }
          } else {
            await page.hover(x, y);
          }
        }
        return { success: true };
      }
      case "wait": {
        // Defaults to one second when no duration is given.
        const time = action?.timeMs ?? 1000;
        await new Promise((r) => setTimeout(r, time));
        if (time > 0 && recording) {
          this.v3.recordAgentReplayStep({ type: "wait", timeMs: Number(time) });
        }
        return { success: true };
      }
      case "screenshot": {
        // No-op - screenshot is captured by captureAndSendScreenshot() after all actions
        return { success: true };
      }
      case "goto": {
        const { url } = action;
        await page.goto(String(url ?? ""), { waitUntil: "load" });
        if (recording) {
          this.v3.recordAgentReplayStep({
            type: "goto",
            url: String(url ?? ""),
          });
        }
        return { success: true };
      }
      case "back": {
        await page.goBack();
        if (recording) {
          this.v3.recordAgentReplayStep({
            type: "back",
          });
        }
        return { success: true };
      }
      case "forward": {
        await page.goForward();
        if (recording) {
          this.v3.recordAgentReplayStep({
            type: "forward",
          });
        }
        return { success: true };
      }
      case "open_web_browser": {
        // Browser is already open, this is a no-op
        return { success: true };
      }
      case "custom_tool": {
        // Custom tools are handled by the agent client directly
        return { success: true };
      }
      default:
        // Unknown types are reported as a failed result rather than thrown.
        this.logger({
          category: "agent",
          message: `Unknown action type: ${String(action.type)}`,
          level: 1,
        });
        return {
          success: false,
          error: `Unknown action ${String(action.type)}`,
        };
    }
  }

  /**
   * Produces a human-readable target for logging an action.
   *
   * Preference order: numeric `(x, y)` coordinates, then the first string
   * among `selector`, `input` and `description`.
   *
   * @param action - The action being logged.
   * @returns The target label, or undefined when none of the fields apply.
   */
  private computePointerTarget(action: AgentAction): string | undefined {
    if (typeof action.x === "number" && typeof action.y === "number") {
      return `(${action.x}, ${action.y})`;
    }

    const textualCandidates = [
      action.selector,
      action.input,
      action.description,
    ];
    for (const candidate of textualCandidates) {
      if (typeof candidate === "string") {
        return candidate;
      }
    }
    return undefined;
  }

  /**
   * Describes a pointer action, appending rounded coordinates when both
   * values convert to finite numbers.
   *
   * @param kind - Action label, e.g. "click" or "hover".
   * @param x - Horizontal coordinate (any value; converted with `Number`).
   * @param y - Vertical coordinate (any value; converted with `Number`).
   * @returns `"<kind> at (<x>, <y>)"`, or just `kind` without usable coordinates.
   */
  private describePointerAction(kind: string, x: unknown, y: unknown): string {
    const px = Number(x);
    const py = Number(y);
    const hasCoordinates = Number.isFinite(px) && Number.isFinite(py);
    if (!hasCoordinates) {
      return kind;
    }
    return `${kind} at (${Math.round(px)}, ${Math.round(py)})`;
  }

  /**
   * Describes a typing action, truncating text longer than 30 characters to
   * its first 27 characters followed by "...".
   *
   * @param text - The text that was typed.
   * @returns A label of the form `type "<text>"`.
   */
  private describeTypeAction(text: string): string {
    let shown = text;
    if (text.length > 30) {
      shown = text.substring(0, 27) + "...";
    }
    return 'type "' + shown + '"';
  }

  /** Returns the fixed description used for recorded drag actions. */
  private describeDragAction(): string {
    const label = "drag and drop";
    return label;
  }

  /**
   * Picks the instruction text for a recorded step: the first non-blank
   * (trimmed) string among the action's `action` and `reasoning` fields,
   * otherwise the supplied fallback.
   *
   * @param agentAction - Action whose `action` / `reasoning` fields are inspected.
   * @param fallback - Text to use when neither field yields non-blank text.
   * @returns The chosen instruction text.
   */
  private buildInstructionFallback(
    agentAction: AgentAction,
    fallback: string,
  ): string {
    for (const candidate of [agentAction.action, agentAction.reasoning]) {
      if (typeof candidate !== "string") {
        continue;
      }
      const trimmed = candidate.trim();
      if (trimmed.length > 0) {
        return trimmed;
      }
    }
    return fallback;
  }

  /**
   * Records an "act" replay step for one agent action.
   *
   * Does nothing for an empty action list. Actions lacking a description
   * inherit the first action's description (or the instruction text).
   *
   * @param agentAction - The originating agent action.
   * @param stagehandActions - Equivalent selector-based actions to record.
   * @param fallback - Instruction text used when the agent action carries none.
   */
  private recordCuaActStep(
    agentAction: AgentAction,
    stagehandActions: Action[],
    fallback: string,
  ): void {
    if (stagehandActions.length === 0) {
      return;
    }

    const instruction = this.buildInstructionFallback(agentAction, fallback);
    const actionDescription = stagehandActions[0]?.description || instruction;

    // Only non-blank reasoning is attached as the step message.
    const reasoning =
      typeof agentAction.reasoning === "string"
        ? agentAction.reasoning.trim()
        : "";

    this.v3.recordAgentReplayStep({
      type: "act",
      instruction,
      actions: stagehandActions.map((step) => ({
        ...step,
        description: step.description || actionDescription,
      })),
      actionDescription,
      message: reasoning.length > 0 ? reasoning : undefined,
    });
  }

  /**
   * Pushes the current viewport size to the agent client (best-effort).
   *
   * Google CUA clients receive the configured viewport (or the fixed
   * 1288x711 used with advanced stealth) for coordinate normalization; all
   * other clients receive the page's actual inner window size. Any failure
   * is ignored.
   */
  private async updateClientViewport(): Promise<void> {
    try {
      if (this.agentClient instanceof GoogleCUAClient) {
        const { width, height } = this.v3.isAdvancedStealth
          ? { width: 1288, height: 711 }
          : this.v3.configuredViewport;
        this.agentClient.setViewport(width, height);
        return;
      }

      // Non-Google clients: measure the live window.
      const page = await this.v3.context.awaitActivePage();
      const size = await page.mainFrame().evaluate<{
        w: number;
        h: number;
      }>("({ w: window.innerWidth, h: window.innerHeight })");
      if (size.w && size.h) {
        this.agentClient.setViewport(size.w, size.h);
      }
    } catch {
      //
    }
  }

  /**
   * Tells the agent client the active page's current URL. Best-effort: any
   * failure is ignored.
   */
  private async updateClientUrl(): Promise<void> {
    try {
      const activePage = await this.v3.context.awaitActivePage();
      this.agentClient.setCurrentUrl(activePage.url());
    } catch {
      //
    }
  }

  /**
   * Takes a viewport-only screenshot of the active page and hands it, with
   * the page URL, to the agent client.
   *
   * @returns whatever the client's `captureScreenshot` resolves to, or `null`
   *   when capturing or sending fails (the error is logged at level 0).
   */
  async captureAndSendScreenshot(): Promise<unknown> {
    this.logger({
      category: "agent",
      message: "Capturing screenshot",
      level: 1,
    });

    try {
      const page = await this.v3.context.awaitActivePage();
      const imageBuffer = await page.screenshot({ fullPage: false });

      // URL is read after the screenshot completes.
      const currentUrl = page.url();
      const base64Image = imageBuffer.toString("base64");
      return await this.agentClient.captureScreenshot({
        base64Image,
        currentUrl,
      });
    } catch (e) {
      const detail = String((e as Error)?.message ?? e);
      this.logger({
        category: "agent",
        message: `Error capturing screenshot: ${detail}`,
        level: 0,
      });
      return null;
    }
  }

  /**
   * Reacts to the outcome of a captcha solve attempt.
   *
   * On `solved`, sets the captcha click guard to 3, adds the "solved" context
   * note and logs. On `errored`, resets the guard to 0, adds the "errored"
   * note and logs. Both flags are handled independently, solved first.
   * A missing result is a no-op.
   */
  private handleCaptchaSolveResult(result?: {
    solved: boolean;
    errored: boolean;
  }): void {
    if (!result) return;

    const outcomes = [
      {
        applies: result.solved,
        guard: 3,
        note: CAPTCHA_SOLVED_MSG,
        logMessage: "Captcha solved — continuing with task",
      },
      {
        applies: result.errored,
        guard: 0,
        note: CAPTCHA_ERRORED_MSG,
        logMessage: "Captcha solver failed or errored",
      },
    ];

    for (const outcome of outcomes) {
      if (!outcome.applies) continue;
      this.captchaClickGuardRemaining = outcome.guard;
      this.agentClient.addContextNote(outcome.note);
      this.logger({
        category: "agent",
        message: outcome.logMessage,
        level: 1,
      });
    }
  }

  /**
   * Decides whether a click should be skipped because it lands on a captcha
   * widget while the captcha click guard is still active.
   *
   * Only applies to `click` actions with numeric `x`/`y` while
   * `captchaClickGuardRemaining` is positive. The page is queried for the
   * bounding boxes of captcha-looking elements (non-zero size) and the click
   * point is tested against them, edges inclusive.
   *
   * @returns `true` when the click point falls inside any such box; `false`
   *   otherwise, including when the page query fails.
   */
  private async shouldSkipSolvedCaptchaInteraction(
    action: AgentAction,
  ): Promise<boolean> {
    if (this.captchaClickGuardRemaining <= 0 || action.type !== "click") {
      return false;
    }

    const { x, y } = action;
    if (typeof x !== "number" || typeof y !== "number") {
      return false;
    }

    try {
      const page = await this.v3.context.awaitActivePage();
      // The callback is executed in the page, so it must stay self-contained.
      const boxes = await page.evaluate<
        Array<{ left: number; top: number; right: number; bottom: number }>
      >(() => {
        const captchaSelectors = [
          'iframe[title*="reCAPTCHA"]',
          'iframe[src*="recaptcha"]',
          'iframe[src*="hcaptcha"]',
          'iframe[src*="turnstile"]',
          ".g-recaptcha",
          "[data-sitekey]",
          '[class*="captcha"]',
          '[id*="captcha"]',
        ];

        const visited = new Set<Element>();
        const rects: Array<{
          left: number;
          top: number;
          right: number;
          bottom: number;
        }> = [];

        captchaSelectors.forEach((selector) => {
          document.querySelectorAll(selector).forEach((element) => {
            // An element can match several selectors; report it once.
            if (visited.has(element)) return;
            visited.add(element);
            const { left, top, right, bottom, width, height } =
              element.getBoundingClientRect();
            if (width <= 0 || height <= 0) return;
            rects.push({ left, top, right, bottom });
          });
        });

        return rects;
      });

      for (const box of boxes) {
        const withinX = x >= box.left && x <= box.right;
        const withinY = y >= box.top && y <= box.bottom;
        if (withinX && withinY) return true;
      }
      return false;
    } catch {
      return false;
    }
  }

  /** Enables the cursor overlay on the active page; failures are ignored. */
  private async injectCursor(): Promise<void> {
    try {
      const activePage = await this.v3.context.awaitActivePage();
      await activePage.enableCursorOverlay();
    } catch {
      // Best-effort only
    }
  }
}


================================================
FILE: packages/core/lib/v3/index.ts
================================================
import * as PublicApi from "./types/public/index.js";
import { V3 } from "./v3.js";
import { AnnotatedScreenshotText, LLMClient } from "./llm/LLMClient.js";
import {
  AgentProvider,
  modelToAgentProviderMap,
} from "./agent/AgentProvider.js";
import {
  validateZodSchema,
  isRunningInBun,
  toGeminiSchema,
  getZodType,
  transformSchema,
  injectUrls,
  providerEnvVarMap,
  loadApiKeyFromEnv,
  trimTrailingTextNode,
  jsonSchemaToZod,
} from "../utils.js";
import { isZod4Schema, isZod3Schema, toJsonSchema } from "./zodCompat.js";
import { connectToMCPServer } from "./mcp/connection.js";
import { V3Evaluator } from "../v3Evaluator.js";
import { tool } from "ai";
import { getAISDKLanguageModel } from "./llm/LLMProvider.js";
import { __internalCreateInMemoryAgentCacheHandle } from "./cache/serverAgentCache.js";
import { maybeRunShutdownSupervisorFromArgv } from "./shutdown/supervisor.js";

export { V3 } from "./v3.js";
export { V3 as Stagehand } from "./v3.js";

export * from "./types/public/index.js";
export { AnnotatedScreenshotText, LLMClient } from "./llm/LLMClient.js";

export {
  AgentProvider,
  modelToAgentProviderMap,
} from "./agent/AgentProvider.js";
export type {
  AgentTools,
  AgentToolTypesMap,
  AgentUITools,
  AgentToolCall,
  AgentToolResult,
} from "./agent/tools/index.js";

export {
  validateZodSchema,
  isRunningInBun,
  toGeminiSchema,
  getZodType,
  transformSchema,
  injectUrls,
  providerEnvVarMap,
  loadApiKeyFromEnv,
  trimTrailingTextNode,
  jsonSchemaToZod,
} from "../utils.js";
export { isZod4Schema, isZod3Schema, toJsonSchema } from "./zodCompat.js";

export { connectToMCPServer } from "./mcp/connection.js";
export { V3Evaluator } from "../v3Evaluator.js";
export { tool } from "ai";
export { getAISDKLanguageModel } from "./llm/LLMProvider.js";
export { __internalCreateInMemoryAgentCacheHandle } from "./cache/serverAgentCache.js";
export { maybeRunShutdownSupervisorFromArgv as __internalMaybeRunShutdownSupervisorFromArgv } from "./shutdown/supervisor.js";
export type { ServerAgentCacheHandle } from "./cache/serverAgentCache.js";

export type {
  ChatMessage,
  ChatMessageContent,
  ChatMessageImageContent,
  ChatMessageTextContent,
  ChatCompletionOptions,
  LLMResponse,
  CreateChatCompletionOptions,
  LLMUsage,
  LLMParsedResponse,
} from "./llm/LLMClient.js";

export type {
  StagehandZodSchema,
  StagehandZodObject,
  InferStagehandSchema,
  JsonSchemaDocument,
} from "./zodCompat.js";

export type { JsonSchema, JsonSchemaProperty } from "../utils.js";

/**
 * Aggregate object used as this module's default export.
 *
 * It spreads everything from the public types module and then adds the same
 * values that are exposed above as named exports, so default-import consumers
 * can reach them as properties. `Stagehand` is an alias of `V3`.
 */
const StagehandDefault = {
  ...PublicApi,
  V3,
  Stagehand: V3,
  AnnotatedScreenshotText,
  LLMClient,
  AgentProvider,
  modelToAgentProviderMap,
  validateZodSchema,
  isRunningInBun,
  toGeminiSchema,
  getZodType,
  transformSchema,
  injectUrls,
  providerEnvVarMap,
  loadApiKeyFromEnv,
  trimTrailingTextNode,
  jsonSchemaToZod,
  isZod4Schema,
  isZod3Schema,
  toJsonSchema,
  connectToMCPServer,
  V3Evaluator,
  tool,
  getAISDKLanguageModel,
  // Internal helpers, exposed under their `__internal`-prefixed names.
  __internalCreateInMemoryAgentCacheHandle,
  __internalMaybeRunShutdownSupervisorFromArgv:
    maybeRunShutdownSupervisorFromArgv,
};

export default StagehandDefault;


================================================
FILE: packages/core/lib/v3/launch/browserbase.ts
================================================
import Browserbase from "@browserbasehq/sdk";
import {
  BrowserbaseSessionNotFoundError,
  StagehandInitError,
} from "../types/public/sdkErrors.js";
import type { BrowserbaseSessionCreateParams } from "../types/public/api.js";
import { getEnvTimeoutMs, withTimeout } from "../timeoutConfig.js";

/**
 * Resumes or creates a Browserbase session and returns how to connect to it.
 *
 * When `resumeSessionId` is given, the session is retrieved and its
 * `connectUrl` is returned. Otherwise a new session is created from `params`
 * with a default 1288x711 viewport (unless one is supplied) and
 * `userMetadata.stagehand = "true"`. `params.projectId` takes precedence over
 * the `projectId` argument. Both API calls are bounded by the
 * `BROWSERBASE_SESSION_CREATE_MAX_MS` timeout setting.
 *
 * @returns the websocket connect URL, the session id and the SDK client.
 * @throws BrowserbaseSessionNotFoundError when the resumed session has no id.
 * @throws StagehandInitError when a connect URL (or, on create, an id) is missing.
 */
export async function createBrowserbaseSession(
  apiKey: string,
  projectId?: string,
  params?: BrowserbaseSessionCreateParams,
  resumeSessionId?: string,
): Promise<{ ws: string; sessionId: string; bb: Browserbase }> {
  const bb = new Browserbase({ apiKey });
  const timeoutMs = getEnvTimeoutMs("BROWSERBASE_SESSION_CREATE_MAX_MS");

  // --- Resume path ---------------------------------------------------------
  if (resumeSessionId) {
    const retrieved = (await withTimeout(
      bb.sessions.retrieve(resumeSessionId),
      timeoutMs,
      "Browserbase session retrieve",
    )) as unknown as {
      id: string;
      connectUrl?: string;
      status?: string;
    };

    if (!retrieved?.id) {
      throw new BrowserbaseSessionNotFoundError();
    }
    if (!retrieved.connectUrl) {
      throw new StagehandInitError(
        `Browserbase session resume missing connectUrl for ${resumeSessionId}`,
      );
    }
    return { ws: retrieved.connectUrl, sessionId: resumeSessionId, bb };
  }

  // --- Create path ---------------------------------------------------------
  const {
    projectId: paramsProjectId,
    browserSettings,
    userMetadata,
    ...passthrough
  } = params ?? {};

  const effectiveProjectId = paramsProjectId ?? projectId;
  const viewport = browserSettings?.viewport ?? { width: 1288, height: 711 };

  // `satisfies` keeps BrowserbaseSessionCreateParamsSchema in sync with the SDK type.
  const createPayload = {
    ...(effectiveProjectId ? { projectId: effectiveProjectId } : {}),
    ...passthrough,
    browserSettings: {
      ...(browserSettings ?? {}),
      viewport,
    },
    userMetadata: {
      ...(userMetadata ?? {}),
      stagehand: "true",
    },
  } satisfies Browserbase.Sessions.SessionCreateParams;

  const created = (await withTimeout(
    bb.sessions.create(createPayload),
    timeoutMs,
    "Browserbase session create",
  )) as unknown as { id: string; connectUrl: string };

  const hasExpectedShape = Boolean(created?.connectUrl && created?.id);
  if (!hasExpectedShape) {
    throw new StagehandInitError(
      "Browserbase session creation returned an unexpected shape.",
    );
  }

  return { ws: created.connectUrl, sessionId: created.id, bb };
}


================================================
FILE: packages/core/lib/v3/launch/local.ts
================================================
import { launch, LaunchedChrome } from "chrome-launcher";
import WebSocket from "ws";
import { ConnectionTimeoutError } from "../types/public/sdkErrors.js";

/** Options accepted by `launchLocalChrome`. */
interface LaunchLocalOptions {
  /** Chrome executable path, forwarded to chrome-launcher. */
  chromePath?: string;
  /** Extra Chrome flags, appended after the built-in defaults. */
  chromeFlags?: string[];
  /** When true, `--headless=new` is added. Defaults to false. */
  headless?: boolean;
  /** User data directory, forwarded to chrome-launcher. */
  userDataDir?: string;
  /** Remote debugging port, forwarded to chrome-launcher. */
  port?: number;
  /** Overall budget for launching and connecting, in ms. Defaults to 15000. */
  connectTimeoutMs?: number;
  /** Forwarded to chrome-launcher's `handleSIGINT` option. */
  handleSIGINT?: boolean;
}

/**
 * Launches a local Chrome via chrome-launcher and waits until its CDP
 * websocket endpoint is discoverable and accepting connections.
 *
 * A single deadline (`connectTimeoutMs`, default 15s) covers the launch
 * polling, endpoint discovery and the websocket readiness probe.
 *
 * If either readiness wait fails, the launched Chrome process is killed
 * before the error is rethrown: the caller never receives the handle in that
 * case, so nothing else could clean the process up.
 *
 * @param opts launch options; see `LaunchLocalOptions`.
 * @returns the websocket debugger URL and the chrome-launcher handle.
 * @throws ConnectionTimeoutError when the endpoint does not become ready in time.
 */
export async function launchLocalChrome(
  opts: LaunchLocalOptions,
): Promise<{ ws: string; chrome: LaunchedChrome }> {
  const connectTimeoutMs = opts.connectTimeoutMs ?? 15_000;
  const deadlineMs = Date.now() + connectTimeoutMs;
  const connectionPollInterval = 250;
  // Give chrome-launcher roughly the same budget as our own deadline.
  const maxConnectionRetries = Math.max(
    1,
    Math.ceil(connectTimeoutMs / connectionPollInterval),
  );
  const headless = opts.headless ?? false;
  const chromeFlags = [
    headless ? "--headless=new" : undefined,
    "--remote-allow-origins=*",
    "--no-first-run",
    "--no-default-browser-check",
    "--disable-dev-shm-usage",
    "--site-per-process",
    ...(opts.chromeFlags ?? []),
  ].filter((f): f is string => typeof f === "string");

  const chrome = await launch({
    chromePath: opts.chromePath,
    chromeFlags,
    port: opts.port,
    userDataDir: opts.userDataDir,
    handleSIGINT: opts.handleSIGINT,
    connectionPollInterval,
    maxConnectionRetries,
  });

  try {
    const ws = await waitForWebSocketDebuggerUrl(chrome.port, deadlineMs);
    await waitForWebSocketReady(ws, deadlineMs);
    return { ws, chrome };
  } catch (error) {
    // Do not leak the browser process when it never became reachable.
    try {
      chrome.kill();
    } catch {
      // best-effort cleanup; surface the original failure below
    }
    throw error;
  }
}

/**
 * Polls Chrome's `/json/version` endpoint on the given local port until it
 * reports a `webSocketDebuggerUrl`, or the deadline passes.
 *
 * Each request is bounded by an abort timeout (at most 2s, never below 200ms)
 * so a hung connection cannot outlive the deadline indefinitely, and the
 * pause between attempts never sleeps past the deadline.
 *
 * @param port remote debugging port Chrome is listening on.
 * @param deadlineMs absolute deadline as a `Date.now()`-style timestamp.
 * @returns the websocket debugger URL.
 * @throws ConnectionTimeoutError when no URL was obtained before the deadline;
 *   the message includes the last observed error, if any.
 */
async function waitForWebSocketDebuggerUrl(
  port: number,
  deadlineMs: number,
): Promise<string> {
  const pollIntervalMs = 250;
  let lastErrMsg = "";

  while (Date.now() < deadlineMs) {
    const requestBudgetMs = Math.min(
      2_000,
      Math.max(200, deadlineMs - Date.now()),
    );
    try {
      const resp = await fetch(`http://127.0.0.1:${port}/json/version`, {
        signal: AbortSignal.timeout(requestBudgetMs),
      });
      if (resp.ok) {
        const json = (await resp.json()) as unknown;
        const url = (json as { webSocketDebuggerUrl?: unknown } | null)
          ?.webSocketDebuggerUrl;
        if (typeof url === "string") return url;
        lastErrMsg = "response did not include webSocketDebuggerUrl";
      } else {
        lastErrMsg = `${resp.status} ${resp.statusText}`;
      }
    } catch (err) {
      lastErrMsg = err instanceof Error ? err.message : String(err);
    }

    const sleepMs = Math.min(pollIntervalMs, deadlineMs - Date.now());
    if (sleepMs <= 0) break;
    await new Promise((r) => setTimeout(r, sleepMs));
  }

  throw new ConnectionTimeoutError(
    `Timed out waiting for /json/version on port ${port}${
      lastErrMsg ? ` (last error: ${lastErrMsg})` : ""
    }`,
  );
}

/**
 * Repeatedly probes the CDP websocket until a connection can be opened or
 * the deadline passes.
 *
 * Each probe gets between 200ms and 2s depending on the time remaining;
 * failed probes are followed by a 100ms pause.
 *
 * @param wsUrl websocket URL to probe.
 * @param deadlineMs absolute deadline as a `Date.now()`-style timestamp.
 * @throws ConnectionTimeoutError when no probe succeeded before the deadline;
 *   the message includes the last probe error, if any.
 */
async function waitForWebSocketReady(
  wsUrl: string,
  deadlineMs: number,
): Promise<void> {
  let lastFailure = "";

  while (deadlineMs > Date.now()) {
    const timeLeftMs = deadlineMs - Date.now();
    const probeBudgetMs = Math.min(2_000, Math.max(200, timeLeftMs));
    try {
      await probeWebSocket(wsUrl, probeBudgetMs);
    } catch (probeError) {
      lastFailure =
        probeError instanceof Error ? probeError.message : String(probeError);
      await new Promise((wake) => setTimeout(wake, 100));
      continue;
    }
    return;
  }

  const suffix = lastFailure ? ` (last error: ${lastFailure})` : "";
  throw new ConnectionTimeoutError(
    `Timed out waiting for CDP websocket to accept connections at ${wsUrl}${suffix}`,
  );
}

/**
 * Opens a throwaway websocket to `wsUrl` and settles on the first of:
 * the socket opening (resolve), a socket error (reject with that error), or
 * `timeoutMs` elapsing (reject with a timeout error). The socket is always
 * terminated once the outcome is known.
 */
function probeWebSocket(wsUrl: string, timeoutMs: number): Promise<void> {
  return new Promise<void>((resolve, reject) => {
    const socket = new WebSocket(wsUrl);
    let done = false;

    // Hoisted so the timer and both listeners can share it; only the first call counts.
    function settle(failure?: unknown): void {
      if (done) return;
      done = true;
      clearTimeout(timeoutHandle);
      try {
        socket.terminate();
      } catch {
        // best-effort cleanup
      }
      if (failure) {
        reject(failure);
      } else {
        resolve();
      }
    }

    const timeoutHandle = setTimeout(() => {
      settle(new Error(`websocket probe timeout after ${timeoutMs}ms`));
    }, timeoutMs);

    socket.once("open", () => settle());
    socket.once("error", (socketError) => settle(socketError));
  });
}


================================================
FILE: packages/core/lib/v3/llm/AnthropicClient.ts
================================================
import Anthropic, { ClientOptions } from "@anthropic-ai/sdk";
import {
  ImageBlockParam,
  MessageParam,
  TextBlockParam,
  Tool,
} from "@anthropic-ai/sdk/resources";
import { LogLine } from "../types/public/logs.js";
import {
  AnthropicJsonSchemaObject,
  AvailableModel,
} from "../types/public/model.js";
import {
  CreateChatCompletionOptions,
  LLMClient,
  LLMResponse,
} from "./LLMClient.js";
import { CreateChatCompletionResponseError } from "../types/public/sdkErrors.js";
import { toJsonSchema } from "../zodCompat.js";

/**
 * LLM client backed by the Anthropic Messages API.
 *
 * Converts the project's chat-completion options into an Anthropic request
 * and converts the reply back into the `LLMResponse` shape. Structured output
 * (`response_model`) is obtained by offering the model a
 * `print_extracted_data` tool whose input schema is the requested schema.
 */
export class AnthropicClient extends LLMClient {
  public type = "anthropic" as const;
  private client: Anthropic;
  declare public clientOptions: ClientOptions;

  /**
   * @param modelName model identifier sent to Anthropic.
   * @param clientOptions options passed straight to the Anthropic SDK client.
   * @param userProvidedInstructions stored on the instance.
   */
  constructor({
    modelName,
    clientOptions,
    userProvidedInstructions,
  }: {
    logger: (message: LogLine) => void;
    modelName: AvailableModel;
    clientOptions?: ClientOptions;
    userProvidedInstructions?: string;
  }) {
    super(modelName);
    this.client = new Anthropic(clientOptions);
    this.modelName = modelName;
    this.clientOptions = clientOptions;
    this.userProvidedInstructions = userProvidedInstructions;
  }

  /**
   * Sends one chat completion request.
   *
   * @returns without `options.response_model`: the transformed `LLMResponse`.
   *   With `options.response_model`: `{ data, usage }` where `data` is the
   *   input of the first tool-use block in the reply.
   * @throws CreateChatCompletionResponseError when a response model was
   *   requested and, after up to 5 retries, the reply still has no tool use.
   */
  async createChatCompletion<T = LLMResponse>({
    options,
    retries,
    logger,
  }: CreateChatCompletionOptions): Promise<T> {
    // Log the request without the image payload.
    const optionsWithoutImage = { ...options };
    delete optionsWithoutImage.image;

    logger({
      category: "anthropic",
      message: "creating chat completion",
      level: 2,
      auxiliary: {
        options: {
          value: JSON.stringify(optionsWithoutImage),
          type: "object",
        },
      },
    });

    // The system prompt is sent separately from the message list: take the
    // first system message whose content is a string or contains no images.
    const systemMessage = options.messages.find((msg) => {
      if (msg.role === "system") {
        if (typeof msg.content === "string") {
          return true;
        } else if (Array.isArray(msg.content)) {
          return msg.content.every((content) => content.type !== "image_url");
        }
      }
      return false;
    });

    // Every system message is excluded from the conversation messages.
    const userMessages = options.messages.filter(
      (msg) => msg.role !== "system",
    );

    const formattedMessages: MessageParam[] = userMessages.map((msg) => {
      if (typeof msg.content === "string") {
        return {
          role: msg.role as "user" | "assistant", // ensure its not checking for system types
          content: msg.content,
        };
      } else {
        return {
          role: msg.role as "user" | "assistant",
          content: msg.content.map((content) => {
            if ("image_url" in content) {
              // NOTE(review): the URL is passed as base64 JPEG data as-is —
              // presumably callers supply raw base64 here; confirm.
              const formattedContent: ImageBlockParam = {
                type: "image",
                source: {
                  type: "base64",
                  media_type: "image/jpeg",
                  data: content.image_url.url,
                },
              };

              return formattedContent;
            } else {
              return { type: "text", text: content.text };
            }
          }),
        };
      }
    });

    // An explicit image is appended as a trailing user message, optionally
    // followed by its description.
    if (options.image) {
      const screenshotMessage: MessageParam = {
        role: "user",
        content: [
          {
            type: "image",
            source: {
              type: "base64",
              media_type: "image/jpeg",
              data: options.image.buffer.toString("base64"),
            },
          },
        ],
      };
      if (
        options.image.description &&
        Array.isArray(screenshotMessage.content)
      ) {
        screenshotMessage.content.push({
          type: "text",
          text: options.image.description,
        });
      }

      formattedMessages.push(screenshotMessage);
    }

    // Caller-supplied tools; stays undefined when none were given.
    let anthropicTools: Tool[] = options.tools?.map((tool) => {
      return {
        name: tool.name,
        description: tool.description,
        input_schema: {
          type: "object",
          properties: tool.parameters.properties,
          required: tool.parameters.required,
        },
      };
    });

    // Structured output: expose the response schema as a tool for the model to call.
    let toolDefinition: Tool | undefined;
    if (options.response_model) {
      const jsonSchema = toJsonSchema(options.response_model.schema);
      const { properties: schemaProperties, required: schemaRequired } =
        extractSchemaProperties(jsonSchema);

      toolDefinition = {
        name: "print_extracted_data",
        description: "Prints the extracted data based on the provided schema.",
        input_schema: {
          type: "object",
          properties: schemaProperties,
          required: schemaRequired,
        },
      };
    }

    if (toolDefinition) {
      anthropicTools = anthropicTools ?? [];
      anthropicTools.push(toolDefinition);
    }

    const response = await this.client.messages.create({
      model: this.modelName,
      // Falls back to 8192 when no (or a zero) output limit is given.
      max_tokens: options.maxOutputTokens || 8192,
      messages: formattedMessages,
      tools: anthropicTools,
      system: systemMessage
        ? (systemMessage.content as string | TextBlockParam[]) // we can cast because we already filtered out image content
        : undefined,
      temperature: options.temperature,
    });

    logger({
      category: "anthropic",
      message: "response",
      level: 2,
      auxiliary: {
        response: {
          value: JSON.stringify(response),
          type: "object",
        },
        requestId: {
          value: options.requestId,
          type: "string",
        },
      },
    });

    // We'll compute usage data from the response
    const usageData = {
      prompt_tokens: response.usage.input_tokens,
      completion_tokens: response.usage.output_tokens,
      total_tokens: response.usage.input_tokens + response.usage.output_tokens,
    };

    // Reshape the reply: first text block becomes the message content and
    // every tool_use block becomes a function-style tool call.
    const transformedResponse: LLMResponse = {
      id: response.id,
      object: "chat.completion",
      created: Date.now(),
      model: response.model,
      choices: [
        {
          index: 0,
          message: {
            role: "assistant",
            content:
              response.content.find((c) => c.type === "text")?.text || null,
            tool_calls: response.content
              .filter((c) => c.type === "tool_use")
              .map((toolUse) => ({
                id: toolUse.id,
                type: "function",
                function: {
                  name: toolUse.name,
                  arguments: JSON.stringify(toolUse.input),
                },
              })),
          },
          finish_reason: response.stop_reason,
        },
      ],
      usage: usageData,
    };

    logger({
      category: "anthropic",
      message: "transformed response",
      level: 2,
      auxiliary: {
        transformedResponse: {
          value: JSON.stringify(transformedResponse),
          type: "object",
        },
        requestId: {
          value: options.requestId,
          type: "string",
        },
      },
    });

    if (options.response_model) {
      // The first tool_use block's input is taken as the extracted data.
      const toolUse = response.content.find((c) => c.type === "tool_use");
      if (toolUse && "input" in toolUse) {
        const result = toolUse.input;

        const finalParsedResponse = {
          data: result,
          usage: usageData,
        } as unknown as T;

        return finalParsedResponse;
      } else {
        // No tool use in the reply: re-issue the same request, up to 5 retries.
        if (!retries || retries < 5) {
          return this.createChatCompletion({
            options,
            logger,
            retries: (retries ?? 0) + 1,
          });
        }
        logger({
          category: "anthropic",
          message: "error creating chat completion",
          level: 0,
          auxiliary: {
            requestId: {
              value: options.requestId,
              type: "string",
            },
          },
        });
        throw new CreateChatCompletionResponseError(
          "No tool use with input in response",
        );
      }
    }

    // if the function was called with a response model, it would have returned earlier
    // so we can safely cast here to T, which defaults to LLMResponse
    return transformedResponse as T;
  }
}

/**
 * Pulls `properties` and `required` from a JSON schema, reading them from
 * `definitions.MySchema` when that definition exists and from the schema
 * root otherwise.
 */
const extractSchemaProperties = (jsonSchema: AnthropicJsonSchemaObject) => {
  const { properties, required } =
    jsonSchema.definitions?.MySchema || jsonSchema;
  return { properties, required };
};


================================================
FILE: packages/core/lib/v3/llm/CerebrasClient.ts
================================================
import OpenAI from "openai";
import type { ClientOptions } from "openai";
import { LogLine } from "../types/public/logs.js";
import { AvailableModel } from "../types/public/model.js";
import {
  ChatMessage,
  CreateChatCompletionOptions,
  LLMClient,
  LLMResponse,
} from "./LLMClient.js";
import { CreateChatCompletionResponseError } from "../types/public/sdkErrors.js";
import { toJsonSchema } from "../zodCompat.js";

/**
 * LLM client for Cerebras, talking to its API through the OpenAI SDK pointed
 * at the Cerebras base URL.
 *
 * Only text is sent: for array-valued message content just the first text
 * part is used. Structured output (`response_model`) is requested through a
 * `print_extracted_data` tool plus an explicit JSON instruction, and parsed
 * from the tool call arguments or, failing that, from the message content.
 */
export class CerebrasClient extends LLMClient {
  public type = "cerebras" as const;
  private client: OpenAI;
  declare public clientOptions: ClientOptions;
  public hasVision = false;

  /**
   * @param modelName model identifier; the part after `cerebras-` is sent to the API.
   * @param clientOptions OpenAI SDK client options. May override the default
   *   Cerebras `baseURL`. When `apiKey` is missing or empty, the
   *   `CEREBRAS_API_KEY` environment variable is used.
   * @param userProvidedInstructions forwarded to the base class.
   */
  constructor({
    modelName,
    clientOptions,
    userProvidedInstructions,
  }: {
    logger: (message: LogLine) => void;
    modelName: AvailableModel;
    clientOptions?: ClientOptions;
    userProvidedInstructions?: string;
  }) {
    super(modelName, userProvidedInstructions);

    // Create OpenAI client with the base URL set to Cerebras API.
    // `apiKey` is resolved after the spread so that an explicitly undefined
    // `clientOptions.apiKey` cannot wipe out the environment fallback.
    this.client = new OpenAI({
      baseURL: "https://api.cerebras.ai/v1",
      ...clientOptions,
      apiKey: clientOptions?.apiKey || process.env.CEREBRAS_API_KEY,
    });

    this.modelName = modelName;
    this.clientOptions = clientOptions;
  }

  /** Extracts a printable message from an arbitrary thrown value. */
  private static describeError(err: unknown): string {
    return err instanceof Error ? err.message : String(err);
  }

  /**
   * Sends one chat completion request.
   *
   * @returns without `options.response_model`: the `LLMResponse`. With it:
   *   `{ data, usage }` where `data` is the JSON parsed from the first tool
   *   call's arguments, or else from the first `{...}` span in the content.
   * @throws CreateChatCompletionResponseError when a response model was
   *   requested and no JSON could be parsed after up to 5 retries. API errors
   *   are logged and rethrown.
   */
  async createChatCompletion<T = LLMResponse>({
    options,
    retries,
    logger,
  }: CreateChatCompletionOptions): Promise<T> {
    // Log the request without the image payload.
    const optionsWithoutImage = { ...options };
    delete optionsWithoutImage.image;

    logger({
      category: "cerebras",
      message: "creating chat completion",
      level: 2,
      auxiliary: {
        options: {
          value: JSON.stringify(optionsWithoutImage),
          type: "object",
        },
      },
    });

    // Format messages for Cerebras API (using OpenAI format)
    const formattedMessages = options.messages.map((msg: ChatMessage) => {
      const baseMessage = {
        content:
          typeof msg.content === "string"
            ? msg.content
            : Array.isArray(msg.content) &&
                msg.content.length > 0 &&
                "text" in msg.content[0]
              ? msg.content[0].text
              : "",
      };

      // Cerebras only supports system, user, and assistant roles
      if (msg.role === "system") {
        return { ...baseMessage, role: "system" as const };
      } else if (msg.role === "assistant") {
        return { ...baseMessage, role: "assistant" as const };
      } else {
        // Default to user for any other role
        return { ...baseMessage, role: "user" as const };
      }
    });

    // Format tools if provided
    let tools = options.tools?.map((tool) => ({
      type: "function" as const,
      function: {
        name: tool.name,
        description: tool.description,
        parameters: {
          type: "object",
          properties: tool.parameters.properties,
          required: tool.parameters.required,
        },
      },
    }));

    // Add response model as a tool if provided
    if (options.response_model) {
      const jsonSchema = toJsonSchema(options.response_model.schema) as {
        properties?: Record<string, unknown>;
        required?: string[];
      };
      const schemaProperties = jsonSchema.properties || {};
      const schemaRequired = jsonSchema.required || [];

      const responseTool = {
        type: "function" as const,
        function: {
          name: "print_extracted_data",
          description:
            "Prints the extracted data based on the provided schema.",
          parameters: {
            type: "object",
            properties: schemaProperties,
            required: schemaRequired,
          },
        },
      };

      tools = tools ? [...tools, responseTool] : [responseTool];
    }

    // The API expects the model name without the "cerebras-" prefix.
    const cerebrasModel = this.modelName.split("cerebras-")[1];

    try {
      // Use OpenAI client with Cerebras API
      const apiResponse = await this.client.chat.completions.create({
        model: cerebrasModel,
        messages: [
          ...formattedMessages,
          // Add explicit instruction to return JSON if we have a response model
          ...(options.response_model
            ? [
                {
                  role: "system" as const,
                  content: `IMPORTANT: Your response must be valid JSON that matches this schema: ${JSON.stringify(
                    options.response_model.schema,
                  )}`,
                },
              ]
            : []),
        ],
        // `??` so an explicit temperature of 0 is honoured; 0.7 only applies
        // when no temperature was given.
        temperature: options.temperature ?? 0.7,
        max_tokens: options.maxOutputTokens,
        tools: tools,
        tool_choice: options.tool_choice || "auto",
      });

      // Format the response to match the expected LLMResponse format
      const response: LLMResponse = {
        id: apiResponse.id,
        object: "chat.completion",
        created: Date.now(),
        model: cerebrasModel,
        choices: [
          {
            index: 0,
            message: {
              role: "assistant",
              content: apiResponse.choices[0]?.message?.content || null,
              tool_calls: apiResponse.choices[0]?.message?.tool_calls || [],
            },
            finish_reason: apiResponse.choices[0]?.finish_reason || "stop",
          },
        ],
        usage: {
          prompt_tokens: apiResponse.usage?.prompt_tokens || 0,
          completion_tokens: apiResponse.usage?.completion_tokens || 0,
          total_tokens: apiResponse.usage?.total_tokens || 0,
        },
      };

      logger({
        category: "cerebras",
        message: "response",
        level: 2,
        auxiliary: {
          response: {
            value: JSON.stringify(response),
            type: "object",
          },
          requestId: {
            value: options.requestId,
            type: "string",
          },
        },
      });

      // If we have no response model, just return the entire LLMResponse
      if (!options.response_model) {
        return response as T;
      }

      // If we have a response model, parse JSON from tool calls or content
      const toolCall = response.choices[0]?.message?.tool_calls?.[0];
      if (toolCall?.function?.arguments) {
        try {
          const result = JSON.parse(toolCall.function.arguments);
          const finalResponse = {
            data: result,
            usage: response.usage,
          };
          return finalResponse as T;
        } catch (e) {
          // Fall through to the content-based parse (and then the retry) below.
          logger({
            category: "cerebras",
            message: "failed to parse tool call arguments as JSON, retrying",
            level: 0,
            auxiliary: {
              error: {
                value: CerebrasClient.describeError(e),
                type: "string",
              },
            },
          });
        }
      }

      // If we have content but no tool calls, try to parse the content as JSON
      const content = response.choices[0]?.message?.content;
      if (content) {
        try {
          // Greedy match: from the first "{" to the last "}" in the content.
          const jsonMatch = content.match(/\{[\s\S]*\}/);
          if (jsonMatch) {
            const result = JSON.parse(jsonMatch[0]);
            const finalResponse = {
              data: result,
              usage: response.usage,
            };
            return finalResponse as T;
          }
        } catch (e) {
          logger({
            category: "cerebras",
            message: "failed to parse content as JSON",
            level: 0,
            auxiliary: {
              error: {
                value: CerebrasClient.describeError(e),
                type: "string",
              },
            },
          });
        }
      }

      // If we still haven't found valid JSON and have retries left, try again
      if (!retries || retries < 5) {
        return this.createChatCompletion({
          options,
          logger,
          retries: (retries ?? 0) + 1,
        });
      }

      throw new CreateChatCompletionResponseError("Invalid response schema");
    } catch (error) {
      logger({
        category: "cerebras",
        message: "error creating chat completion",
        level: 0,
        auxiliary: {
          error: {
            value: CerebrasClient.describeError(error),
            type: "string",
          },
          requestId: {
            value: options.requestId,
            type: "string",
          },
        },
      });
      throw error;
    }
  }
}


================================================
FILE: packages/core/lib/v3/llm/GoogleClient.ts
================================================
import {
  GoogleGenAI,
  HarmCategory,
  HarmBlockThreshold,
  Content,
  Part,
  Tool,
  FunctionCall,
  Schema,
  Type,
} from "@google/genai";

import { LogLine } from "../types/public/logs.js";
import { AvailableModel, ClientOptions } from "../types/public/model.js";
import {
  validateZodSchema,
  toGeminiSchema,
  loadApiKeyFromEnv,
} from "../../utils.js";
import {
  ChatCompletionOptions,
  ChatMessage,
  CreateChatCompletionOptions,
  LLMClient,
  LLMResponse,
  AnnotatedScreenshotText,
} from "./LLMClient.js";
import {
  CreateChatCompletionResponseError,
  StagehandError,
} from "../types/public/sdkErrors.js";

/**
 * Translates the project's chat roles into the role names used for Gemini.
 * "system" is mapped to "user": the Gemini API prefers system instructions
 * either via system_instruction or at the start of 'user' content.
 */
const roleMap: Record<ChatMessage["role"], string> = {
  user: "user",
  assistant: "model",
  system: "user",
};

// Default safety configuration sent with every request: each listed harm
// category is blocked at medium severity and above. Adjust as needed.
const safetySettings = [
  HarmCategory.HARM_CATEGORY_HARASSMENT,
  HarmCategory.HARM_CATEGORY_HATE_SPEECH,
  HarmCategory.HARM_CATEGORY_SEXUALLY_EXPLICIT,
  HarmCategory.HARM_CATEGORY_DANGEROUS_CONTENT,
].map((category) => ({
  category,
  threshold: HarmBlockThreshold.BLOCK_MEDIUM_AND_ABOVE,
}));

/**
 * LLM client that talks to Gemini models through the `@google/genai` SDK and
 * adapts requests/responses to the project's `LLMClient` contract.
 */
export class GoogleClient extends LLMClient {
  public type = "google" as const;
  private client: GoogleGenAI;
  declare public clientOptions: ClientOptions;
  declare public hasVision: boolean;
  private logger: (message: LogLine) => void;

  /**
   * @param logger - Sink for log lines emitted by this client.
   * @param modelName - Model identifier forwarded to the Gemini API.
   * @param clientOptions - Optional client settings. When no `apiKey` is
   *   present, one is loaded via `loadApiKeyFromEnv("google_legacy", logger)`.
   */
  constructor({
    logger,
    modelName,
    clientOptions,
  }: {
    logger: (message: LogLine) => void;
    modelName: AvailableModel;
    clientOptions?: ClientOptions; // Expecting { apiKey: string } here
  }) {
    super(modelName);
    // Work on a copy: `clientOptions` is optional, so assigning the fallback
    // key directly onto it would throw when it is undefined, and would
    // otherwise mutate the caller's object.
    const resolvedOptions: ClientOptions = { ...clientOptions };
    if (!resolvedOptions.apiKey) {
      resolvedOptions.apiKey = loadApiKeyFromEnv("google_legacy", logger);
    }
    this.clientOptions = resolvedOptions;
    this.client = new GoogleGenAI({ apiKey: resolvedOptions.apiKey });
    this.modelName = modelName;
    this.logger = logger;
    // Determine vision capability based on model name (adjust as needed)
    this.hasVision =
      modelName.includes("vision") || modelName.includes("gemini-1.5"); // Example logic
  }

  /**
   * Converts the project's `ChatMessage[]` into Gemini `Content[]`.
   *
   * String-content system messages are concatenated and folded into the first
   * emitted user message; if none absorbs them, they are inserted as a leading
   * user message. When `image` is given and the last message is a user
   * message, the image (preceded by its description) is appended to it.
   *
   * @param messages - Conversation to convert.
   * @param image - Optional screenshot to attach to the last user message.
   * @returns The Gemini-formatted conversation.
   */
  private formatMessages(
    messages: ChatMessage[],
    image?: ChatCompletionOptions["image"],
  ): Content[] {
    const contents: Content[] = [];
    let systemInstruction: string | null = null;

    messages.forEach((msg, index) => {
      const role = roleMap[msg.role];
      if (!role) {
        this.logger({
          category: "google",
          message: `WARNING: Unsupported role: ${msg.role}`,
          level: 1,
        });
        return; // Skip unsupported roles
      }

      // System messages are accumulated and merged into a user message later.
      if (msg.role === "system") {
        if (typeof msg.content === "string") {
          systemInstruction =
            (systemInstruction ? systemInstruction + "\n\n" : "") + msg.content;
        }
        return; // Don't add system messages directly to contents yet
      }

      const parts: Part[] = [];

      if (Array.isArray(msg.content)) {
        msg.content.forEach((partContent) => {
          if (partContent.type === "text") {
            parts.push({ text: partContent.text });
          } else if (partContent.type === "image_url") {
            if ("image_url" in partContent && partContent.image_url?.url) {
              // Assuming base64 data URI format: data:[<mediatype>];base64,<data>
              const base64Data = partContent.image_url.url.split(",")[1];
              const mimeTypeMatch = partContent.image_url.url.match(
                /^data:(image\/\w+);base64,/,
              );
              if (base64Data && mimeTypeMatch) {
                parts.push({
                  inlineData: { mimeType: mimeTypeMatch[1], data: base64Data },
                });
              } else {
                this.logger({
                  category: "google",
                  message: "WARNING: Could not parse image data URI format",
                  level: 1,
                });
              }
            }
          }
        });
      } else if (typeof msg.content === "string") {
        parts.push({ text: msg.content });
      }

      // Add image from options if this is the last message and it's a user message
      if (image && index === messages.length - 1 && msg.role === "user") {
        const imageDesc = image.description || AnnotatedScreenshotText;
        parts.push({ text: imageDesc }); // Add description first
        parts.push({
          inlineData: {
            mimeType: "image/jpeg", // Assuming JPEG, adjust if needed
            data: image.buffer.toString("base64"),
          },
        });
      }

      // Apply system instruction to the first emitted message if it is a user message
      if (systemInstruction && contents.length === 0 && role === "user") {
        const firstPartText = parts.find((p) => "text" in p);
        if (firstPartText && "text" in firstPartText) {
          firstPartText.text = `${systemInstruction}\n\n${firstPartText.text}`;
        } else {
          parts.unshift({ text: systemInstruction });
        }
        systemInstruction = null; // Clear after applying
      }

      if (parts.length > 0) {
        contents.push({ role, parts });
      }
    });

    // If the system instruction was never merged into a user message, insert
    // it as the leading user message so it still precedes the conversation.
    if (systemInstruction) {
      contents.unshift({ role: "user", parts: [{ text: systemInstruction }] });
    }

    return contents;
  }

  /**
   * Converts the project's tool definitions into a single Gemini `Tool`
   * holding one function declaration per tool.
   *
   * @param tools - Tool definitions from the completion options.
   * @returns A one-element `Tool[]`, or `undefined` when no tools are given.
   */
  private formatTools(
    tools?: ChatCompletionOptions["tools"],
  ): Tool[] | undefined {
    if (!tools || tools.length === 0) {
      return undefined;
    }

    return [
      {
        functionDeclarations: tools.map((tool) => {
          let parameters: Schema | undefined = undefined;
          if (tool.parameters) {
            parameters = {
              type: Type.OBJECT,
              properties: tool.parameters.properties as {
                [key: string]: Schema;
              },
              required: tool.parameters.required as string[] | undefined,
            };
          }
          return {
            name: tool.name,
            description: tool.description,
            parameters: parameters,
          };
        }),
      },
    ];
  }

  /**
   * Sends a chat completion request to Gemini.
   *
   * Without `response_model`, resolves to an `LLMResponse`-shaped object.
   * With `response_model`, the text response is parsed as JSON, validated
   * with `validateZodSchema`, and `{ data, usage }` is returned instead.
   *
   * @param options - Messages, tools, sampling settings and optional schema.
   * @param logger - Sink for log lines emitted during this call.
   * @param retries - Remaining retry attempts (default 3). A retry is made on
   *   a thrown request error (after a linear backoff), on a JSON parse
   *   failure, and on a schema validation failure.
   * @throws CreateChatCompletionResponseError when the JSON response cannot be
   *   parsed and no retries remain.
   * @throws StagehandError when the request fails and no retries remain.
   */
  async createChatCompletion<T = LLMResponse>({
    // Ensure LLMResponse is compatible
    options,
    logger,
    retries = 3,
  }: CreateChatCompletionOptions): Promise<T> {
    const {
      image,
      requestId,
      response_model,
      tools,
      temperature,
      top_p,
      maxOutputTokens,
    } = options;

    const formattedMessages = this.formatMessages(options.messages, image);
    const formattedTools = this.formatTools(tools);

    // Structured output is requested from the API only when a schema is given.
    const generationConfig = {
      maxOutputTokens: maxOutputTokens,
      temperature: temperature,
      topP: top_p,
      responseMimeType: response_model ? "application/json" : undefined,
      responseSchema: response_model
        ? toGeminiSchema(response_model.schema)
        : undefined,
    };

    logger({
      category: "google",
      message: "creating chat completion",
      level: 2,
      auxiliary: {
        modelName: { value: this.modelName, type: "string" },
        requestId: { value: requestId, type: "string" },
        requestPayloadSummary: {
          value: `Model: ${this.modelName}, Messages: ${formattedMessages.length}, Config Keys: ${Object.keys(generationConfig).join(", ")}, Tools: ${formattedTools ? formattedTools.length : 0}, Safety Categories: ${safetySettings.map((s) => s.category).join(", ")}`,
          type: "string",
        },
      },
    });

    // Construct the full request object
    const requestPayload = {
      model: this.modelName,
      contents: formattedMessages,
      config: {
        ...generationConfig,
        safetySettings: safetySettings,
        tools: formattedTools,
      },
    };

    // Log the full payload safely: a stringify failure must not abort the request.
    try {
      logger({
        category: "google",
        message: "Full request payload",
        level: 2,
        auxiliary: {
          requestId: { value: requestId, type: "string" },
          fullPayload: {
            value: JSON.stringify(requestPayload),
            type: "object",
          },
        },
      });
    } catch (e) {
      logger({
        category: "google",
        message: "Failed to stringify full request payload for logging",
        level: 0,
        auxiliary: {
          requestId: { value: requestId, type: "string" },
          error: { value: e.message, type: "string" },
        },
      });
    }

    try {
      const result = await this.client.models.generateContent(requestPayload); // Pass the constructed payload

      logger({
        category: "google",
        message: "received response",
        level: 2,
        auxiliary: {
          requestId: { value: requestId, type: "string" },
          response: {
            value: JSON.stringify(result),
            type: "object",
          },
        },
      });

      const finishReason = result.candidates?.[0]?.finishReason || "unknown";
      // Tool-call ids are synthesized from the request id and call position.
      const toolCalls = result.functionCalls?.map(
        (fc: FunctionCall, index: number) => ({
          id: `tool_call_${requestId}_${index}`,
          type: "function" as const,
          function: {
            name: fc.name,
            arguments: JSON.stringify(fc.args),
          },
        }),
      );

      // Reading `result.text` is guarded; a failure is logged and treated as
      // "no text content".
      let content: string | null = null;
      try {
        content = result.text;
      } catch (e) {
        logger({
          category: "google",
          message: `Could not extract text content: ${e.message}`,
          level: 1,
          auxiliary: { requestId: { value: requestId, type: "string" } },
        });
        content = null;
      }

      // Construct LLMResponse shape
      const llmResponse: LLMResponse = {
        id: result.candidates?.[0]?.index?.toString() || requestId,
        object: "chat.completion",
        created: Math.floor(Date.now() / 1000),
        model: this.modelName,
        choices: [
          {
            index: 0,
            message: {
              role: "assistant",
              content: content,
              tool_calls: toolCalls,
            },
            finish_reason: finishReason,
          },
        ],
        usage: {
          prompt_tokens: result.usageMetadata?.promptTokenCount || 0,
          completion_tokens: result.usageMetadata?.candidatesTokenCount || 0,
          total_tokens: result.usageMetadata?.totalTokenCount || 0,
        },
      };

      // Validate schema if response_model was provided
      if (response_model) {
        let parsedData;
        try {
          // Need to handle potential markdown fences if the model didn't follow instructions perfectly
          const potentialJson =
            content?.trim().replace(/^```json\n?|\n?```$/g, "") || "{}";
          parsedData = JSON.parse(potentialJson);
        } catch (e) {
          logger({
            category: "google",
            message: `Failed to parse JSON response: ${e.message}`,
            level: 0,
            auxiliary: {
              content: { value: content || "null", type: "string" },
            },
          });
          if (retries > 0) {
            return this.createChatCompletion({
              options,
              logger,
              retries: retries - 1,
            });
          }
          throw new CreateChatCompletionResponseError(
            `Failed to parse JSON response: ${e.message}`,
          );
        }

        try {
          validateZodSchema(response_model.schema, parsedData);
        } catch (err) {
          logger({
            category: "google",
            message: "Response failed Zod schema validation",
            level: 0,
          });
          if (retries > 0) {
            return this.createChatCompletion({
              options,
              logger,
              retries: retries - 1,
            });
          }
          throw err;
        }

        // If schema validation passes, structure the response for extraction use case
        const extractionResult = {
          data: parsedData,
          usage: llmResponse.usage,
        };

        return extractionResult as T;
      }

      return llmResponse as T;
    } catch (error) {
      logger({
        category: "google",
        message: `Error during Google AI chat completion: ${error.message}`,
        level: 0,
        auxiliary: {
          errorDetails: {
            value: `Message: ${error.message}${error.stack ? "\nStack: " + error.stack : ""}`,
            type: "string",
          },
          requestId: { value: requestId, type: "string" },
        },
      });

      // Basic retry logic
      if (retries > 0) {
        logger({
          category: "google",
          message: `Retrying... (${retries} attempts left)`,
          level: 1,
        });
        // Linear backoff (1s, 2s, 3s with the default of 3 retries). Clamped
        // so a caller-supplied `retries` above 4 never yields a negative delay.
        await new Promise((resolve) =>
          setTimeout(resolve, 1000 * Math.max(0, 4 - retries)),
        );
        return this.createChatCompletion({
          options,
          logger,
          retries: retries - 1,
        });
      }

      // Re-throw specific Stagehand errors or a generic one
      if (error instanceof StagehandError) {
        throw error;
      }
      throw new StagehandError(
        `Google AI API request failed: ${error.message}`,
      );
    }
  }
}


================================================
FILE: packages/core/lib/v3/llm/GroqClient.ts
================================================
import type { ClientOptions } from "openai";
import OpenAI from "openai";
import { LogLine } from "../types/public/logs.js";
import { AvailableModel } from "../types/public/model.js";
import {
  ChatMessage,
  CreateChatCompletionOptions,
  LLMClient,
  LLMResponse,
} from "./LLMClient.js";
import { CreateChatCompletionResponseError } from "../types/public/sdkErrors.js";
import { toJsonSchema } from "../zodCompat.js";

/**
 * LLM client for Groq, implemented on top of the OpenAI SDK pointed at Groq's
 * OpenAI-compatible endpoint. Images are not supported (`hasVision` is false).
 */
export class GroqClient extends LLMClient {
  public type = "groq" as const;
  private client: OpenAI;
  declare public clientOptions: ClientOptions;
  public hasVision = false;

  /**
   * @param modelName - Model identifier; a leading `groq-` prefix is stripped
   *   before the name is sent to the API.
   * @param clientOptions - Optional OpenAI client options. `baseURL` defaults
   *   to the Groq endpoint and `apiKey` falls back to `GROQ_API_KEY`.
   * @param userProvidedInstructions - Forwarded to the `LLMClient` base class.
   */
  constructor({
    modelName,
    clientOptions,
    userProvidedInstructions,
  }: {
    logger: (message: LogLine) => void;
    modelName: AvailableModel;
    clientOptions?: ClientOptions;
    userProvidedInstructions?: string;
  }) {
    super(modelName, userProvidedInstructions);

    // Create OpenAI client with the base URL set to Groq API.
    // `apiKey` is resolved AFTER the spread so that an explicit
    // `apiKey: undefined` in clientOptions cannot erase the env fallback;
    // a caller-supplied `baseURL` still overrides the default.
    this.client = new OpenAI({
      baseURL: "https://api.groq.com/openai/v1",
      ...clientOptions,
      apiKey: clientOptions?.apiKey || process.env.GROQ_API_KEY,
    });

    this.modelName = modelName;
    this.clientOptions = clientOptions;
  }

  /**
   * Sends a chat completion request to Groq.
   *
   * Without `response_model`, resolves to an `LLMResponse`-shaped object.
   * With `response_model`, the schema is offered to the model as a
   * `print_extracted_data` tool; the first tool call's arguments (or, failing
   * that, the first `{...}` span in the text content) are parsed as JSON and
   * returned as `{ data, usage }`.
   *
   * @param options - Messages, tools, sampling settings and optional schema.
   *   Any `image` is ignored.
   * @param retries - Number of attempts already made; the call re-issues
   *   itself while this is below 5 and no JSON could be extracted.
   * @param logger - Sink for log lines emitted during this call.
   * @throws CreateChatCompletionResponseError when no valid JSON is obtained
   *   and the retry budget is spent. Errors from the API call are logged and
   *   rethrown.
   */
  async createChatCompletion<T = LLMResponse>({
    options,
    retries,
    logger,
  }: CreateChatCompletionOptions): Promise<T> {
    // The image buffer is dropped from the logged options.
    const optionsWithoutImage = { ...options };
    delete optionsWithoutImage.image;

    logger({
      category: "groq",
      message: "creating chat completion",
      level: 2,
      auxiliary: {
        options: {
          value: JSON.stringify(optionsWithoutImage),
          type: "object",
        },
      },
    });

    // Strip the "groq-" prefix when present; fall back to the raw name rather
    // than sending `undefined` as the model for un-prefixed names.
    const groqPrefix = "groq-";
    const apiModelName = this.modelName.startsWith(groqPrefix)
      ? this.modelName.slice(groqPrefix.length)
      : this.modelName;

    // Format messages for Groq API (using OpenAI format).
    // Array content is reduced to the text of its first part, if any.
    const formattedMessages = options.messages.map((msg: ChatMessage) => {
      const baseMessage = {
        content:
          typeof msg.content === "string"
            ? msg.content
            : Array.isArray(msg.content) &&
                msg.content.length > 0 &&
                "text" in msg.content[0]
              ? msg.content[0].text
              : "",
      };

      // Groq supports system, user, and assistant roles
      if (msg.role === "system") {
        return { ...baseMessage, role: "system" as const };
      } else if (msg.role === "assistant") {
        return { ...baseMessage, role: "assistant" as const };
      } else {
        // Default to user for any other role
        return { ...baseMessage, role: "user" as const };
      }
    });

    // Format tools if provided
    let tools = options.tools?.map((tool) => ({
      type: "function" as const,
      function: {
        name: tool.name,
        description: tool.description,
        parameters: {
          type: "object",
          properties: tool.parameters.properties,
          required: tool.parameters.required,
        },
      },
    }));

    // JSON Schema form of the response model; reused for both the tool
    // definition and the plain-text JSON instruction below.
    const responseJsonSchema = options.response_model
      ? (toJsonSchema(options.response_model.schema) as {
          properties?: Record<string, unknown>;
          required?: string[];
        })
      : undefined;

    // Add response model as a tool if provided
    if (responseJsonSchema) {
      const responseTool = {
        type: "function" as const,
        function: {
          name: "print_extracted_data",
          description:
            "Prints the extracted data based on the provided schema.",
          parameters: {
            type: "object",
            properties: responseJsonSchema.properties || {},
            required: responseJsonSchema.required || [],
          },
        },
      };

      tools = tools ? [...tools, responseTool] : [responseTool];
    }

    try {
      // Use OpenAI client with Groq API
      const apiResponse = await this.client.chat.completions.create({
        model: apiModelName,
        messages: [
          ...formattedMessages,
          // Add explicit instruction to return JSON if we have a response model.
          // The JSON Schema is embedded (not the raw Zod object, whose
          // serialization exposes library internals rather than the shape).
          ...(responseJsonSchema
            ? [
                {
                  role: "system" as const,
                  content: `IMPORTANT: Your response must be valid JSON that matches this schema: ${JSON.stringify(
                    responseJsonSchema,
                  )}`,
                },
              ]
            : []),
        ],
        // `??` keeps an explicit temperature of 0 instead of replacing it.
        temperature: options.temperature ?? 0.7,
        max_tokens: options.maxOutputTokens,
        tools: tools,
        tool_choice: options.tool_choice || "auto",
      });

      // Format the response to match the expected LLMResponse format
      const response: LLMResponse = {
        id: apiResponse.id,
        object: "chat.completion",
        created: Date.now(),
        model: apiModelName,
        choices: [
          {
            index: 0,
            message: {
              role: "assistant",
              content: apiResponse.choices[0]?.message?.content || null,
              tool_calls: apiResponse.choices[0]?.message?.tool_calls || [],
            },
            finish_reason: apiResponse.choices[0]?.finish_reason || "stop",
          },
        ],
        usage: {
          prompt_tokens: apiResponse.usage?.prompt_tokens || 0,
          completion_tokens: apiResponse.usage?.completion_tokens || 0,
          total_tokens: apiResponse.usage?.total_tokens || 0,
        },
      };

      logger({
        category: "groq",
        message: "response",
        level: 2,
        auxiliary: {
          response: {
            value: JSON.stringify(response),
            type: "object",
          },
          requestId: {
            value: options.requestId,
            type: "string",
          },
        },
      });

      // If there's no response model, return the entire response object
      if (!options.response_model) {
        return response as T;
      }

      // Otherwise, try parsing the JSON from the tool call or content
      const toolCall = response.choices[0]?.message?.tool_calls?.[0];
      if (toolCall?.function?.arguments) {
        try {
          const result = JSON.parse(toolCall.function.arguments);
          const finalResponse = {
            data: result,
            usage: response.usage,
          };
          return finalResponse as T;
        } catch (e) {
          logger({
            category: "groq",
            message: "failed to parse tool call arguments as JSON, retrying",
            level: 0,
            auxiliary: {
              error: {
                value: e.message,
                type: "string",
              },
            },
          });
        }
      }

      // If we have content but no tool calls, try to parse the content as JSON
      const content = response.choices[0]?.message?.content;
      if (content) {
        try {
          // Try to extract JSON from the content
          const jsonMatch = content.match(/\{[\s\S]*\}/);
          if (jsonMatch) {
            const result = JSON.parse(jsonMatch[0]);
            const finalResponse = {
              data: result,
              usage: response.usage,
            };
            return finalResponse as T;
          }
        } catch (e) {
          logger({
            category: "groq",
            message: "failed to parse content as JSON",
            level: 0,
            auxiliary: {
              error: {
                value: e.message,
                type: "string",
              },
            },
          });
        }
      }

      // If we still haven't found valid JSON and have retries left, try again
      if (!retries || retries < 5) {
        return this.createChatCompletion({
          options,
          logger,
          retries: (retries ?? 0) + 1,
        });
      }

      throw new CreateChatCompletionResponseError("Invalid response schema");
    } catch (error) {
      logger({
        category: "groq",
        message: "error creating chat completion",
        level: 0,
        auxiliary: {
          error: {
            value: error.message,
            type: "string",
          },
          requestId: {
            value: options.requestId,
            type: "string",
          },
        },
      });
      throw error;
    }
  }
}


================================================
FILE: packages/core/lib/v3/llm/LLMClient.ts
================================================
import { LLMTool } from "../types/public/model.js";
import {
  embed,
  embedMany,
  experimental_generateImage,
  experimental_generateSpeech,
  experimental_transcribe,
  generateObject,
  generateText,
  streamObject,
  streamText,
} from "ai";
import type { LanguageModelV2 } from "@ai-sdk/provider";
import { LogLine } from "../types/public/logs.js";
import { AvailableModel, ClientOptions } from "../types/public/model.js";
import type { StagehandZodSchema } from "../zodCompat.js";

/** A single conversation turn handed to an LLM client. */
export interface ChatMessage {
  /** Author of the turn. */
  role: "system" | "user" | "assistant";
  /** Plain text, or an ordered list of text/image parts. */
  content: ChatMessageContent;
}

/** Message payload: either a plain string or an array of image/text parts. */
export type ChatMessageContent =
  | string
  | (ChatMessageImageContent | ChatMessageTextContent)[];

/**
 * An image part of a multi-part message. Only `type` is required; the
 * remaining fields are alternative carriers for the image data.
 */
export interface ChatMessageImageContent {
  /** Part discriminator (clients in this package check for e.g. "image_url"). */
  type: string;
  /** Image referenced by URL. */
  image_url?: { url: string };
  /** Optional text attached to the part. */
  text?: string;
  /** Inline image data. NOTE(review): presumably a provider-specific inline-source shape; confirm against the consuming client. */
  source?: {
    type: string;
    media_type: string;
    data: string;
  };
}

/** A text part of a multi-part message. */
export interface ChatMessageTextContent {
  /** Part discriminator (clients in this package check for "text"). */
  type: string;
  /** The text itself. */
  text: string;
}

/** Default caption sent alongside a screenshot when the caller supplies no description. */
export const AnnotatedScreenshotText =
  "This is a screenshot of the current page state with the elements annotated on it. Each element id is annotated with a number to the top left of it. Duplicate annotations at the same location are under each other vertically.";

/** Provider-agnostic request options accepted by `LLMClient.createChatCompletion`. */
export interface ChatCompletionOptions {
  /** Conversation to send, in order. */
  messages: ChatMessage[];
  /** Sampling temperature. */
  temperature?: number;
  /** Nucleus-sampling cutoff. */
  top_p?: number;
  frequency_penalty?: number;
  presence_penalty?: number;
  /** Optional screenshot to attach to the request. */
  image?: {
    /** Raw image bytes. */
    buffer: Buffer;
    /** Caption for the image. */
    description?: string;
  };
  /** When set, the client is expected to return data matching `schema`. */
  response_model?: {
    name: string;
    schema: StagehandZodSchema;
  };
  /** Tools the model may call. */
  tools?: LLMTool[];
  tool_choice?: "auto" | "none" | "required";
  /** Upper bound on generated tokens. */
  maxOutputTokens?: number;
  /** Correlation id included in log lines. */
  requestId?: string;
}

/**
 * Normalized chat-completion response that every client maps its provider's
 * reply onto when no `response_model` is requested.
 */
export type LLMResponse = {
  id: string;
  object: string;
  /** Creation timestamp as a number; the unit is whatever the producing client writes. */
  created: number;
  model: string;
  choices: {
    index: number;
    message: {
      role: string;
      /** Text content, or null when the model produced none. */
      content: string | null;
      /** Tool invocations requested by the model. */
      tool_calls: {
        id: string;
        type: string;
        function: {
          name: string;
          /** Call arguments serialized as a JSON string. */
          arguments: string;
        };
      }[];
    };
    finish_reason: string;
  }[];
  /** Token accounting for the request. */
  usage: {
    prompt_tokens: number;
    completion_tokens: number;
    total_tokens: number;
  };
};

/** Argument object for `LLMClient.createChatCompletion`. */
export interface CreateChatCompletionOptions {
  /** The request itself. */
  options: ChatCompletionOptions;
  /** Sink for log lines emitted while serving the request. */
  logger: (message: LogLine) => void;
  /** Retry counter; its interpretation (remaining vs. used) is defined by each client. */
  retries?: number;
}

/** Simple usage shape if your LLM returns usage tokens. */
export interface LLMUsage {
  /** Tokens consumed by the prompt. */
  prompt_tokens: number;
  /** Tokens produced in the completion. */
  completion_tokens: number;
  /** Total tokens reported for the request. */
  total_tokens: number;
  /** Reasoning tokens, when the provider reports them. */
  reasoning_tokens?: number;
  /** Cached input tokens, when the provider reports them. */
  cached_input_tokens?: number;
}

/**
 * For calls that use a schema: the LLMClient may return { data: T; usage?: LLMUsage }
 */
export interface LLMParsedResponse<T> {
  /** The parsed payload. */
  data: T;
  /** Token accounting, when available. */
  usage?: LLMUsage;
}

/**
 * Abstract base for provider-specific LLM clients. Subclasses implement
 * `createChatCompletion`; the AI SDK helper functions are re-exposed as
 * instance properties for convenience.
 */
export abstract class LLMClient {
  /** Provider tag; known values are listed, but any string is accepted. */
  public type: "openai" | "anthropic" | "cerebras" | "groq" | (string & {});
  /** Model identifier this client was created for. */
  public modelName: AvailableModel | (string & {});
  /** Whether the client/model accepts image input. */
  public hasVision: boolean;
  /** Options the underlying provider client was configured with. */
  public clientOptions: ClientOptions;
  /** Optional instructions supplied by the user at construction time. */
  public userProvidedInstructions?: string;

  /**
   * @param modelName - Model identifier stored on the instance.
   * @param userProvidedInstructions - Optional instructions stored on the instance.
   */
  constructor(modelName: AvailableModel, userProvidedInstructions?: string) {
    this.modelName = modelName;
    this.userProvidedInstructions = userProvidedInstructions;
  }

  // Overload 1: When response_model is provided, returns LLMParsedResponse<T>
  abstract createChatCompletion<T>(
    options: CreateChatCompletionOptions & {
      options: {
        response_model: { name: string; schema: StagehandZodSchema };
      };
    },
  ): Promise<LLMParsedResponse<T>>;

  // Overload 2: When response_model is not provided, returns T (defaults to LLMResponse)
  abstract createChatCompletion<T = LLMResponse>(
    options: CreateChatCompletionOptions,
  ): Promise<T>;

  // Direct references to the functions imported from the "ai" package.
  public generateObject = generateObject;
  public generateText = generateText;
  public streamText = streamText;
  public streamObject = streamObject;
  public generateImage = experimental_generateImage;
  public embed = embed;
  public embedMany = embedMany;
  public transcribe = experimental_transcribe;
  public generateSpeech = experimental_generateSpeech;

  /** Optional hook for clients that can expose their underlying AI SDK model. */
  getLanguageModel?(): LanguageModelV2;
}


================================================
FILE: packages/core/lib/v3/llm/LLMProvider.ts
================================================
import {
  ExperimentalNotConfiguredError,
  UnsupportedAISDKModelProviderError,
  UnsupportedModelError,
  UnsupportedModelProviderError,
} from "../types/public/sdkErrors.js";
import { LogLine } from "../types/public/logs.js";
import {
  AvailableModel,
  ClientOptions,
  ModelProvider,
} from "../types/public/model.js";
import { AISdkClient } from "./aisdk.js";
import { AnthropicClient } from "./AnthropicClient.js";
import { CerebrasClient } from "./CerebrasClient.js";
import { GoogleClient } from "./GoogleClient.js";
import { GroqClient } from "./GroqClient.js";
import { LLMClient } from "./LLMClient.js";
import { OpenAIClient } from "./OpenAIClient.js";
import { openai, createOpenAI } from "@ai-sdk/openai";
import { bedrock, createAmazonBedrock } from "@ai-sdk/amazon-bedrock";
import { vertex, createVertex } from "@ai-sdk/google-vertex";
import { anthropic, createAnthropic } from "@ai-sdk/anthropic";
import { google, createGoogleGenerativeAI } from "@ai-sdk/google";
import { xai, createXai } from "@ai-sdk/xai";
import { azure, createAzure } from "@ai-sdk/azure";
import { groq, createGroq } from "@ai-sdk/groq";
import { cerebras, createCerebras } from "@ai-sdk/cerebras";
import { togetherai, createTogetherAI } from "@ai-sdk/togetherai";
import { mistral, createMistral } from "@ai-sdk/mistral";
import { deepseek, createDeepSeek } from "@ai-sdk/deepseek";
import { perplexity, createPerplexity } from "@ai-sdk/perplexity";
import { ollama, createOllama } from "ollama-ai-provider-v2";
import { gateway, createGateway } from "ai";
import { AISDKProvider, AISDKCustomProvider } from "../types/public/model.js";

// Default AI SDK provider instances, keyed by the provider prefix used in
// "provider/model" names. Used when no client options are supplied.
// Key order is surfaced in UnsupportedAISDKModelProviderError via Object.keys.
const AISDKProviders: Record<string, AISDKProvider> = {
  openai,
  bedrock,
  anthropic,
  google,
  xai,
  azure,
  groq,
  cerebras,
  togetherai,
  mistral,
  deepseek,
  perplexity,
  ollama,
  vertex,
  gateway,
};
// AI SDK provider factories, keyed by the same provider prefixes. Used when
// client options are supplied so the provider can be built from them.
// Key order is surfaced in UnsupportedAISDKModelProviderError via Object.keys.
const AISDKProvidersWithAPIKey: Record<string, AISDKCustomProvider> = {
  openai: createOpenAI,
  bedrock: createAmazonBedrock,
  anthropic: createAnthropic,
  google: createGoogleGenerativeAI,
  vertex: createVertex,
  xai: createXai,
  azure: createAzure,
  groq: createGroq,
  cerebras: createCerebras,
  togetherai: createTogetherAI,
  mistral: createMistral,
  deepseek: createDeepSeek,
  perplexity: createPerplexity,
  ollama: createOllama,
  gateway: createGateway,
};

// Lookup from model names to the provider whose dedicated client serves them.
// LLMProvider.getClient consults it for names without a "/", and
// getModelProvider falls back to it when no AI SDK prefix matches.
const modelToProviderMap: { [key in AvailableModel]: ModelProvider } = {
  "gpt-4.1": "openai",
  "gpt-4.1-mini": "openai",
  "gpt-4.1-nano": "openai",
  "o4-mini": "openai",
  //prettier-ignore
  "o3": "openai",
  "o3-mini": "openai",
  //prettier-ignore
  "o1": "openai",
  "o1-mini": "openai",
  "gpt-4o": "openai",
  "gpt-4o-mini": "openai",
  "gpt-4o-2024-08-06": "openai",
  "gpt-4.5-preview": "openai",
  "o1-preview": "openai",
  "cerebras-llama-3.3-70b": "cerebras",
  "cerebras-llama-3.1-8b": "cerebras",
  "groq-llama-3.3-70b-versatile": "groq",
  "groq-llama-3.3-70b-specdec": "groq",
  "moonshotai/kimi-k2-instruct": "groq",
  "gemini-1.5-flash": "google",
  "gemini-1.5-pro": "google",
  "gemini-1.5-flash-8b": "google",
  "gemini-2.0-flash-lite": "google",
  "gemini-2.0-flash": "google",
  "gemini-2.5-flash-preview-04-17": "google",
  "gemini-2.5-pro-preview-03-25": "google",
};

/**
 * Resolves an AI SDK language model for a "provider/model" pair.
 *
 * When `clientOptions` carries at least one non-nullish value, the provider is
 * built from the matching factory with those options; otherwise the default
 * provider instance is used.
 *
 * @param subProvider - Provider prefix (the part before the first "/").
 * @param subModelName - Model name within that provider.
 * @param clientOptions - Optional settings forwarded to the provider factory.
 * @returns The language model produced by the selected provider.
 * @throws UnsupportedAISDKModelProviderError when `subProvider` is not known
 *   to the lookup table being used.
 */
export function getAISDKLanguageModel(
  subProvider: string,
  subModelName: string,
  clientOptions?: ClientOptions,
) {
  const optionsAreMeaningful =
    clientOptions &&
    Object.values(clientOptions).some((value) => value != null);

  // No usable options: fall back to the pre-built default provider.
  if (!optionsAreMeaningful) {
    const defaultProvider = AISDKProviders[subProvider];
    if (!defaultProvider) {
      throw new UnsupportedAISDKModelProviderError(
        subProvider,
        Object.keys(AISDKProviders),
      );
    }
    return defaultProvider(subModelName);
  }

  // Options present: build a configured provider, then pick the model from it.
  const buildProvider = AISDKProvidersWithAPIKey[subProvider];
  if (!buildProvider) {
    throw new UnsupportedAISDKModelProviderError(
      subProvider,
      Object.keys(AISDKProvidersWithAPIKey),
    );
  }
  const configuredProvider = buildProvider(clientOptions);
  return configuredProvider(subModelName);
}

/**
 * Factory that turns a model name into the `LLMClient` able to serve it.
 */
export class LLMProvider {
  private logger: (message: LogLine) => void;

  /** @param logger - Sink for log lines; also handed to every client created. */
  constructor(logger: (message: LogLine) => void) {
    this.logger = logger;
  }

  /**
   * Creates a client for `modelName`.
   *
   * Names containing "/" are treated as "provider/model" and served through
   * the AI SDK. Names without "/" are looked up in `modelToProviderMap`, a
   * deprecation warning is logged, and the provider's dedicated client is
   * returned.
   *
   * @param modelName - Model identifier.
   * @param clientOptions - Optional settings forwarded to the client/provider.
   * @param options - `experimental` or `disableAPI` must be set to use the
   *   "vertex" provider.
   * @throws ExperimentalNotConfiguredError for "vertex" without either flag.
   * @throws UnsupportedModelError when a slash-less name is not in the map.
   * @throws UnsupportedModelProviderError when the mapped provider has no client.
   */
  getClient(
    modelName: AvailableModel,
    clientOptions?: ClientOptions,
    options?: { experimental?: boolean; disableAPI?: boolean },
  ): LLMClient {
    const slashAt = modelName.indexOf("/");
    if (slashAt !== -1) {
      const subProvider = modelName.substring(0, slashAt);
      const subModelName = modelName.substring(slashAt + 1);

      const vertexAllowed = options?.disableAPI || options?.experimental;
      if (subProvider === "vertex" && !vertexAllowed) {
        throw new ExperimentalNotConfiguredError("Vertex provider");
      }

      return new AISdkClient({
        model: getAISDKLanguageModel(subProvider, subModelName, clientOptions),
        logger: this.logger,
      });
    }

    // Model name doesn't include "/" - this format is deprecated
    const provider = modelToProviderMap[modelName];
    if (!provider) {
      throw new UnsupportedModelError(Object.keys(modelToProviderMap));
    }

    this.logger({
      category: "llm",
      message: `Deprecation warning: Model format "${modelName}" is deprecated. Please use the provider/model format (e.g., "openai/gpt-5" or "anthropic/claude-sonnet-4").`,
      level: 0,
    });

    // Every dedicated client takes the same three constructor fields.
    const clientArgs = {
      logger: this.logger,
      modelName: modelName as AvailableModel,
      clientOptions,
    };

    switch (provider) {
      case "openai":
        return new OpenAIClient(clientArgs);
      case "anthropic":
        return new AnthropicClient(clientArgs);
      case "cerebras":
        return new CerebrasClient(clientArgs);
      case "groq":
        return new GroqClient(clientArgs);
      case "google":
        return new GoogleClient(clientArgs);
      default: {
        // Reached only if modelToProviderMap names a provider that has no
        // case above, i.e. an internal consistency issue.
        const knownProviders = new Set(Object.values(modelToProviderMap));
        throw new UnsupportedModelProviderError([...knownProviders]);
      }
    }
  }

  /**
   * Reports which provider serves `modelName`: "aisdk" when the name has a
   * recognised AI SDK prefix before its first "/", otherwise the entry from
   * `modelToProviderMap` (which may be undefined for unknown names).
   */
  static getModelProvider(modelName: AvailableModel): ModelProvider {
    const slashAt = modelName.indexOf("/");
    const hasAISDKPrefix =
      slashAt !== -1 && AISDKProviders[modelName.substring(0, slashAt)];
    if (hasAISDKPrefix) {
      return "aisdk";
    }
    return modelToProviderMap[modelName];
  }
}


================================================
FILE: packages/core/lib/v3/llm/OpenAIClient.ts
================================================
import OpenAI, { ClientOptions } from "openai";
import {
  ChatCompletionAssistantMessageParam,
  ChatCompletionContentPartImage,
  ChatCompletionContentPartText,
  ChatCompletionCreateParamsNonStreaming,
  ChatCompletionMessageParam,
  ChatCompletionSystemMessageParam,
  ChatCompletionUserMessageParam,
} from "openai/resources/chat";
import { LogLine } from "../types/public/logs.js";
import { AvailableModel } from "../types/public/model.js";
import { validateZodSchema } from "../../utils.js";
import {
  ChatCompletionOptions,
  ChatMessage,
  CreateChatCompletionOptions,
  LLMClient,
  LLMResponse,
} from "./LLMClient.js";
import {
  CreateChatCompletionResponseError,
  StagehandError,
  ZodSchemaValidationError,
} from "../types/public/sdkErrors.js";
import { toJsonSchema } from "../zodCompat.js";

/**
 * LLM client backed by the official OpenAI SDK (chat completions endpoint).
 *
 * Translates Stagehand's provider-agnostic chat options into an OpenAI
 * request, including the special handling needed for `o1*` / `o3*` models,
 * which reject most sampling options and are driven through plain user
 * messages instead of native tools / structured output.
 */
export class OpenAIClient extends LLMClient {
  public type = "openai" as const;
  private client: OpenAI;
  declare public clientOptions: ClientOptions;

  /**
   * @param modelName - Model identifier sent as `model` on every request.
   * @param clientOptions - Options forwarded verbatim to the OpenAI SDK client.
   */
  constructor({
    modelName,
    clientOptions,
  }: {
    logger: (message: LogLine) => void;
    modelName: AvailableModel;
    clientOptions?: ClientOptions;
  }) {
    super(modelName);
    this.clientOptions = clientOptions;
    this.client = new OpenAI(clientOptions);
    this.modelName = modelName;
  }

  /**
   * Sends one chat completion request and returns either the raw completion
   * or, when `options.response_model` is set, `{ data, usage }` with `data`
   * validated against the supplied schema.
   *
   * Retries (up to `retries` more times) when the emulated tool call or the
   * structured response cannot be parsed/validated. Every retry restarts from
   * the caller's untouched options so that prompt messages are not appended
   * twice and `tools` are not lost on the o1/o3 path.
   *
   * @param options - Provider-agnostic chat options (messages, tools, schema, image, ...).
   * @param logger - Sink for structured log lines.
   * @param retries - Remaining retry budget; defaults to 3.
   * @returns The completion (cast to `T`), or `{ data, usage }` for schema requests.
   * @throws StagehandError when tools and `response_model` are combined on an o1/o3 model.
   * @throws CreateChatCompletionResponseError when schema validation still fails after all retries.
   */
  async createChatCompletion<T = LLMResponse>({
    options: optionsInitial,
    logger,
    retries = 3,
  }: CreateChatCompletionOptions): Promise<T> {
    // Work on a copy: this method appends messages, and neither the caller's
    // array nor the options reused for a retry may observe those appends.
    let options: Partial<ChatCompletionOptions> = {
      ...optionsInitial,
      messages: [...optionsInitial.messages],
    };

    const isReasoningModel =
      this.modelName.startsWith("o1") || this.modelName.startsWith("o3");

    // Re-issue the request from the pristine input with one less retry.
    const retry = (): Promise<T> =>
      this.createChatCompletion<T>({
        options: optionsInitial,
        logger,
        retries: retries - 1,
      });

    // O1 models do not support most of the options. So we override them.
    // For schema and tools, we add them as user messages.
    let isToolsOverridedForO1 = false;
    if (isReasoningModel) {
      /* eslint-disable */
      // Remove unsupported options (temperature included, so no later
      // temperature check is needed for these models).
      const {
        tool_choice,
        top_p,
        frequency_penalty,
        presence_penalty,
        temperature,
        ...supportedOptions
      } = options;
      /* eslint-enable */
      options = supportedOptions;

      // These models are driven with user-role messages only.
      options.messages = options.messages.map((message) => ({
        ...message,
        role: "user",
      }));
      if (options.tools && options.response_model) {
        throw new StagehandError(
          "Cannot use both tool and response_model for o1 models",
        );
      }

      if (options.tools) {
        // Native tools are unsupported: describe them in a prompt instead and
        // parse the JSON answer back into a tool call after the request.
        const { tools, ...rest } = options;
        options = rest;
        isToolsOverridedForO1 = true;
        options.messages.push({
          role: "user",
          content: `You have the following tools available to you:\n${JSON.stringify(
            tools,
          )}

          Respond with the following zod schema format to use a method: {
            "name": "<tool_name>",
            "arguments": <tool_args>
          }
          
          Do not include any other text or formattings like \`\`\` in your response. Just the JSON object.`,
        });
      }
    }

    // `image` is delivered as a chat message below; it must not be logged
    // (raw buffer) nor forwarded as an unknown request parameter.
    const {
      requestId,
      image,
      ...optionsWithoutImageAndRequestId
    } = options;

    logger({
      category: "openai",
      message: "creating chat completion",
      level: 2,
      auxiliary: {
        options: {
          value: JSON.stringify({
            ...optionsWithoutImageAndRequestId,
            requestId,
          }),
          type: "object",
        },
        modelName: {
          value: this.modelName,
          type: "string",
        },
      },
    });

    if (image) {
      const screenshotMessage: ChatMessage = {
        role: "user",
        content: [
          {
            type: "image_url",
            image_url: {
              url: `data:image/jpeg;base64,${image.buffer.toString("base64")}`,
            },
          },
          ...(image.description
            ? [{ type: "text", text: image.description }]
            : []),
        ],
      };

      options.messages.push(screenshotMessage);
    }

    let responseFormat:
      | ChatCompletionCreateParamsNonStreaming["response_format"]
      | undefined;
    if (options.response_model) {
      // For O1 models, we need to add the schema as a user message.
      if (isReasoningModel) {
        try {
          const parsedSchema = JSON.stringify(
            toJsonSchema(options.response_model.schema),
          );
          options.messages.push({
            role: "user",
            content: `Respond in this zod schema format:\n${parsedSchema}\n

          Do not include any other text, formatting or markdown in your output. Do not include \`\`\` or \`\`\`json in your response. Only the JSON object itself.`,
          });
        } catch (error) {
          logger({
            category: "openai",
            message: "Failed to parse response model schema",
            level: 0,
          });

          if (retries > 0) {
            return retry();
          }

          throw error;
        }
      } else {
        responseFormat = {
          type: "json_schema",
          json_schema: {
            name: options.response_model.name,
            schema: toJsonSchema(options.response_model.schema),
          },
        };
      }
    }

    /* eslint-disable */
    // Remove unsupported options
    const { response_model, ...openAiOptions } = {
      ...optionsWithoutImageAndRequestId,
      model: this.modelName,
    };
    /* eslint-enable */

    logger({
      category: "openai",
      message: "creating chat completion",
      level: 2,
      auxiliary: {
        openAiOptions: {
          value: JSON.stringify(openAiOptions),
          type: "object",
        },
      },
    });

    const formattedMessages: ChatCompletionMessageParam[] =
      options.messages.map((message) => {
        if (Array.isArray(message.content)) {
          const contentParts = message.content.map((content) => {
            if ("image_url" in content) {
              const imageContent: ChatCompletionContentPartImage = {
                image_url: {
                  url: content.image_url.url,
                },
                type: "image_url",
              };
              return imageContent;
            } else {
              const textContent: ChatCompletionContentPartText = {
                text: content.text,
                type: "text",
              };
              return textContent;
            }
          });

          if (message.role === "system") {
            // System messages may only carry text parts.
            const formattedMessage: ChatCompletionSystemMessageParam = {
              ...message,
              role: "system",
              content: contentParts.filter(
                (content): content is ChatCompletionContentPartText =>
                  content.type === "text",
              ),
            };
            return formattedMessage;
          } else if (message.role === "user") {
            const formattedMessage: ChatCompletionUserMessageParam = {
              ...message,
              role: "user",
              content: contentParts,
            };
            return formattedMessage;
          } else {
            // Assistant messages may only carry text parts.
            const formattedMessage: ChatCompletionAssistantMessageParam = {
              ...message,
              role: "assistant",
              content: contentParts.filter(
                (content): content is ChatCompletionContentPartText =>
                  content.type === "text",
              ),
            };
            return formattedMessage;
          }
        }

        // NOTE(review): string-content messages are always sent with the
        // "user" role, regardless of their original role. Kept as-is because
        // prompts may have been tuned against it; confirm whether intended.
        const formattedMessage: ChatCompletionUserMessageParam = {
          role: "user",
          content: message.content,
        };

        return formattedMessage;
      });

    const body: ChatCompletionCreateParamsNonStreaming = {
      ...openAiOptions,
      model: this.modelName,
      messages: formattedMessages,
      response_format: responseFormat,
      stream: false,
      // Overrides the provider-agnostic `tools` spread in via openAiOptions.
      tools: options.tools?.map((tool) => ({
        function: {
          name: tool.name,
          description: tool.description,
          parameters: tool.parameters,
        },
        type: "function",
      })),
    };

    const response = await this.client.chat.completions.create(body);

    // For O1 models, we need to parse the tool call response manually and add it to the response.
    if (isToolsOverridedForO1) {
      try {
        const parsedContent = JSON.parse(response.choices[0].message.content);

        response.choices[0].message.tool_calls = [
          {
            function: {
              name: parsedContent["name"],
              arguments: JSON.stringify(parsedContent["arguments"]),
            },
            type: "function",
            id: "-1",
          },
        ];
        response.choices[0].message.content = null;
      } catch (error) {
        logger({
          category: "openai",
          message: "Failed to parse tool call response",
          level: 0,
          auxiliary: {
            error: {
              value: error instanceof Error ? error.message : String(error),
              type: "string",
            },
            content: {
              value: response.choices[0].message.content,
              type: "string",
            },
          },
        });

        if (retries > 0) {
          return retry();
        }

        throw error;
      }
    }

    logger({
      category: "openai",
      message: "response",
      level: 2,
      auxiliary: {
        response: {
          value: JSON.stringify(response),
          type: "object",
        },
        requestId: {
          value: requestId,
          type: "string",
        },
      },
    });

    if (options.response_model) {
      const extractedData = response.choices[0].message.content;
      let parsedData: unknown;

      try {
        // Parsing happens inside the guarded region so that malformed JSON
        // consumes a retry instead of failing the call immediately.
        parsedData = JSON.parse(extractedData);
        validateZodSchema(options.response_model.schema, parsedData);
      } catch (e) {
        logger({
          category: "openai",
          message:
            e instanceof SyntaxError
              ? "Response was not valid JSON"
              : "Response failed Zod schema validation",
          level: 0,
        });
        if (retries > 0) {
          return retry();
        }

        if (e instanceof ZodSchemaValidationError) {
          logger({
            category: "openai",
            message: `Error during OpenAI chat completion: ${e.message}`,
            level: 0,
            auxiliary: {
              errorDetails: {
                value: `Message: ${e.message}${e.stack ? "\nStack: " + e.stack : ""}`,
                type: "string",
              },
              requestId: { value: requestId, type: "string" },
            },
          });
          throw new CreateChatCompletionResponseError(e.message);
        }
        throw e;
      }

      return {
        data: parsedData,
        usage: response.usage,
      } as T;
    }

    // if the function was called with a response model, it would have returned earlier
    // so we can safely cast here to T, which defaults to ChatCompletion
    return response as T;
  }
}


================================================
FILE: packages/core/lib/v3/llm/aisdk.ts
================================================
import {
  CoreAssistantMessage,
  ModelMessage,
  CoreSystemMessage,
  CoreUserMessage,
  generateObject,
  generateText,
  ImagePart,
  NoObjectGeneratedError,
  TextPart,
  ToolSet,
  Tool,
} from "ai";
import type { LanguageModelV2 } from "@ai-sdk/provider";
import { ChatCompletion } from "openai/resources";
import { v7 as uuidv7 } from "uuid";
import { LogLine } from "../types/public/logs.js";
import { AvailableModel } from "../types/public/model.js";
import { CreateChatCompletionOptions, LLMClient } from "./LLMClient.js";
import {
  FlowLogger,
  extractLlmPromptSummary,
} from "../flowlogger/FlowLogger.js";
import { toJsonSchema } from "../zodCompat.js";

/**
 * LLM client that delegates to a Vercel AI SDK language model.
 *
 * Requests carrying a `response_model` go through `generateObject`; all other
 * requests go through `generateText` and are reshaped into an OpenAI-style
 * chat completion object.
 */
export class AISdkClient extends LLMClient {
  public type = "aisdk" as const;
  private model: LanguageModelV2;
  private logger?: (message: LogLine) => void;

  // Models that lack native structured-output support need a prompt-based
  // JSON fallback instead of response_format: { type: "json_schema" }.
  private static readonly PROMPT_JSON_FALLBACK_PATTERNS = [
    "deepseek",
    "kimi",
    "glm",
  ];

  /**
   * @param model - AI SDK language model that serves every request.
   * @param logger - Optional sink for structured log lines.
   */
  constructor({
    model,
    logger,
  }: {
    model: LanguageModelV2;
    logger?: (message: LogLine) => void;
  }) {
    super(model.modelId as AvailableModel);
    this.model = model;
    this.logger = logger;
  }

  /** Returns the underlying AI SDK language model. */
  public getLanguageModel(): LanguageModelV2 {
    return this.model;
  }

  /** Maps AI SDK token usage onto the snake_case usage shape, defaulting missing counts to 0. */
  private static toUsage(
    usage: Awaited<ReturnType<typeof generateText>>["usage"],
  ) {
    return {
      prompt_tokens: usage.inputTokens ?? 0,
      completion_tokens: usage.outputTokens ?? 0,
      reasoning_tokens: usage.reasoningTokens ?? 0,
      cached_input_tokens: usage.cachedInputTokens ?? 0,
      total_tokens: usage.totalTokens ?? 0,
    };
  }

  /** Builds the `<timestamp>_<random base36>` suffix used for synthetic ids. */
  private static syntheticIdSuffix(): string {
    // slice(2, 11) yields the same (up to) 9 characters as the deprecated substr(2, 9).
    return `${Date.now()}_${Math.random().toString(36).slice(2, 11)}`;
  }

  /**
   * Runs one completion against the wrapped model.
   *
   * @param options - Chat options; `response_model` selects structured output,
   *   otherwise `tools` / `tool_choice` are forwarded to text generation.
   * @returns `{ data, usage }` for structured requests, otherwise an
   *   OpenAI-style chat completion object (both cast to `T`).
   * @throws Whatever `generateObject` / `generateText` throws; the error is
   *   logged and rethrown unchanged.
   */
  async createChatCompletion<T = ChatCompletion>({
    options,
  }: CreateChatCompletionOptions): Promise<T> {
    this.logger?.({
      category: "aisdk",
      message: "creating chat completion",
      level: 2,
      auxiliary: {
        options: {
          // Images are redacted so that base64 payloads do not end up in logs.
          value: JSON.stringify({
            ...options,
            image: undefined,
            messages: options.messages.map((msg) => ({
              ...msg,
              content: Array.isArray(msg.content)
                ? msg.content.map((c) =>
                    "image_url" in c
                      ? { ...c, image_url: { url: "[IMAGE_REDACTED]" } }
                      : c,
                  )
                : msg.content,
            })),
          }),
          type: "object",
        },
        modelName: {
          value: this.model.modelId,
          type: "string",
        },
      },
    });

    const formattedMessages: ModelMessage[] = options.messages.map(
      (message) => {
        if (Array.isArray(message.content)) {
          if (message.role === "system") {
            // System prompts are flattened to a single newline-joined string;
            // non-text parts contribute an empty line.
            const systemMessage: CoreSystemMessage = {
              role: "system",
              content: message.content
                .map((c) => ("text" in c ? c.text : ""))
                .join("\n"),
            };
            return systemMessage;
          }

          const contentParts = message.content.map((content) => {
            if ("image_url" in content) {
              const imageContent: ImagePart = {
                type: "image",
                image: content.image_url.url,
              };
              return imageContent;
            } else {
              const textContent: TextPart = {
                type: "text",
                text: content.text,
              };
              return textContent;
            }
          });

          if (message.role === "user") {
            const userMessage: CoreUserMessage = {
              role: "user",
              content: contentParts,
            };
            return userMessage;
          } else {
            // Assistant messages are text-only: images become a placeholder.
            const textOnlyParts = contentParts.map((part) => ({
              type: "text" as const,
              text: part.type === "image" ? "[Image]" : part.text,
            }));
            const assistantMessage: CoreAssistantMessage = {
              role: "assistant",
              content: textOnlyParts,
            };
            return assistantMessage;
          }
        }

        return {
          role: message.role,
          content: message.content,
        };
      },
    );

    let objectResponse: Awaited<ReturnType<typeof generateObject>>;
    const isGPT5 = this.model.modelId.includes("gpt-5");
    const isCodex = this.model.modelId.includes("codex");
    const usesLowReasoningEffort =
      (this.model.modelId.includes("gpt-5.1") ||
        this.model.modelId.includes("gpt-5.2")) &&
      !isCodex;
    // Kimi models only support temperature=1
    const isKimi = this.model.modelId.includes("kimi");
    const temperature = isKimi ? 1 : options.temperature;

    const needsPromptJsonFallback =
      AISdkClient.PROMPT_JSON_FALLBACK_PATTERNS.some((p) =>
        this.model.modelId.includes(p),
      );

    if (options.response_model) {
      // Log LLM request for generateObject (extract)
      const llmRequestId = uuidv7();
      const promptSummary = extractLlmPromptSummary(options.messages, {
        hasSchema: true,
      });
      FlowLogger.logLlmRequest({
        requestId: llmRequestId,
        model: this.model.modelId,
        prompt: promptSummary,
      });

      // For models that don't support native structured outputs, add a prompt instruction
      if (needsPromptJsonFallback) {
        const parsedSchema = JSON.stringify(
          toJsonSchema(options.response_model.schema),
        );

        formattedMessages.push({
          role: "user",
          content: `Respond in this zod schema format:\n${parsedSchema}\n
You must respond in JSON format. respond WITH JSON. Do not include any other text, formatting or markdown in your output. Do not include \`\`\` or \`\`\`json in your response. Only the JSON object itself.`,
        });
      }

      try {
        objectResponse = await generateObject({
          model: this.model,
          messages: formattedMessages,
          schema: options.response_model.schema,
          temperature,
          providerOptions: isGPT5
            ? {
                openai: {
                  textVerbosity: isCodex ? "medium" : "low", // codex models only support 'medium'
                  reasoningEffort: isCodex
                    ? "medium"
                    : usesLowReasoningEffort
                      ? "low"
                      : "minimal",
                },
              }
            : undefined,
        });
      } catch (err) {
        // Log error response to maintain request/response pairing
        FlowLogger.logLlmResponse({
          requestId: llmRequestId,
          model: this.model.modelId,
          output: `[error: ${err instanceof Error ? err.message : "unknown"}]`,
        });

        // Surface the SDK's diagnostics for "no object generated" failures.
        if (NoObjectGeneratedError.isInstance(err)) {
          this.logger?.({
            category: "AISDK error",
            message: err.message,
            level: 0,
            auxiliary: {
              cause: {
                value: JSON.stringify(err.cause ?? {}),
                type: "object",
              },
              text: {
                value: err.text ?? "",
                type: "string",
              },
              response: {
                value: JSON.stringify(err.response ?? {}),
                type: "object",
              },
              usage: {
                value: JSON.stringify(err.usage ?? {}),
                type: "object",
              },
              finishReason: {
                value: err.finishReason ?? "unknown",
                type: "string",
              },
              requestId: {
                value: options.requestId,
                type: "string",
              },
            },
          });
        }
        // Every failure is rethrown unchanged.
        throw err;
      }

      const result = {
        data: objectResponse.object,
        usage: AISdkClient.toUsage(objectResponse.usage),
      } as T;

      // Log LLM response for generateObject
      FlowLogger.logLlmResponse({
        requestId: llmRequestId,
        model: this.model.modelId,
        output: JSON.stringify(objectResponse.object),
        inputTokens: objectResponse.usage.inputTokens,
        outputTokens: objectResponse.usage.outputTokens,
      });

      this.logger?.({
        category: "aisdk",
        message: "response",
        level: 1,
        auxiliary: {
          response: {
            value: JSON.stringify({
              object: objectResponse.object,
              usage: objectResponse.usage,
              finishReason: objectResponse.finishReason,
              // Omit request and response properties that might contain images
            }),
            type: "object",
          },
          requestId: {
            value: options.requestId,
            type: "string",
          },
        },
      });

      return result;
    }

    const tools: ToolSet = {};
    if (options.tools && options.tools.length > 0) {
      for (const tool of options.tools) {
        tools[tool.name] = {
          description: tool.description,
          inputSchema: tool.parameters,
        } as Tool;
      }
    }

    // Log LLM request for generateText (act/observe)
    const llmRequestId = uuidv7();
    const toolCount = Object.keys(tools).length;
    const hasTools = toolCount > 0;
    const promptSummary = extractLlmPromptSummary(options.messages, {
      toolCount,
    });
    FlowLogger.logLlmRequest({
      requestId: llmRequestId,
      model: this.model.modelId,
      prompt: promptSummary,
    });

    let textResponse: Awaited<ReturnType<typeof generateText>>;
    try {
      textResponse = await generateText({
        model: this.model,
        messages: formattedMessages,
        tools: hasTools ? tools : undefined,
        // Anything other than "required" / "none" falls back to "auto".
        toolChoice: hasTools
          ? options.tool_choice === "required"
            ? "required"
            : options.tool_choice === "none"
              ? "none"
              : "auto"
          : undefined,
        temperature,
      });
    } catch (err) {
      // Log error response to maintain request/response pairing
      FlowLogger.logLlmResponse({
        requestId: llmRequestId,
        model: this.model.modelId,
        output: `[error: ${err instanceof Error ? err.message : "unknown"}]`,
      });
      throw err;
    }

    // Transform AI SDK response to match LLMResponse format expected by operator handler
    const transformedToolCalls = (textResponse.toolCalls || []).map(
      (toolCall) => ({
        id: toolCall.toolCallId || `call_${AISdkClient.syntheticIdSuffix()}`,
        type: "function",
        function: {
          name: toolCall.toolName,
          arguments: JSON.stringify(toolCall.input),
        },
      }),
    );

    const result = {
      id: `chatcmpl_${AISdkClient.syntheticIdSuffix()}`,
      object: "chat.completion",
      created: Math.floor(Date.now() / 1000),
      model: this.model.modelId,
      choices: [
        {
          index: 0,
          message: {
            role: "assistant",
            content: textResponse.text || null,
            tool_calls: transformedToolCalls,
          },
          finish_reason: textResponse.finishReason || "stop",
        },
      ],
      usage: AISdkClient.toUsage(textResponse.usage),
    } as T;

    // Log LLM response for generateText
    FlowLogger.logLlmResponse({
      requestId: llmRequestId,
      model: this.model.modelId,
      output:
        textResponse.text ||
        (transformedToolCalls.length > 0
          ? `[${transformedToolCalls.length} tool calls]`
          : ""),
      inputTokens: textResponse.usage.inputTokens,
      outputTokens: textResponse.usage.outputTokens,
    });

    this.logger?.({
      category: "aisdk",
      message: "response",
      level: 2,
      auxiliary: {
        response: {
          value: JSON.stringify({
            text: textResponse.text,
            usage: textResponse.usage,
            finishReason: textResponse.finishReason,
            // Omit request and response properties that might contain images
          }),
          type: "object",
        },
        requestId: {
          value: options.requestId,
          type: "string",
        },
      },
    });

    return result;
  }
}


================================================
FILE: packages/core/lib/v3/logger.ts
================================================
import type { LogLine } from "./types/public/logs.js";
import { AsyncLocalStorage } from "node:async_hooks";

/**
 * Stagehand V3 Logging
 *
 * Design goals:
 * - Support concurrent V3 instances with independent logger configuration
 * - Each V3 instance has its own StagehandLogger (handles usePino, verbose, externalLogger)
 * - Provide AsyncLocalStorage-based routing for backward compatibility with handler code
 * - Prevent cross-talk between concurrent instances
 *
 * How it works:
 * - Each V3 instance creates a StagehandLogger in its constructor (per-instance config)
 * - bindInstanceLogger()/unbindInstanceLogger(): registers logger callback per instance ID
 * - withInstanceLogContext(): establishes AsyncLocalStorage context for an async operation
 * - v3Logger(): routes logs using AsyncLocalStorage with console fallback
 *
 * ⚠️ CONTEXT LOSS SCENARIOS:
 * 1. setTimeout/setInterval callbacks lose context (runs outside AsyncLocalStorage scope)
 * 2. Event emitters (EventEmitter.on) lose context (callback invoked outside scope)
 * 3. Fire-and-forget promises (void promise) lose context if they don't complete synchronously
 * 4. Third-party library callbacks may lose context depending on implementation
 *
 * WORKAROUND for context loss:
 * - Use explicit logger parameter instead of v3Logger()
 * - Wrap callback in withInstanceLogContext() manually
 * - Or let logs fall back to console (acceptable for edge cases)
 */

// Per-instance routing using AsyncLocalStorage
// `logContext` carries the instance ID of the operation currently running;
// it is set by withInstanceLogContext() and read by v3Logger().
const logContext = new AsyncLocalStorage<string>();
// Registry of logger callbacks keyed by instance ID; populated by
// bindInstanceLogger() and cleared by unbindInstanceLogger().
const instanceLoggers = new Map<string, (line: LogLine) => void>();

/**
 * Registers the logger callback for an instance, replacing any callback
 * previously registered under the same ID.
 *
 * @param instanceId - Key under which the callback is stored.
 * @param logger - Callback that receives log lines routed to this instance.
 */
export function bindInstanceLogger(
  instanceId: string,
  logger: (line: LogLine) => void,
): void {
  void instanceLoggers.set(instanceId, logger);
}

/**
 * Removes the logger callback registered for an instance, if there is one.
 *
 * @param instanceId - Key of the callback to drop from the registry.
 */
export function unbindInstanceLogger(instanceId: string): void {
  void instanceLoggers.delete(instanceId);
}

/**
 * Runs `fn` with `instanceId` stored as the current AsyncLocalStorage value,
 * so v3Logger() calls made during that run resolve to this instance.
 *
 * @param instanceId - Instance ID to expose while `fn` runs.
 * @param fn - Work to execute inside the context.
 * @returns Whatever `fn` returns.
 */
export function withInstanceLogContext<T>(instanceId: string, fn: () => T): T {
  const outcome = logContext.run(instanceId, fn);
  return outcome;
}

/**
 * Delivers a log line to the logger bound to the current AsyncLocalStorage
 * instance ID. When there is no ID, no bound logger, or the bound logger
 * throws, the line is formatted and written to the console instead.
 *
 * @param line - Log line to route.
 */
export function v3Logger(line: LogLine): void {
  const instanceId = logContext.getStore();
  const boundLogger = instanceId ? instanceLoggers.get(instanceId) : undefined;

  if (boundLogger) {
    // Hand the logger its own shallow copy (auxiliary map included).
    const copy: LogLine = {
      ...line,
      auxiliary: {
        ...(line.auxiliary || {}),
      },
    };
    try {
      boundLogger(copy);
      return;
    } catch {
      // fallback to console below
    }
  }

  // Fallback: log to console when no instance context
  const stamp = line.timestamp ?? new Date().toISOString();
  const level = line.level ?? 1;
  const label = level === 0 ? "ERROR" : level === 2 ? "DEBUG" : "INFO";
  const segments: string[] = [`[${stamp}] ${label}: ${line.message}`];

  if (line.auxiliary) {
    Object.entries(line.auxiliary).forEach(([key, { value, type }]) => {
      let rendered = value;
      if (type === "object") {
        try {
          // Pretty-print JSON payloads, indenting continuation lines so they
          // sit under the key.
          rendered = JSON.stringify(JSON.parse(value), null, 2).replace(
            /\n/g,
            "\n    ",
          );
        } catch {
          rendered = value;
        }
      }
      segments.push(`    ${key}: ${rendered}`);
    });
  }

  const output = segments.join("\n");

  switch (level) {
    case 0:
      console.error(output);
      break;
    case 2:
      (console.debug ?? console.log)(output);
      break;
    default:
      console.log(output);
  }
}


================================================
FILE: packages/core/lib/v3/mcp/connection.ts
================================================
import {
  Client,
  ClientOptions,
} from "@modelcontextprotocol/sdk/client/index.js";
import {
  StreamableHTTPClientTransport,
  type StreamableHTTPClientTransportOptions,
} from "@modelcontextprotocol/sdk/client/streamableHttp.js";
import { StdioClientTransport } from "@modelcontextprotocol/sdk/client/stdio.js";
import { MCPConnectionError } from "../types/public/sdkErrors.js";

/**
 * Object form of a URL-based MCP server configuration accepted by
 * `connectToMCPServer`.
 */
export interface ConnectToMCPServerOptions {
  /** Address of the MCP server; converted with `new URL(...)` for the streamable HTTP transport. */
  serverUrl: string | URL;
  /** Options forwarded when the MCP `Client` is constructed. */
  clientOptions?: ClientOptions;
  /** Options passed to the `StreamableHTTPClientTransport` constructor. */
  requestOptions?: StreamableHTTPClientTransportOptions;
}

/**
 * Configuration for an MCP server reached over stdio. `connectToMCPServer`
 * recognises it by the presence of `command` and hands the whole object to
 * `StdioClientTransport`.
 */
export interface StdioServerConfig {
  /** Command for the stdio transport (presumably the executable to launch — confirm against the SDK). */
  command: string;
  /** Optional arguments accompanying `command`. */
  args?: string[];
  /** Optional environment variables supplied alongside `command`. */
  env?: Record<string, string>;
}

/**
 * Builds a readable identifier for a server configuration, for use in error
 * messages. Object configs would otherwise stringify as "[object Object]".
 * Environment variables are deliberately left out of the label.
 */
const describeMCPServerConfig = (
  serverConfig: string | URL | StdioServerConfig | ConnectToMCPServerOptions,
): string => {
  if (typeof serverConfig === "string" || serverConfig instanceof URL) {
    return serverConfig.toString();
  }
  if ("command" in serverConfig) {
    return [serverConfig.command, ...(serverConfig.args ?? [])].join(" ");
  }
  return String(serverConfig.serverUrl);
};

/**
 * Connects to an MCP server and verifies the connection with a ping.
 *
 * @param serverConfig - One of:
 *   - a URL (string or `URL`) for a streamable-HTTP server,
 *   - a {@link ConnectToMCPServerOptions} object (URL plus client/transport options),
 *   - a {@link StdioServerConfig} object (detected by its `command` property).
 * @returns A connected client that has answered a ping.
 * @throws MCPConnectionError when the transport cannot be created, the
 *   connection fails, or the ping fails; the underlying error is attached.
 */
export const connectToMCPServer = async (
  serverConfig: string | URL | StdioServerConfig | ConnectToMCPServerOptions,
): Promise<Client> => {
  const serverLabel = describeMCPServerConfig(serverConfig);

  try {
    let transport;
    let clientOptions: ClientOptions | undefined;
    let requestOptions: StreamableHTTPClientTransportOptions | undefined;

    // Check if it's a stdio config (has 'command' property)
    if (typeof serverConfig === "object" && "command" in serverConfig) {
      transport = new StdioClientTransport(serverConfig);
    } else {
      // Handle URL-based connection
      let serverUrl: string | URL;

      if (typeof serverConfig === "string" || serverConfig instanceof URL) {
        serverUrl = serverConfig;
      } else {
        serverUrl = (serverConfig as ConnectToMCPServerOptions).serverUrl;
        clientOptions = (serverConfig as ConnectToMCPServerOptions)
          .clientOptions;
        requestOptions = (serverConfig as ConnectToMCPServerOptions)
          .requestOptions;
      }

      transport = new StreamableHTTPClientTransport(
        new URL(serverUrl),
        requestOptions,
      );
    }

    // The MCP Client takes its options (capabilities etc.) as the SECOND
    // constructor argument. The spread into the client-info object is kept
    // for backward compatibility with callers that overrode name/version.
    const client = new Client(
      {
        name: "Stagehand",
        version: "1.0.0",
        ...clientOptions,
      },
      clientOptions,
    );

    await client.connect(transport);

    try {
      await client.ping();
    } catch (pingError) {
      // Best-effort cleanup: a failing close must not mask the ping error.
      await client.close().catch(() => undefined);
      throw new MCPConnectionError(serverLabel, pingError);
    }

    return client;
  } catch (error) {
    // Handle any errors during transport/client creation or connection
    if (error instanceof MCPConnectionError) {
      throw error; // Re-throw our custom error
    }
    throw new MCPConnectionError(serverLabel, error);
  }
};


================================================
FILE: packages/core/lib/v3/mcp/utils.ts
================================================
import { Client } from "@modelcontextprotocol/sdk/client/index.js";
import { ToolSet } from "ai";
import { JsonSchema, jsonSchemaToZod } from "../../utils.js";
import { connectToMCPServer } from "./connection.js";

/**
 * Merges the tools exposed by a list of MCP clients into a copy of the
 * user-supplied tool set.
 *
 * String entries are treated as server addresses and connected first. Every
 * page of each client's tool listing is walked; a listed tool is stored under
 * its name, overwriting any earlier entry with that name, and its `execute`
 * forwards the input to `callTool` on the client that listed it.
 *
 * @param clients - Connected MCP clients and/or server addresses.
 * @param userTools - Tools to start from; this object itself is not modified.
 * @returns The combined tool set.
 */
export const resolveTools = async (
  clients: (Client | string)[],
  userTools: ToolSet,
): Promise<ToolSet> => {
  const merged: ToolSet = { ...userTools };

  for (const entry of clients) {
    const mcpClient: Client =
      typeof entry === "string" ? await connectToMCPServer(entry) : entry;

    // Follow the pagination cursor until the server stops returning one.
    let cursor: string | undefined = undefined;
    do {
      const page = await mcpClient.listTools({ cursor });

      page.tools.forEach((remoteTool) => {
        merged[remoteTool.name] = {
          description: remoteTool.description,
          inputSchema: jsonSchemaToZod(remoteTool.inputSchema as JsonSchema),
          execute: async (input) =>
            await mcpClient.callTool({
              name: remoteTool.name,
              arguments: input,
            }),
        };
      });

      cursor = page.nextCursor;
    } while (cursor);
  }

  return merged;
};


================================================
FILE: packages/core/lib/v3/runtimePaths.ts
================================================
/**
 * Keep this file in sync with:
 * - /packages/core/lib/v3/runtimePaths.ts
 * - /packages/server-v3/scripts/runtimePaths.ts
 * - /packages/server-v4/scripts/runtimePaths.ts
 * - /packages/evals/runtimePaths.ts
 * - /packages/docs/scripts/runtimePaths.js
 */
import path from "node:path";
import { fileURLToPath } from "node:url";
import { createRequire } from "node:module";

// Path fragment that marks a file as belonging to this package; callsites whose
// normalized path contains it are preferred when resolving the caller file.
const PACKAGE_SEGMENT = "/packages/core/";
// Pseudo file names that are skipped because they do not map to a file on disk.
const EVAL_FRAMES = new Set(["[eval]", "[eval]-wrapper"]);
// Names of the helpers in this module. Stack frames produced by these functions
// are ignored so that the resolved "caller" is the code that invoked them.
// Keep this list in sync when adding or renaming helpers in this file.
const INTERNAL_FRAME_NAMES = new Set([
  "readCallsites",
  "readCallsitePath",
  "resolveCallerFilePath",
  "getCurrentFilePath",
  "getCurrentDirPath",
  "getRepoRootDir",
  "getPackageRootDir",
  "createRequireFromCaller",
  "isMainModule",
]);

/**
 * Converts a path or `file://` URL into an absolute path that uses forward
 * slashes only.
 *
 * @param value - A filesystem path (absolute or relative) or a `file://` URL.
 * @returns The resolved absolute path with every backslash replaced by `/`.
 */
const normalizePath = (value: string): string => {
  let fsPath = value;
  if (value.startsWith("file://")) {
    fsPath = fileURLToPath(value);
  }
  const absolute = path.resolve(fsPath);
  return absolute.split("\\").join("/");
};

/**
 * Captures the current call stack as structured `CallSite` objects.
 *
 * Temporarily replaces `Error.prepareStackTrace` with a hook that returns the
 * raw callsite array, so reading `.stack` on a fresh `Error` yields that array
 * instead of a formatted string. The previous hook is restored in `finally`,
 * even if the capture throws.
 *
 * @returns The captured callsites, or an empty array when `.stack` is nullish.
 */
const readCallsites = (): NodeJS.CallSite[] => {
  const previousPrepare = Error.prepareStackTrace;
  try {
    Error.prepareStackTrace = (_, stack) => stack;
    return (
      // `.stack` is typed as a string, hence the cast through `unknown`.
      (new Error().stack as unknown as NodeJS.CallSite[] | undefined) ?? []
    );
  } finally {
    Error.prepareStackTrace = previousPrepare;
  }
};

/**
 * `CallSite` widened with an optional `getScriptNameOrSourceURL` accessor.
 * The accessor is declared optional, so callers must use optional chaining.
 */
type CallSiteWithScriptName = NodeJS.CallSite & {
  getScriptNameOrSourceURL?: () => string | null;
};

/**
 * Extracts a usable, normalized file path from a callsite.
 *
 * The file name is preferred; `getScriptNameOrSourceURL` (when present) is the
 * fallback. Frames without a path, `node:` built-ins, and eval pseudo-frames
 * yield `null`.
 *
 * @param callsite - The stack frame to inspect.
 * @returns The normalized path, or `null` when the frame should be ignored.
 */
const readCallsitePath = (callsite: NodeJS.CallSite): string | null => {
  const candidate =
    callsite.getFileName() ??
    (callsite as CallSiteWithScriptName).getScriptNameOrSourceURL?.();

  if (
    !candidate ||
    candidate.startsWith("node:") ||
    EVAL_FRAMES.has(candidate)
  ) {
    return null;
  }
  return normalizePath(candidate);
};

/**
 * Tells whether a stack frame was produced by one of this module's helpers.
 *
 * The frame's function name and method name are checked first; as a last
 * resort the rendered frame text is searched for `<name> (` or `.<name> (`.
 *
 * @param callsite - The stack frame to classify.
 * @returns `true` when the frame belongs to a helper in `INTERNAL_FRAME_NAMES`.
 */
const isInternalCallsite = (callsite: NodeJS.CallSite): boolean => {
  const isInternalName = (name: string | null | undefined): boolean =>
    name ? INTERNAL_FRAME_NAMES.has(name) : false;

  // `||` keeps the method-name lookup lazy, as in a sequential check.
  if (
    isInternalName(callsite.getFunctionName()) ||
    isInternalName(callsite.getMethodName())
  ) {
    return true;
  }

  const rendered = callsite.toString();
  return [...INTERNAL_FRAME_NAMES].some(
    (frameName) =>
      rendered.includes(`${frameName} (`) ||
      rendered.includes(`.${frameName} (`),
  );
};

/**
 * Resolves the file path of the code that called into this module.
 *
 * Walks the captured stack from the innermost frame outwards, ignoring frames
 * without a usable path and frames belonging to this module's helpers. The
 * first remaining frame inside `PACKAGE_SEGMENT` wins; if there is none, the
 * first remaining frame of any kind is used.
 *
 * @returns The normalized path of the selected frame.
 * @throws Error when no frame qualifies.
 */
const resolveCallerFilePath = (): string => {
  let packageHit: string | undefined;
  let fallbackHit: string | undefined;

  // Every frame is visited (no early exit) so only the first hit of each kind is kept.
  for (const frame of readCallsites()) {
    const framePath = readCallsitePath(frame);
    if (!framePath) continue;
    if (isInternalCallsite(frame)) continue;

    if (framePath.includes(PACKAGE_SEGMENT)) {
      if (packageHit === undefined) packageHit = framePath;
    } else if (fallbackHit === undefined) {
      fallbackHit = framePath;
    }
  }

  const resolved = packageHit ?? fallbackHit;
  if (!resolved) {
    throw new Error("Unable to resolve caller file path.");
  }
  return resolved;
};

/**
 * Returns the normalized path of the calling file, as determined from the
 * current call stack by `resolveCallerFilePath`.
 * The function name is listed in `INTERNAL_FRAME_NAMES`; renaming it requires
 * updating that list.
 */
export const getCurrentFilePath = (): string => resolveCallerFilePath();

/** Returns the directory that contains the file reported by `getCurrentFilePath`. */
export const getCurrentDirPath = (): string =>
  path.dirname(getCurrentFilePath());

/**
 * Derives the repository root from the caller's file path by cutting the path
 * at the last occurrence of `PACKAGE_SEGMENT`.
 *
 * @returns The part of the caller path that precedes `PACKAGE_SEGMENT`.
 * @throws Error when the caller path does not contain `PACKAGE_SEGMENT`.
 */
export const getRepoRootDir = (): string => {
  const callerPath = getCurrentFilePath();
  const segmentStart = callerPath.lastIndexOf(PACKAGE_SEGMENT);
  if (segmentStart >= 0) {
    return callerPath.slice(0, segmentStart);
  }
  throw new Error(
    `Unable to determine repo root from ${callerPath} (missing ${PACKAGE_SEGMENT}).`,
  );
};

/**
 * Returns the package root: the repo root followed by `PACKAGE_SEGMENT`
 * without its trailing slash.
 */
export const getPackageRootDir = (): string =>
  `${getRepoRootDir()}${PACKAGE_SEGMENT.slice(0, -1)}`;

/** Creates a `require` function that resolves modules relative to the calling file. */
export const createRequireFromCaller = () =>
  createRequire(getCurrentFilePath());

/**
 * Reports whether the calling file is the script the process was started with.
 *
 * @returns `true` when the normalized `process.argv[1]` equals the caller's
 * file path; `false` when there is no entry script or the paths differ.
 */
export const isMainModule = (): boolean => {
  const [, entryScript] = process.argv;
  return entryScript
    ? normalizePath(entryScript) === getCurrentFilePath()
    : false;
};


================================================
FILE: packages/core/lib/v3/shutdown/cleanupLocal.ts
================================================
import fs from "node:fs";

/**
 * Best-effort teardown for a locally launched Chrome.
 *
 * Shared by `V3.close()` (normal shutdown) and the supervisor process (crash
 * cleanup). How Chrome is killed differs between the two, so the caller passes
 * a `killChrome` callback: chrome-launcher's `chrome.kill()` in-process, or a
 * raw `process.kill(pid)` from the supervisor.
 *
 * The profile directory is deleted only when it was created as a temp profile,
 * preservation was not requested, and a directory path is known. Failures of
 * either step are swallowed.
 *
 * @param opts.killChrome - Optional callback that terminates Chrome.
 * @param opts.userDataDir - Profile directory to remove, if eligible.
 * @param opts.createdTempProfile - Whether the profile directory is a temp one.
 * @param opts.preserveUserDataDir - When set, the directory is never removed.
 */
export async function cleanupLocalBrowser(opts: {
  killChrome?: () => Promise<void> | void;
  userDataDir?: string;
  createdTempProfile?: boolean;
  preserveUserDataDir?: boolean;
}): Promise<void> {
  if (opts.killChrome) {
    try {
      await opts.killChrome();
    } catch {
      // best-effort
    }
  }

  const ownsProfile = opts.createdTempProfile && !opts.preserveUserDataDir;
  const profileDir = opts.userDataDir;
  if (!ownsProfile || !profileDir) return;

  try {
    fs.rmSync(profileDir, { recursive: true, force: true });
  } catch {
    // ignore cleanup errors
  }
}


================================================
FILE: packages/core/lib/v3/shutdown/supervisor.ts
================================================
/**
 * Shutdown supervisor process.
 *
 * This process watches a stdin lifeline. When the parent dies, stdin closes
 * and the supervisor performs best-effort cleanup:
 * - LOCAL: kill Chrome + remove temp profile
 * - STAGEHAND_API: request session release
 */

import Browserbase from "@browserbasehq/sdk";
import type { ShutdownSupervisorConfig } from "../types/private/shutdown.js";
import { cleanupLocalBrowser } from "./cleanupLocal.js";

// Pause between liveness checks while waiting for a SIGTERM'd process to exit.
const SIGKILL_POLL_MS = 250;
// How long to wait after SIGTERM before escalating to SIGKILL.
const SIGKILL_TIMEOUT_MS = 7_000;
// Interval at which the Chrome PID is probed while the parent is still alive.
const PID_POLL_INTERVAL_MS = 500;

// `cleanupPromise` guarantees we execute cleanup at most once.
// Active supervisor configuration; `null` until `applyConfig` runs.
let config: ShutdownSupervisorConfig | null = null;
let cleanupPromise: Promise<void> | null = null;
// Guards `runShutdownSupervisor` against being started twice.
let started = false;
// Set once PID polling has observed ESRCH for the Chrome process.
let localPidKnownGone = false;

/**
 * Terminates the supervisor process with the given exit code (default 0).
 * Anything thrown by `process.exit` is swallowed.
 */
const exit = (code = 0): void => {
  try {
    process.exit(code);
  } catch {
    // ignore
  }
};

/**
 * Best-effort two-phase kill: SIGTERM first, then SIGKILL once the grace
 * period (`SIGKILL_TIMEOUT_MS`) has elapsed.
 *
 * Only ESRCH ("No such process") counts as "already gone"; any other probe
 * error is treated as "still alive" so that a failed probe never implies death.
 *
 * @param pid - Process id to terminate.
 */
const politeKill = async (pid: number): Promise<void> => {
  const errnoOf = (error: unknown): string | undefined =>
    (error as NodeJS.ErrnoException).code;

  // Signal 0 performs the existence check without delivering a signal.
  const stillRunning = (): boolean => {
    try {
      process.kill(pid, 0);
    } catch (error) {
      return errnoOf(error) !== "ESRCH";
    }
    return true;
  };

  const pause = (ms: number): Promise<void> =>
    new Promise((resolve) => setTimeout(resolve, ms));

  if (!stillRunning()) return;

  try {
    process.kill(pid, "SIGTERM");
  } catch (error) {
    // The process exited between the probe and the signal; nothing left to do.
    if (errnoOf(error) === "ESRCH") return;
  }

  const giveUpAt = Date.now() + SIGKILL_TIMEOUT_MS;
  for (; Date.now() < giveUpAt; ) {
    await pause(SIGKILL_POLL_MS);
    if (!stillRunning()) return;
  }

  try {
    process.kill(pid, "SIGKILL");
  } catch {
    // best-effort
  }
};

// Handle of the active PID poll, or `null` when polling is not running.
let pidPollTimer: NodeJS.Timeout | null = null;

/**
 * Local-only fallback: if Chrome dies while the parent still lives, run
 * cleanup and exit. Calling this while a poll is already active is a no-op.
 *
 * @param pid - Chrome process id to watch.
 */
const startPidPolling = (pid: number): void => {
  if (pidPollTimer !== null) return;

  const probe = (): void => {
    let gone = false;
    try {
      process.kill(pid, 0);
    } catch (error) {
      // Only ESRCH means the process is definitely gone.
      gone = (error as NodeJS.ErrnoException).code === "ESRCH";
    }
    if (!gone) return;

    localPidKnownGone = true;
    if (pidPollTimer !== null) {
      clearInterval(pidPollTimer);
      pidPollTimer = null;
    }
    void runCleanup("Browser process exited").finally(() => exit(0));
  };

  pidPollTimer = setInterval(probe, PID_POLL_INTERVAL_MS);
};

/**
 * Cleanup for the LOCAL configuration: terminate Chrome (unless it is already
 * known to be gone) and let `cleanupLocalBrowser` remove the temp profile.
 *
 * @param cfg - The LOCAL supervisor configuration.
 * @param reason - Human-readable trigger, included in the stderr log line.
 */
const cleanupLocal = async (
  cfg: Extract<ShutdownSupervisorConfig, { kind: "LOCAL" }>,
  reason: string,
) => {
  const { pid, userDataDir, createdTempProfile, preserveUserDataDir } = cfg;
  const deletingUserDataDir = Boolean(
    createdTempProfile && !preserveUserDataDir && userDataDir,
  );

  // If polling already observed ESRCH, avoid a follow-up PID kill.
  // The PID could be reused by a different process before cleanup runs.
  const killChrome =
    pid && !localPidKnownGone
      ? () => {
          console.error(
            `[shutdown-supervisor] Shutting down Chrome pid=${pid} (reason=${reason}, deletingUserDataDir=${deletingUserDataDir})`,
          );
          return politeKill(pid);
        }
      : undefined;

  await cleanupLocalBrowser({
    killChrome,
    userDataDir,
    createdTempProfile,
    preserveUserDataDir,
  });
};

/**
 * Cleanup for the STAGEHAND_API configuration: asks Browserbase to release the
 * session. Does nothing without both an API key and a session id, and swallows
 * any failure of the request.
 *
 * @param cfg - The STAGEHAND_API supervisor configuration.
 * @param reason - Human-readable trigger, included in the stderr log line.
 */
const cleanupBrowserbase = async (
  cfg: Extract<ShutdownSupervisorConfig, { kind: "STAGEHAND_API" }>,
  reason: string,
) => {
  const { apiKey, sessionId, projectId } = cfg;
  if (!apiKey || !sessionId) return;

  try {
    console.error(
      `[shutdown-supervisor] Ending Browserbase session ${sessionId} (reason=${reason})`,
    );
    const client = new Browserbase({ apiKey });
    const releaseRequest = {
      status: "REQUEST_RELEASE",
      ...(projectId ? { projectId } : {}),
    } as Browserbase.Sessions.SessionUpdateParams;
    await client.sessions.update(sessionId, releaseRequest);
  } catch {
    // best-effort cleanup
  }
};

/**
 * Idempotent cleanup entrypoint used by all supervisor shutdown paths.
 *
 * The first call starts the cleanup that matches the active configuration and
 * caches its promise; every later call returns that same promise, so the
 * `reason` of later calls is ignored.
 *
 * @param reason - Human-readable trigger forwarded to the cleanup routine.
 * @returns The shared cleanup promise.
 */
const runCleanup = (reason: string): Promise<void> => {
  if (cleanupPromise) return cleanupPromise;

  const performCleanup = async (): Promise<void> => {
    const cfg = config;
    if (!cfg) return;
    switch (cfg.kind) {
      case "LOCAL":
        await cleanupLocal(cfg, reason);
        break;
      case "STAGEHAND_API":
        await cleanupBrowserbase(cfg, reason);
        break;
      default:
        break;
    }
  };

  cleanupPromise = performCleanup();
  return cleanupPromise;
};

/**
 * Installs the supervisor configuration and resets the "Chrome already gone"
 * flag. For a LOCAL configuration with a pid, PID polling is started as well.
 *
 * @param nextConfig - Configuration to activate.
 */
const applyConfig = (nextConfig: ShutdownSupervisorConfig): void => {
  config = nextConfig;
  localPidKnownGone = false;

  if (nextConfig.kind !== "LOCAL" || !nextConfig.pid) return;
  startPidPolling(nextConfig.pid);
};

/**
 * Handler for a lost stdin lifeline: runs the (idempotent) cleanup and exits
 * with code 0 once it settles, whether it succeeded or failed.
 */
const onLifelineClosed = (reason: string) => {
  void runCleanup(reason).finally(() => exit(0));
};

/**
 * Extracts the supervisor configuration from command-line arguments.
 *
 * A configuration is only returned when `--supervisor` is present and
 * `--supervisor-config=<json>` carries a JSON object whose `kind` is one of the
 * known supervisor kinds. Payloads that parse as JSON but are not such an
 * object (numbers, strings, arrays, `null`, unknown kinds) are rejected just
 * like malformed JSON, so the process never starts supervising with a value
 * that no cleanup path can handle.
 *
 * @param argv - Arguments to inspect; defaults to `process.argv.slice(2)`.
 * @returns The parsed configuration, or `null` when absent or invalid.
 */
const parseConfigFromArgv = (
  argv: readonly string[] = process.argv.slice(2),
): ShutdownSupervisorConfig | null => {
  const prefix = "--supervisor-config=";
  const raw = argv.find((arg) => arg.startsWith(prefix))?.slice(prefix.length);
  if (!argv.includes("--supervisor") || !raw) return null;

  let parsed: unknown;
  try {
    parsed = JSON.parse(raw);
  } catch {
    return null;
  }

  // `typeof null === "object"`, so null has to be excluded explicitly.
  if (typeof parsed !== "object" || parsed === null) return null;

  const kind = (parsed as { kind?: unknown }).kind;
  if (kind !== "LOCAL" && kind !== "STAGEHAND_API") return null;

  return parsed as ShutdownSupervisorConfig;
};

/**
 * Starts the supervisor in the current process. Only the first call has any
 * effect.
 *
 * After applying the configuration, stdin is put into flowing mode and watched
 * as the parent's lifeline: `end`, `close` and `error` all trigger cleanup
 * followed by process exit.
 *
 * @param initialConfig - Configuration describing what to clean up.
 */
export const runShutdownSupervisor = (
  initialConfig: ShutdownSupervisorConfig,
): void => {
  if (started) return;
  started = true;
  applyConfig(initialConfig);

  // Stdin is the lifeline; losing it means parent is gone.
  const lifelineEvents: Array<[string, string]> = [
    ["end", "Stagehand process completed"],
    ["close", "Stagehand process completed"],
    ["error", "Stagehand process crashed or was killed"],
  ];

  try {
    process.stdin.resume();
    for (const [eventName, reason] of lifelineEvents) {
      process.stdin.on(eventName, () => onLifelineClosed(reason));
    }
  } catch {
    // ignore
  }
};

/**
 * Starts the supervisor when the arguments request it.
 *
 * @param argv - Arguments to inspect; defaults to `process.argv.slice(2)`.
 * @returns `true` when a configuration was found and the supervisor was
 * started, `false` otherwise.
 */
export const maybeRunShutdownSupervisorFromArgv = (
  argv: readonly string[] = process.argv.slice(2),
): boolean => {
  const supervisorConfig = parseConfigFromArgv(argv);
  if (supervisorConfig) {
    runShutdownSupervisor(supervisorConfig);
    return true;
  }
  return false;
};


================================================
FILE: packages/core/lib/v3/shutdown/supervisorClient.ts
================================================
/**
 * Parent-side helper for spawning the shutdown supervisor process.
 *
 * The supervisor runs out-of-process and watches a lifeline pipe. If the parent
 * dies, the supervisor performs best-effort cleanup (Chrome kill or Browserbase
 * session release) when keepAlive is false.
 */

import fs from "node:fs";
import path from "node:path";
import { spawn } from "node:child_process";
import { createRequire } from "node:module";
import type {
  ShutdownSupervisorConfig,
  ShutdownSupervisorHandle,
} from "../types/private/shutdown.js";
import {
  ShutdownSupervisorResolveError,
  ShutdownSupervisorSpawnError,
} from "../types/private/shutdownErrors.js";
import { getCurrentFilePath } from "../runtimePaths.js";

// Resolved once at module load; `getCurrentFilePath` inspects the call stack,
// so calling it here is meant to capture this module's own location.
const moduleFilename = getCurrentFilePath();
const moduleDir = path.dirname(moduleFilename);
// `require` bound to this module, used to load `node:sea` lazily.
const nodeRequire = createRequire(moduleFilename);

/**
 * Detects whether the process runs as a Node single executable application.
 *
 * @returns The truthiness of `node:sea`'s `isSea()`, or `false` when the
 * module cannot be loaded or the call throws.
 */
const isSeaRuntime = (): boolean => {
  let detected = false;
  try {
    const seaModule = nodeRequire("node:sea") as { isSea?: () => boolean };
    detected = Boolean(seaModule.isSea?.());
  } catch {
    detected = false;
  }
  return detected;
};

// SEA: re-exec current binary with supervisor args.
// Non-SEA: execute Stagehand CLI entrypoint with supervisor args.
// The CLI entrypoint is expected one directory above this module, as `cli.js`.
const resolveCliPath = (): string => `${moduleDir}/../cli.js`;

/**
 * Works out how to launch the supervisor process.
 *
 * - SEA runtime: re-run the current executable with the supervisor arguments.
 * - Otherwise: run the CLI entrypoint with the current Node binary. When only
 *   `supervisor.ts` (and no `supervisor.js`) sits next to this module, the
 *   `tsx` loader is added via `--import`.
 *
 * @param config - Configuration to hand to the supervisor.
 * @returns The command and its arguments, or `null` when the CLI entrypoint
 * does not exist.
 */
const resolveSupervisorCommand = (
  config: ShutdownSupervisorConfig,
): {
  command: string;
  args: string[];
} | null => {
  const supervisorArgs = ["--supervisor", serializeConfigArg(config)];
  const command = process.execPath;

  if (isSeaRuntime()) {
    return { command, args: supervisorArgs };
  }

  const cliPath = resolveCliPath();
  if (!fs.existsSync(cliPath)) return null;

  const runningFromSource =
    fs.existsSync(`${moduleDir}/supervisor.ts`) &&
    !fs.existsSync(`${moduleDir}/supervisor.js`);
  const loaderArgs = runningFromSource ? ["--import", "tsx"] : [];

  return { command, args: [...loaderArgs, cliPath, ...supervisorArgs] };
};

/**
 * Encodes the configuration as one `--supervisor-config=<json>` argument.
 * Single JSON arg keeps supervisor bootstrap parsing tiny and versionable.
 * The current process id is added to the payload as `parentPid`.
 *
 * @param config - Configuration to serialize.
 * @returns The complete command-line argument.
 */
const serializeConfigArg = (config: ShutdownSupervisorConfig): string => {
  const payload = { ...config, parentPid: process.pid };
  return "--supervisor-config=" + JSON.stringify(payload);
};

/**
 * Spawns the supervisor process used for crash cleanup.
 *
 * The child is detached and unref'd so it never keeps the parent's event loop
 * alive. Its stdin is a pipe held by the parent and acts as the lifeline; its
 * stderr is inherited so cleanup log lines remain visible.
 *
 * NOTE(review): the configuration travels as a command-line argument, so for
 * STAGEHAND_API configs the API key is part of the child's argv — confirm this
 * is acceptable for the target environments.
 *
 * @param config - What the supervisor should clean up.
 * @param opts.onError - Called with context `"resolve"` when no launch command
 * can be determined, and with `"spawn"` when the child emits an `error` event.
 * @returns A handle whose `stop()` sends SIGTERM to the supervisor, or `null`
 * when no launch command could be resolved.
 */
export function startShutdownSupervisor(
  config: ShutdownSupervisorConfig,
  opts?: { onError?: (error: Error, context: string) => void },
): ShutdownSupervisorHandle | null {
  const launch = resolveSupervisorCommand(config);
  if (launch === null) {
    opts?.onError?.(
      new ShutdownSupervisorResolveError(
        "Shutdown supervisor entry missing (expected Stagehand CLI entrypoint).",
      ),
      "resolve",
    );
    return null;
  }

  const supervisor = spawn(launch.command, launch.args, {
    detached: true,
    // stdin is the parent lifeline.
    // Preserve supervisor stderr so crash-cleanup debug lines are visible.
    stdio: ["pipe", "ignore", "inherit"],
  });

  supervisor.on("error", (spawnFailure) => {
    opts?.onError?.(
      new ShutdownSupervisorSpawnError(
        `Shutdown supervisor failed to start: ${spawnFailure.message}`,
      ),
      "spawn",
    );
  });

  try {
    supervisor.unref();
    // The stdin pipe may expose `unref`, which the typings do not declare.
    (supervisor.stdin as unknown as { unref?: () => void } | null)?.unref?.();
  } catch {
    // best-effort: avoid keeping the event loop alive
  }

  return {
    // Normal close path: terminate supervisor directly.
    stop: () => {
      try {
        supervisor.kill("SIGTERM");
      } catch {
        // ignore
      }
    },
  };
}


================================================
FILE: packages/core/lib/v3/timeoutConfig.ts
================================================
import { TimeoutError } from "./types/public/sdkErrors.js";

/**
 * Reads a timeout, in milliseconds, from an environment variable.
 *
 * Surrounding whitespace is trimmed and a trailing `ms` suffix (any case) is
 * dropped before the value is converted with `Number`.
 *
 * @param name - Name of the environment variable.
 * @returns The parsed value when it is a finite number greater than zero;
 * `undefined` when the variable is unset, empty, or not such a number.
 */
export function getEnvTimeoutMs(name: string): number | undefined {
  const raw = process.env[name];
  if (!raw) return undefined;

  const parsed = Number(raw.trim().replace(/ms$/i, ""));
  return Number.isFinite(parsed) && parsed > 0 ? parsed : undefined;
}

/**
 * Awaits `promise`, rejecting with a `TimeoutError` if it has not settled
 * within `timeoutMs`.
 *
 * No timeout is applied when `timeoutMs` is not a finite number greater than
 * zero (`null`, `undefined`, `NaN`, `Infinity`, `0`, negatives).
 *
 * Node stores timer delays as 32-bit signed integers: a delay above
 * 2_147_483_647 ms is silently replaced by 1 ms, which would make a very large
 * timeout fire almost immediately. The timer delay is therefore clamped to
 * that maximum; the `TimeoutError` still reports the requested `timeoutMs`.
 *
 * The underlying operation is not cancelled on timeout; only the wait ends.
 *
 * @param promise - The operation to wait for.
 * @param timeoutMs - Maximum wait in milliseconds, or a non-positive /
 * non-finite / nullish value to wait indefinitely.
 * @param operation - Label passed to `TimeoutError`.
 * @returns The value `promise` resolves with.
 * @throws TimeoutError when the timeout elapses first; otherwise whatever
 * `promise` rejects with.
 */
export async function withTimeout<T>(
  promise: Promise<T>,
  timeoutMs: number | null | undefined,
  operation: string,
): Promise<T> {
  if (
    typeof timeoutMs !== "number" ||
    !Number.isFinite(timeoutMs) ||
    timeoutMs <= 0
  ) {
    return await promise;
  }

  // Largest delay the timer implementation accepts without overflowing.
  const maxTimerDelayMs = 2_147_483_647;
  const delayMs = Math.min(timeoutMs, maxTimerDelayMs);

  let timeoutId: NodeJS.Timeout | undefined;
  const timeoutPromise = new Promise<never>((_, reject) => {
    timeoutId = setTimeout(() => {
      reject(new TimeoutError(operation, timeoutMs));
    }, delayMs);
  });
  try {
    return await Promise.race([promise, timeoutPromise]);
  } finally {
    // Always clear the timer so it cannot keep the event loop alive.
    if (timeoutId !== undefined) clearTimeout(timeoutId);
  }
}


================================================
FILE: packages/core/lib/v3/types/private/agent.ts
================================================
/**
 * Describes one tool invocation together with its outcome.
 * NOTE(review): presumably the input for converting agent tool calls into
 * recorded actions — confirm against the call sites.
 */
export interface ActionMappingOptions {
  /** Name of the tool that was called. */
  toolCallName: string;
  /** Value the tool produced; typed `unknown`, so consumers must narrow it. */
  toolResult: unknown;
  /** Arguments of the call, keyed by argument name. */
  args: Record<string, unknown>;
  /** Optional reasoning text associated with the call. */
  reasoning?: string;
}


================================================
FILE: packages/core/lib/v3/types/private/api.ts
================================================
import type { Protocol } from "devtools-protocol";

/**
 * Plain-data description of a network response, built around the CDP
 * `Network.Response` payload plus bookkeeping fields.
 * NOTE(review): field meanings below are inferred from their names and types;
 * confirm against the code that produces and consumes this shape.
 */
export interface SerializableResponse {
  /** Identifier of the request this response belongs to. */
  requestId: string;
  /** Frame the request was issued from, when known. */
  frameId?: string;
  /** Loader the request is associated with, when known. */
  loaderId?: string;
  /** The CDP response payload. */
  response: Protocol.Network.Response;
  /** Presumably whether the response was served by a service worker. */
  fromServiceWorkerFlag?: boolean;
  /** Presumably whether the "finished" state has already settled. */
  finishedSettled?: boolean;
  /** Additional headers, or `null`; presumably from CDP's extra-info event. */
  extraInfoHeaders?: Protocol.Network.Headers | null;
  /** Raw text form of the additional headers, when available. */
  extraInfoHeadersText?: string;
}


================================================
FILE: packages/core/lib/v3/types/private/cache.ts
================================================
import type {
  ActOptions,
  ActResult,
  AvailableModel,
  Logger,
  AgentResult,
  Action,
  LoadState,
} from "../public/index.js";
import { CacheStorage } from "../../cache/CacheStorage.js";
import type { ActHandler } from "../../handlers/actHandler.js";
import type { V3Context } from "../../understudy/context.js";
import type { LLMClient } from "../../llm/LLMClient.js";

/**
 * Signature of an `act` function: takes a natural-language instruction plus
 * optional `ActOptions` and resolves with an `ActResult`.
 */
export type ActFn = (
  instruction: string,
  options?: ActOptions,
) => Promise<ActResult>;

/**
 * Everything that identifies one agent execution for caching purposes.
 * NOTE(review): how `cacheKey` is derived from the other fields is not visible
 * here — see the agent cache implementation.
 */
export type AgentCacheContext = {
  instruction: string;
  startUrl: string;
  options: SanitizedAgentExecuteOptions;
  configSignature: string;
  cacheKey: string;
  /** Variable keys used in this execution (for cache key) */
  variableKeys: string[];
  /** Variable values to substitute during replay */
  variables?: Record<string, string>;
};

/** A cached agent entry paired with the key it is stored under. */
export type AgentCacheTransferPayload = {
  cacheKey: string;
  entry: CachedAgentEntry;
};

/**
 * Dependencies handed to the agent cache. Most collaborators are supplied as
 * getter functions rather than values, so they are looked up at call time.
 */
export type AgentCacheDeps = {
  storage: CacheStorage;
  logger: Logger;
  /** May return `null`; callers must handle the missing handler. */
  getActHandler: () => ActHandler | null;
  /** May return `null`; callers must handle the missing context. */
  getContext: () => V3Context | null;
  getDefaultLlmClient: () => LLMClient;
  getBaseModelName: () => AvailableModel;
  getSystemPrompt: () => string | undefined;
  /** Optional DOM-settle timeout, in milliseconds per the name. */
  domSettleTimeoutMs?: number;
  act: ActFn;
  // NOTE(review): presumably keeps the most recent entry in memory instead of
  // writing it immediately — confirm in the cache implementation.
  bufferLatestEntry?: boolean;
};

/** Everything that identifies one `act` call for caching purposes. */
export type ActCacheContext = {
  instruction: string;
  cacheKey: string;
  pageUrl: string;
  /** Names of the variables involved in the call. */
  variableKeys: string[];
  /** Variable values, keyed by name, when provided. */
  variables?: Record<string, string>;
};

/** Dependencies handed to the `act` cache. */
export type ActCacheDeps = {
  storage: CacheStorage;
  logger: Logger;
  /** May return `null`; callers must handle the missing handler. */
  getActHandler: () => ActHandler | null;
  getDefaultLlmClient: () => LLMClient;
  /** Optional DOM-settle timeout, in milliseconds per the name. */
  domSettleTimeoutMs?: number;
};

/**
 * Outcome of reading a JSON value. `value` is `null` when nothing was
 * obtained; `error` carries the failure when one occurred.
 */
export type ReadJsonResult<T> = {
  value: T | null;
  /** Location that was read, when known. */
  path?: string;
  error?: unknown;
};

/** Outcome of writing a JSON value; `error` is set when the write failed. */
export type WriteJsonResult = {
  /** Location that was written, when known. */
  path?: string;
  error?: unknown;
};

/** Persisted form of a cached `act` call. */
export interface CachedActEntry {
  /** Schema version of the entry; currently always the literal `1`. */
  version: 1;
  instruction: string;
  url: string;
  variableKeys: string[];
  /** The actions recorded for the instruction. */
  actions: Action[];
  actionDescription?: string;
  message?: string;
}

/**
 * One step of a recorded agent run.
 *
 * Besides the known step shapes, the union ends with a catch-all member that
 * accepts any object with a string `type`. Because of that member, checking
 * `type` alone does not narrow a value to one of the specific step interfaces.
 */
export type AgentReplayStep =
  | AgentReplayActStep
  | AgentReplayFillFormStep
  | AgentReplayGotoStep
  | AgentReplayScrollStep
  | AgentReplayWaitStep
  | AgentReplayNavBackStep
  | AgentReplayKeysStep
  | { type: string; [key: string]: unknown };

/** Replay step of type `"act"`: an instruction plus optional recorded actions. */
export interface AgentReplayActStep {
  type: "act";
  instruction: string;
  actions?: Action[];
  actionDescription?: string;
  message?: string;
  timeout?: number;
}

/** Replay step of type `"fillForm"`. */
export interface AgentReplayFillFormStep {
  type: "fillForm";
  fields?: Array<{ action: string }>;
  observeResults?: Action[];
  actions?: Action[];
}

/** Replay step of type `"goto"`: a URL with an optional load state to wait for. */
export interface AgentReplayGotoStep {
  type: "goto";
  url: string;
  waitUntil?: LoadState;
}

/** Replay step of type `"scroll"`: optional deltas and an optional anchor point. */
export interface AgentReplayScrollStep {
  type: "scroll";
  deltaX?: number;
  deltaY?: number;
  anchor?: { x: number; y: number };
}

/** Replay step of type `"wait"`; `timeMs` is in milliseconds per its name. */
export interface AgentReplayWaitStep {
  type: "wait";
  timeMs: number;
}

/** Replay step of type `"navback"` with an optional load state to wait for. */
export interface AgentReplayNavBackStep {
  type: "navback";
  waitUntil?: LoadState;
}

/** Replay step of type `"keys"`: either typing text or pressing keys. */
export interface AgentReplayKeysStep {
  type: "keys";
  instruction?: string;
  playwrightArguments: {
    method: "type" | "press";
    // NOTE(review): presumably `text` pairs with "type" and `keys` with
    // "press"; the type does not enforce this — confirm at the replay site.
    text?: string;
    keys?: string;
    times?: number;
  };
}

/**
 * Reduced set of agent execute options that is stored with cache contexts and
 * cached entries.
 */
export interface SanitizedAgentExecuteOptions {
  maxSteps?: number;
  highlightCursor?: boolean;
}

/** Persisted form of a cached agent run: its inputs, replay steps and result. */
export interface CachedAgentEntry {
  /** Schema version of the entry; currently always the literal `1`. */
  version: 1;
  instruction: string;
  startUrl: string;
  options: SanitizedAgentExecuteOptions;
  configSignature: string;
  /** Steps to replay, in recorded order. */
  steps: AgentReplayStep[];
  result: AgentResult;
  /** Time of recording as a string; the exact format is not visible here. */
  timestamp: string;
}


================================================
FILE: packages/core/lib/v3/types/private/evaluator.ts
================================================
/** Options for evaluating a single question about the task state. */
export type EvaluateOptions = {
  /** The question to ask about the task state */
  question: string;
  /** The answer to the question */
  answer?: string;
  /** Whether to take a screenshot of the task state, or array of screenshots to evaluate */
  screenshot?: boolean | Buffer[];
  /** Custom system prompt for the evaluator */
  systemPrompt?: string;
  /** Delay in milliseconds before taking the screenshot @default 250 */
  screenshotDelayMs?: number;
  /** The agent's reasoning/thought process for completing the task */
  agentReasoning?: string;
};

/**
 * Options for evaluating several questions in one request. Unlike
 * `EvaluateOptions`, `screenshot` is a plain boolean and the documented
 * default screenshot delay is 1000 ms.
 */
export type BatchAskOptions = {
  /** Array of questions with optional answers */
  questions: Array<{
    question: string;
    answer?: string;
  }>;
  /** Whether to take a screenshot of the task state */
  screenshot?: boolean;
  /** Custom system prompt for the evaluator */
  systemPrompt?: string;
  /** Delay in milliseconds before taking the screenshot @default 1000 */
  screenshotDelayMs?: number;
};

/**
 * Result of an evaluation
 */
export interface EvaluationResult {
  /**
   * The evaluation result ('YES', 'NO', or 'INVALID' if parsing failed or value was unexpected)
   */
  evaluation: "YES" | "NO" | "INVALID";
  /**
   * The reasoning behind the evaluation
   */
  reasoning: string;
}


================================================
FILE: packages/core/lib/v3/types/private/handlers.ts
================================================
import { Page } from "../../understudy/page.js";
import { ModelConfiguration } from "../public/model.js";
import type { StagehandZodSchema } from "../../zodCompat.js";
import type { Variables } from "../public/agent.js";

/** Parameters for the act handler: a required instruction and target page. */
export interface ActHandlerParams {
  instruction: string;
  /** Optional model configuration for this call. */
  model?: ModelConfiguration;
  variables?: Variables;
  // NOTE(review): unit not visible here; presumably milliseconds.
  timeout?: number;
  page: Page;
}

/**
 * Parameters for the extract handler. Both `instruction` and `schema` are
 * optional; `T` is the schema type supplied by the caller.
 */
export interface ExtractHandlerParams<T extends StagehandZodSchema> {
  instruction?: string;
  schema?: T;
  /** Optional model configuration for this call. */
  model?: ModelConfiguration;
  // NOTE(review): unit not visible here; presumably milliseconds.
  timeout?: number;
  /** Optional selector; presumably limits extraction to a subtree. */
  selector?: string;
  page: Page;
}

/** Parameters for the observe handler; only the target page is required. */
export interface ObserveHandlerParams {
  instruction?: string;
  /** Optional model configuration for this call. */
  model?: ModelConfiguration;
  // NOTE(review): unit not visible here; presumably milliseconds.
  timeout?: number;
  /** Optional selector; presumably limits observation to a subtree. */
  selector?: string;
  page: Page;
}

// We can use this enum to list the actions supported in performUnderstudyMethod
// Each member's value is the method-name string. Note that `SCROLL` maps to
// "scrollTo", so member names and values are not always the same word.
export enum SupportedUnderstudyAction {
  CLICK = "click",
  FILL = "fill",
  TYPE = "type",
  PRESS = "press",
  SCROLL = "scrollTo",
  NEXT_CHUNK = "nextChunk",
  PREV_CHUNK = "prevChunk",
  SELECT_OPTION_FROM_DROPDOWN = "selectOptionFromDropdown",
  HOVER = "hover",
  DOUBLE_CLICK = "doubleClick",
  DRAG_AND_DROP = "dragAndDrop",
}


================================================
FILE: packages/core/lib/v3/types/private/index.ts
================================================
export * from "./api.js";
export * from "./handlers.js";
export * from "./internal.js";
export * from "./evaluator.js";
export * from "./cache.js";
export * from "./agent.js";
export * from "./snapshot.js";


================================================
FILE: packages/core/lib/v3/types/private/internal.ts
================================================
import Browserbase from "@browserbasehq/sdk";
import { LaunchedChrome } from "chrome-launcher";

/**
 * Initialization state, discriminated by `kind`:
 * - `UNINITIALIZED`: nothing has been set up.
 * - `LOCAL`: a Chrome launched through chrome-launcher, plus profile
 *   bookkeeping (`userDataDir`, `createdTempProfile`, `preserveUserDataDir`).
 * - `BROWSERBASE`: a Browserbase SDK client and session id.
 *
 * NOTE(review): `ws` is presumably the WebSocket endpoint used to connect to
 * the browser — confirm where the state is created.
 */
export type InitState =
  | { kind: "UNINITIALIZED" }
  | {
      kind: "LOCAL";
      chrome: LaunchedChrome;
      ws: string;
      userDataDir?: string;
      createdTempProfile?: boolean;
      preserveUserDataDir?: boolean;
    }
  | { kind: "BROWSERBASE"; bb: Browserbase; sessionId: string; ws: string };

/**
 * String of the form `<number>-<number>`.
 * NOTE(review): presumably `<frameOrdinal>-<backendNodeId>` — confirm with the
 * code that produces these ids.
 */
export type EncodedId = `${number}-${number}`;

/**
 * Represents a path through a Zod schema from the root object down to a
 * particular field. The `segments` array describes the chain of keys/indices.
 *
 * - **String** segments indicate object property names.
 * - **Number** segments indicate array indices.
 *
 * For example, `["users", 0, "homepage"]` might describe reaching
 * the `homepage` field in `schema.users[0].homepage`.
 */
export interface ZodPathSegments {
  /**
   * The ordered list of keys/indices leading from the schema root
   * to the targeted field.
   */
  segments: Array<string | number>;
}

/**
 * Accepted forms of an init script: a string, an object with an optional
 * `path` and/or `content`, or a function that receives an argument of type
 * `Arg`.
 * NOTE(review): whether a bare string is script source or a file path is not
 * visible here — confirm where the value is consumed.
 */
export type InitScriptSource<Arg> =
  | string
  | { path?: string; content?: string }
  | ((arg: Arg) => unknown);


================================================
FILE: packages/core/lib/v3/types/private/locator.ts
================================================
import { Buffer } from "buffer";

/** A file reduced to a uniform in-memory shape: name, MIME type and bytes. */
export interface NormalizedFilePayload {
  name: string;
  mimeType: string;
  /** The file contents. */
  buffer: Buffer;
  // NOTE(review): presumably a millisecond epoch timestamp, like the DOM
  // `File.lastModified` — confirm with the producer.
  lastModified: number;
  /** Absolute path to the source file when provided by the caller. */
  absolutePath?: string;
}


================================================
FILE: packages/core/lib/v3/types/private/network.ts
================================================
import { Protocol } from "devtools-protocol";

/** Metadata tracked for each network request currently in-flight. */
export type NetworkRequestInfo = {
  sessionId: string;
  requestId: string;
  requestKey: string;
  frameId?: string;
  loaderId?: string;
  url?: string;
  timestamp: number;
  resourceType?: Protocol.Network.ResourceType;
  documentRequest: boolean;
};

/** Callback hooks consumers can implement to observe network transitions. */
export interface NetworkObserver {
  onRequestStarted(info: NetworkRequestInfo): void;
  onRequestFinished(info: NetworkRequestInfo): void;
  onRequestFailed(info: NetworkRequestInfo): void;
}

/**
 * Options for the idle waiter helper.
 * NOTE(review): the precise interplay of `timeoutMs`, `idleTimeMs` and
 * `totalBudgetMs` is defined by the network manager, not visible here.
 */
export type WaitForIdleOptions = {
  /** Optional reference start time; unit and epoch are not visible here. */
  startTime?: number;
  /** Required timeout, in milliseconds per the name. */
  timeoutMs: number;
  /** Optional quiet period, in milliseconds per the name. */
  idleTimeMs?: number;
  /** Optional predicate over request metadata. */
  filter?: (info: NetworkRequestInfo) => boolean;
  /** Optional overall budget, in milliseconds per the name. */
  totalBudgetMs?: number;
};

// Default idle wait; presumably milliseconds, matching the `*Ms` options above.
export const DEFAULT_IDLE_WAIT = 500;
// Resource types singled out for ignoring: "EventSource" and "WebSocket".
// The element type also admits `undefined`, so `.has()` accepts a missing
// resource type without a cast.
export const IGNORED_RESOURCE_TYPES = new Set<
  Protocol.Network.ResourceType | undefined
>(["EventSource", "WebSocket"]);

/** The handle returned by the network manager idle helper. */
export type WaitForIdleHandle = {
  promise: Promise<void>;
  dispose: () => void;
};


================================================
FILE: packages/core/lib/v3/types/private/shutdown.ts
================================================
/**
 * Internal-only types for the shutdown supervisor process.
 */

/**
 * Configuration handed to the shutdown supervisor, discriminated by `kind`:
 * - `LOCAL`: the Chrome process id to terminate, plus the profile-directory
 *   fields that decide whether a temp profile is removed.
 * - `STAGEHAND_API`: the Browserbase session to release and the credentials
 *   needed to request it.
 */
export type ShutdownSupervisorConfig =
  | {
      kind: "LOCAL";
      pid: number;
      userDataDir?: string;
      createdTempProfile?: boolean;
      preserveUserDataDir?: boolean;
    }
  | {
      kind: "STAGEHAND_API";
      sessionId: string;
      apiKey: string;
      projectId?: string;
    };

export interface ShutdownSupervisorHandle {
  /** Best-effort signal to stop the supervisor process. */
  stop: () => void;
}


================================================
FILE: packages/core/lib/v3/types/private/shutdownErrors.ts
================================================
/**
 * Internal-only errors for the shutdown supervisor.
 */

/** Base class for shutdown-supervisor errors; sets `name` to the class name. */
export class ShutdownSupervisorError extends Error {
  constructor(message: string) {
    super(message);
    this.name = "ShutdownSupervisorError";
  }
}

/** Supervisor error subtype with `name` set to "ShutdownSupervisorResolveError". */
export class ShutdownSupervisorResolveError extends ShutdownSupervisorError {
  constructor(message: string) {
    super(message);
    // Overrides the name assigned by the base-class constructor.
    this.name = "ShutdownSupervisorResolveError";
  }
}

/** Supervisor error subtype with `name` set to "ShutdownSupervisorSpawnError". */
export class ShutdownSupervisorSpawnError extends ShutdownSupervisorError {
  constructor(message: string) {
    super(message);
    // Overrides the name assigned by the base-class constructor.
    this.name = "ShutdownSupervisorSpawnError";
  }
}


================================================
FILE: packages/core/lib/v3/types/private/snapshot.ts
================================================
/**
 * Options that control how hybrid snapshots and targeted scopes are captured.
 */
export type SnapshotOptions = {
  /**
   * Filter the snapshot to a specific element/subtree using a selector that can cross iframes.
   * Supports XPath (prefixed with `xpath=` or starting with `/`) and CSS with iframe hops via `>>`.
   */
  focusSelector?: string;
  /**
   * Pierce shadow DOM when calling DOM.getDocument. Defaults to true to retain the
   * existing behaviour.
   */
  pierceShadow?: boolean;
  /**
   * Toggle whether iframe subtrees are included in the merged snapshot. Defaults to true.
   */
  includeIframes?: boolean;
  /**
   * Optional feature flag that surfaces experimental traversal tweaks in the Accessibility layer.
   */
  experimental?: boolean;
};

/**
 * Hybrid snapshot payload consumed by act/extract/observe handlers.
 */
export type HybridSnapshot = {
  /** Merged outline across every frame. */
  combinedTree: string;
  /** EncodedId (frameOrdinal-backendNodeId) -> absolute XPath. */
  combinedXpathMap: Record<string, string>;
  /** EncodedId -> URL extracted from AX properties. */
  combinedUrlMap: Record<string, string>;
  /** Per-frame payloads expose the original relative data for debugging. */
  perFrame?: PerFrameSnapshot[];
};

/**
 * Snapshot data for a single frame: its outline plus its XPath and URL maps.
 * Used as the element type of `HybridSnapshot.perFrame`.
 */
export type PerFrameSnapshot = {
  frameId: string;
  outline: string;
  xpathMap: Record<string, string>;
  urlMap: Record<string, string>;
};

/**
 * Compact encoding of DOM data for an entire session. Shared between capture
 * and focus helpers so DOM traversal can be unit tested in isolation.
 *
 * NOTE(review): "Be" in the field names presumably abbreviates
 * "backendNodeId", making the maps keyed by backend node id — confirm with the
 * code that builds the index.
 */
export type SessionDomIndex = {
  rootBackend: number;
  /** Presumably backend node id -> absolute XPath. */
  absByBe: Map<number, string>;
  /** Presumably backend node id -> tag name. */
  tagByBe: Map<number, string>;
  /** Presumably backend node id -> whether the node is scrollable. */
  scrollByBe: Map<number, boolean>;
  /** Presumably node -> root of the document that contains it. */
  docRootOf: Map<number, number>;
  /** Presumably iframe node -> root of the iframe's content document. */
  contentDocRootByIframe: Map<number, number>;
};

/**
 * Per-frame lookup tables with string keys.
 * NOTE(review): keys are presumably encoded node ids — confirm with the
 * producer.
 */
export type FrameDomMaps = {
  tagNameMap: Record<string, string>;
  xpathMap: Record<string, string>;
  scrollableMap: Record<string, boolean>;
  urlMap: Record<string, string>;
};

/** A node pinned down by frame, backend node id and absolute XPath. */
export type ResolvedLocation = {
  frameId: string;
  backendNodeId: number;
  absoluteXPath: string;
};

/**
 * Result of resolving an XPath focus selector to a frame.
 * NOTE(review): presumably `tailXPath` is the part to evaluate inside the
 * target frame and `absPrefix` the absolute path up to that frame — confirm.
 */
export type ResolvedFocusFrame = {
  targetFrameId: string;
  tailXPath: string;
  absPrefix: string;
};

/**
 * Result of resolving a CSS focus selector to a frame; the CSS counterpart of
 * `ResolvedFocusFrame`, with `tailSelector` in place of `tailXPath`.
 */
export type ResolvedCssFocus = {
  targetFrameId: string;
  tailSelector: string;
  absPrefix: string;
};

// NOTE(review): presumably XPath axes — "child" for `/` and "desc"
// (descendant) for `//`; confirm with the XPath parser.
export type Axis = "child" | "desc";

/** One parsed path step: its axis, its original text and its name. */
export type Step = {
  axis: Axis;
  raw: string;
  name: string;
};

/**
 * A node of the accessibility tree. Tree structure is available both as id
 * references (`parentId`, `childIds`) and as nested nodes (`children`).
 */
export type A11yNode = {
  role: string;
  name?: string;
  description?: string;
  value?: string | number | boolean;
  nodeId: string;
  /** Backend DOM node behind this accessibility node, when there is one. */
  backendDOMNodeId?: number;
  parentId?: string;
  childIds?: string[];
  children?: A11yNode[];
  encodedId?: string;
};

/** Inputs for building the accessibility tree of a frame. */
export type A11yOptions = {
  focusSelector?: string;
  experimental: boolean;
  tagNameMap: Record<string, string>;
  scrollableMap: Record<string, boolean>;
  /** Turns a backend node id into the string id used as map key. */
  encode: (backendNodeId: number) => string;
};

/** Output of building an accessibility tree: the outline text and a URL map. */
export type AccessibilityTreeResult = {
  outline: string;
  urlMap: Record<string, string>;
  // NOTE(review): presumably true when a focus selector narrowed the tree —
  // confirm with the producer.
  scopeApplied: boolean;
};

/** Maps a frame id to its parent frame id, or to `null` when it has no parent. */
export type FrameParentIndex = Map<string, string | null>;

/**
 * Shared frame metadata that every snapshot step needs.
 * - `rootId`: stable identifier for the main frame so we can detect root prefixes.
 * - `parentByFrame`: lookup table for iframe parentage (used by focus scoping and prefixing).
 * - `frames`: DFS-ordered frame ids so merging walks parents before children.
 */
export type FrameContext = {
  rootId: string;
  parentByFrame: FrameParentIndex;
  frames: string[];
};


================================================
FILE: packages/core/lib/v3/types/public/agent.ts
================================================
import type { Client } from "@modelcontextprotocol/sdk/client/index.js";
import {
  ToolSet,
  ModelMessage,
  wrapLanguageModel,
  StreamTextResult,
  StepResult,
  PrepareStepFunction,
  GenerateTextOnStepFinishCallback,
  StreamTextOnStepFinishCallback,
  StreamTextOnErrorCallback,
  StreamTextOnChunkCallback,
  StreamTextOnFinishCallback,
} from "ai";
import { LogLine } from "./logs.js";
import { ClientOptions } from "./model.js";
import { StagehandZodObject } from "../../zodCompat.js";

// Re-export ModelMessage for consumers who want to use it for conversation continuation
export type { ModelMessage } from "ai";

// Re-export Tool type for consumers who want to define custom tools
export type { Tool } from "ai";
import { Page as PlaywrightPage } from "playwright-core";
import { Page as PuppeteerPage } from "puppeteer-core";
import { Page as PatchrightPage } from "patchright-core";
import { Page } from "../../understudy/page.js";

// =============================================================================
// Variable Types
// =============================================================================

/**
 * A variable value can be a simple primitive or a rich object with an optional description.
 * This unified type is shared across `act`, `agent.execute`, and other methods.
 *
 * In the rich form only `value` is required; `description` may be omitted.
 *
 * @example Simple (backward-compatible):
 * ```typescript
 * variables: { username: "john@example.com" }
 * ```
 *
 * @example Rich with description (useful for agents):
 * ```typescript
 * variables: {
 *   username: { value: "john@example.com", description: "The login email" }
 * }
 * ```
 */
export type VariableValue =
  | string
  | number
  | boolean
  | { value: string | number | boolean; description?: string };

/**
 * A collection of named variables for use in act, agent, and other methods.
 * Each key is the variable's name; each value is a `VariableValue`
 * (plain primitive or `{ value, description? }`).
 */
export type Variables = Record<string, VariableValue>;

/**
 * Bundle of values describing a single agent execution.
 * NOTE(review): field descriptions are inferred from names and types — confirm against the agent handler.
 */
export interface AgentContext {
  /** Caller-supplied execution options (without callbacks). */
  options: AgentExecuteOptionsBase;
  maxSteps: number;
  systemPrompt: string;
  /** Tools made available for this execution. */
  allTools: ToolSet;
  messages: ModelMessage[];
  /** A language model as returned by `wrapLanguageModel` from the `ai` package. */
  wrappedModel: ReturnType<typeof wrapLanguageModel>;
  initialPageUrl: string;
}

/**
 * Mutable progress tracked during an agent execution.
 * NOTE(review): field descriptions are inferred from names — confirm against the agent handler.
 */
export interface AgentState {
  collectedReasoning: string[];
  /** Actions recorded so far. */
  actions: AgentAction[];
  finalMessage: string;
  completed: boolean;
  currentPageUrl: string;
}

/**
 * A single action recorded by the agent.
 * Only `type` is required. A few tool-specific fields are typed explicitly,
 * and the index signature allows any further string-keyed fields as `unknown`.
 */
export interface AgentAction {
  type: string;
  reasoning?: string;
  taskCompleted?: boolean;
  action?: string;
  // Tool-specific fields
  timeMs?: number; // wait tool
  pageText?: string; // ariaTree tool
  pageUrl?: string; // ariaTree tool
  instruction?: string; // various tools
  // Open-ended: tools may attach additional fields; consumers must narrow them.
  [key: string]: unknown;
}

/**
 * Final result of an agent execution.
 * `success`, `message`, `actions` and `completed` are always present;
 * everything else is optional.
 */
export interface AgentResult {
  success: boolean;
  message: string;
  /** Actions recorded during the execution. */
  actions: AgentAction[];
  completed: boolean;
  metadata?: Record<string, unknown>;
  /** Token and timing accounting; `reasoning_tokens` and `cached_input_tokens` are optional. */
  usage?: {
    input_tokens: number;
    output_tokens: number;
    reasoning_tokens?: number;
    cached_input_tokens?: number;
    inference_time_ms: number;
  };
  /**
   * The conversation messages from this execution.
   * Pass these to a subsequent execute() call via the `messages` option to continue the conversation.
   * @experimental
   */
  messages?: ModelMessage[];
  /**
   * Custom output data extracted based on the `output` schema provided in execute options.
   * Only populated if an `output` schema was provided.
   * @experimental
   */
  output?: Record<string, unknown>;
}

/**
 * Result of a streaming execution: the `ai` package's `StreamTextResult`
 * intersected with a `result` promise that yields the `AgentResult`.
 */
export type AgentStreamResult = StreamTextResult<ToolSet, never> & {
  result: Promise<AgentResult>;
};

/**
 * Base callbacks shared between execute (non-streaming) and streaming modes.
 *
 * `onStepFinish` is a union here; `AgentExecuteCallbacks` and
 * `AgentStreamCallbacks` each narrow it to the variant for their mode.
 */
export interface AgentCallbacks {
  /**
   * Optional function called before each step to modify settings.
   * You can change the model, tool choices, active tools, system prompt,
   * and input messages for each step.
   */
  prepareStep?: PrepareStepFunction<ToolSet>;
  /**
   * Callback called when each step (LLM call) is finished.
   * This is called for intermediate steps as well as the final step.
   */
  onStepFinish?:
    | GenerateTextOnStepFinishCallback<ToolSet>
    | StreamTextOnStepFinishCallback<ToolSet>;
}

/**
 * Error message type for streaming-only callbacks used in non-streaming mode.
 * This provides a clear error message when users try to use streaming callbacks without stream: true.
 *
 * It is a string-literal type: a property typed with it rejects a function
 * value, and the resulting compiler error quotes this message.
 */
type StreamingCallbackNotAvailable =
  "This callback requires 'stream: true' in AgentConfig. Set stream: true to use streaming callbacks like onChunk, onFinish, onError, and onAbort.";

/**
 * Error message for safety confirmation callback misuse.
 * Safety confirmations are only available for non-streaming CUA agent executions.
 *
 * It is a string-literal type: a property typed with it rejects a function
 * value, and the resulting compiler error quotes this message.
 */
type SafetyConfirmationCallbackNotAvailable =
  "Safety confirmation callbacks are only available via non-streaming AgentExecuteOptions.callbacks when using mode: 'cua'.";

/**
 * Callbacks specific to the non-streaming execute method.
 *
 * The streaming-only callbacks (`onChunk`, `onFinish`, `onError`, `onAbort`)
 * are declared with a string-literal type, so passing a function for any of
 * them is a compile-time error whose message explains how to enable streaming.
 */
export interface AgentExecuteCallbacks extends AgentCallbacks {
  /**
   * Callback called when each step (LLM call) is finished.
   * Narrows the base union to the non-streaming (generateText) variant.
   */
  onStepFinish?: GenerateTextOnStepFinishCallback<ToolSet>;
  /**
   * Callback for handling safety confirmation requests from CUA providers.
   * Only available when running an agent configured with mode: "cua".
   */
  onSafetyConfirmation?: SafetyConfirmationHandler;

  /**
   * NOT AVAILABLE in non-streaming mode.
   * This callback requires `stream: true` in AgentConfig.
   *
   * @example
   * ```typescript
   * // Enable streaming to use onChunk:
   * const agent = stagehand.agent({ stream: true });
   * await agent.execute({
   *   instruction: "...",
   *   callbacks: { onChunk: async (chunk) => console.log(chunk) }
   * });
   * ```
   */
  onChunk?: StreamingCallbackNotAvailable;

  /**
   * NOT AVAILABLE in non-streaming mode.
   * This callback requires `stream: true` in AgentConfig.
   *
   * @example
   * ```typescript
   * // Enable streaming to use onFinish:
   * const agent = stagehand.agent({ stream: true });
   * await agent.execute({
   *   instruction: "...",
   *   callbacks: { onFinish: (event) => console.log("Done!", event) }
   * });
   * ```
   */
  onFinish?: StreamingCallbackNotAvailable;

  /**
   * NOT AVAILABLE in non-streaming mode.
   * This callback requires `stream: true` in AgentConfig.
   *
   * @example
   * ```typescript
   * // Enable streaming to use onError:
   * const agent = stagehand.agent({ stream: true });
   * await agent.execute({
   *   instruction: "...",
   *   callbacks: { onError: ({ error }) => console.error(error) }
   * });
   * ```
   */
  onError?: StreamingCallbackNotAvailable;

  /**
   * NOT AVAILABLE in non-streaming mode.
   * This callback requires `stream: true` in AgentConfig.
   *
   * @example
   * ```typescript
   * // Enable streaming to use onAbort:
   * const agent = stagehand.agent({ stream: true });
   * await agent.execute({
   *   instruction: "...",
   *   callbacks: { onAbort: (event) => console.log("Aborted", event.steps) }
   * });
   * ```
   */
  onAbort?: StreamingCallbackNotAvailable;
}

/**
 * Callbacks specific to the streaming mode.
 *
 * `onSafetyConfirmation` is declared with a string-literal type, so passing a
 * function for it is a compile-time error whose message explains the restriction.
 */
export interface AgentStreamCallbacks extends AgentCallbacks {
  /**
   * Callback called when each step (LLM call) is finished during streaming.
   * Narrows the base union to the streaming (streamText) variant.
   */
  onStepFinish?: StreamTextOnStepFinishCallback<ToolSet>;
  /**
   * Callback called when an error occurs during streaming.
   * Use this to log errors or handle error states.
   */
  onError?: StreamTextOnErrorCallback;
  /**
   * Callback called for each chunk of the stream.
   * Stream processing will pause until the callback promise resolves.
   */
  onChunk?: StreamTextOnChunkCallback<ToolSet>;
  /**
   * Callback called when the stream finishes.
   */
  onFinish?: StreamTextOnFinishCallback<ToolSet>;
  /**
   * Callback called when the stream is aborted.
   * Receives the step results in `event.steps`.
   */
  onAbort?: (event: {
    steps: Array<StepResult<ToolSet>>;
  }) => PromiseLike<void> | void;
  /**
   * NOT AVAILABLE in streaming mode.
   * Safety confirmations currently require non-streaming execute() on CUA agents.
   */
  onSafetyConfirmation?: SafetyConfirmationCallbackNotAvailable;
}

/**
 * Base options for agent execution (without callbacks).
 * Only `instruction` is required. `AgentExecuteOptions` and
 * `AgentStreamExecuteOptions` extend this with their mode-specific `callbacks`.
 */
export interface AgentExecuteOptionsBase {
  /** The task for the agent to carry out. */
  instruction: string;
  /** Optional cap on the number of agent steps. The default is not defined in this file. */
  maxSteps?: number;
  /**
   * Page to operate on. Accepts a Playwright, Puppeteer, or Patchright page,
   * or Stagehand's own `Page`.
   */
  page?: PlaywrightPage | PuppeteerPage | PatchrightPage | Page;
  // NOTE(review): presumably toggles a visible cursor overlay during execution — confirm.
  highlightCursor?: boolean;
  /**
   * Previous conversation messages to continue from.
   * Pass the `messages` from a previous AgentResult to continue that conversation.
   * @experimental
   */
  messages?: ModelMessage[];
  /**
   * An AbortSignal that can be used to cancel the agent execution.
   * When aborted, the agent will stop and return a partial result.
   * @experimental
   *
   * @example
   * ```typescript
   * const controller = new AbortController();
   * setTimeout(() => controller.abort(), 30000); // 30 second timeout
   *
   * const result = await agent.execute({
   *   instruction: "...",
   *   signal: controller.signal
   * });
   * ```
   */
  signal?: AbortSignal;
  /**
   * Tools to exclude from this execution.
   * Pass an array of tool names to prevent the agent from using those tools.
   *
   * **Note:** Not supported in CUA mode (`mode: "cua"`).
   *
   * **Available tools by mode:**
   *
   * **DOM mode (default):**
   * - `act` - Perform semantic actions (click, type, etc.)
   * - `fillForm` - Fill form fields using DOM selectors
   * - `ariaTree` - Get accessibility tree of the page
   * - `extract` - Extract structured data from page
   * - `goto` - Navigate to a URL
   * - `scroll` - Scroll using semantic directions (up/down/left/right)
   * - `keys` - Press keyboard keys
   * - `navback` - Navigate back in history
   * - `screenshot` - Take a screenshot
   * - `think` - Agent reasoning/planning step
   * - `wait` - Wait for time or condition
   * - `done` - Mark task as complete
   * - `search` - Web search (requires useSearch: true and BROWSERBASE_API_KEY)
   *
   * **Hybrid mode:**
   * - `click` - Click at specific coordinates
   * - `type` - Type text at coordinates
   * - `dragAndDrop` - Drag from one point to another
   * - `clickAndHold` - Click and hold at coordinates
   * - `fillFormVision` - Fill forms using vision/coordinates
   * - `act` - Perform semantic actions
   * - `ariaTree` - Get accessibility tree
   * - `extract` - Extract data from page
   * - `goto` - Navigate to URL
   * - `scroll` - Scroll using coordinates
   * - `keys` - Press keyboard keys
   * - `navback` - Navigate back
   * - `screenshot` - Take screenshot
   * - `think` - Agent reasoning step
   * - `wait` - Wait for time/condition
   * - `done` - Mark task complete
   * - `search` - Web search (requires useSearch: true and BROWSERBASE_API_KEY)
   *
   * @experimental
   * @example
   * ```typescript
   * // Exclude screenshot and extract tools
   * const result = await agent.execute({
   *   instruction: "Click the submit button",
   *   excludeTools: ["screenshot", "extract"]
   * });
   * ```
   */
  excludeTools?: string[];
  /**
   * A Zod schema defining custom output data to return when the task completes.
   * The agent will populate this data in the final done tool call.
   *
   * @experimental
   * @example
   * ```typescript
   * const result = await agent.execute({
   *   instruction: "Find the cheapest flight from NYC to LA",
   *   output: z.object({
   *     price: z.string().describe("The price of the flight"),
   *     airline: z.string().describe("The airline name"),
   *     departureTime: z.string().describe("Departure time"),
   *   }),
   * });
   *
   * console.log(result.output); // { price: "$199", airline: "Delta", departureTime: "8:00 AM" }
   * ```
   */
  output?: StagehandZodObject;
  /**
   * Variables that the agent can use when filling forms or typing text.
   * The agent will see variable names and descriptions in the system prompt,
   * and can use them via `%variableName%` syntax in act/type/fillForm tool calls.
   *
   * Accepts both simple values and rich objects with descriptions (same type as `act`).
   *
   * **Note:** Not supported in CUA mode (`mode: "cua"`). Requires `experimental: true`.
   *
   * @experimental
   * @example
   * ```typescript
   * // Simple values
   * variables: { username: "john@example.com", password: "secret123" }
   *
   * // Rich values with descriptions (helps the agent understand context)
   * variables: {
   *   username: { value: "john@example.com", description: "The login email" },
   *   password: { value: "secret123", description: "The login password" },
   * }
   * ```
   */
  variables?: Variables;
  /**
   * Timeout in milliseconds for each agent tool call.
   * If a tool call exceeds this duration, it will be aborted and
   * reported back to the LLM as a timeout error so it can retry or adjust.
   * For tools that call v3 methods (act, extract, fillForm, ariaTree), the
   * timeout is also forwarded to the underlying v3 call for true cancellation.
   * @default 45000 (45 seconds)
   */
  toolTimeout?: number;
  /**
   * Enable the web search tool powered by Browserbase Search API.
   * Requires a valid Browserbase API key (BROWSERBASE_API_KEY).
   * When set to true, the agent gains access to a `search` tool for web searches.
   *
   * @example
   * ```typescript
   * const result = await agent.execute({
   *   instruction: "Find the latest news about AI",
   *   useSearch: true,
   * });
   * ```
   */
  useSearch?: boolean;
}

/**
 * Options for non-streaming agent execution.
 * Only accepts AgentExecuteCallbacks (no streaming-specific callbacks like onChunk, onFinish).
 * All other fields are inherited from AgentExecuteOptionsBase.
 */
export interface AgentExecuteOptions extends AgentExecuteOptionsBase {
  /**
   * Callbacks for non-streaming agent execution.
   * For streaming callbacks (onChunk, onFinish, onError, onAbort), use stream: true in AgentConfig.
   */
  callbacks?: AgentExecuteCallbacks;
}

/**
 * Options for streaming agent execution.
 * Accepts AgentStreamCallbacks including onChunk, onFinish, onError, and onAbort.
 * All other fields are inherited from AgentExecuteOptionsBase.
 */
export interface AgentStreamExecuteOptions extends AgentExecuteOptionsBase {
  /**
   * Callbacks for streaming agent execution.
   * Includes streaming-specific callbacks: onChunk, onFinish, onError, onAbort.
   */
  callbacks?: AgentStreamCallbacks;
}
/** Identifier of the provider backing an agent. Also exported under the alias `AgentProviderType`. */
export type AgentType =
  | "openai"
  | "anthropic"
  | "google"
  | "microsoft"
  | "bedrock";

/**
 * Model identifiers listed as available for Computer Use Agent (CUA) mode,
 * written as "provider/model".
 * Declared `as const` so `AvailableCuaModel` below is the exact union of these literals.
 */
export const AVAILABLE_CUA_MODELS = [
  "openai/computer-use-preview",
  "openai/computer-use-preview-2025-03-11",
  "anthropic/claude-opus-4-5-20251101",
  "anthropic/claude-opus-4-6",
  "anthropic/claude-sonnet-4-6",
  "anthropic/claude-haiku-4-5-20251001",
  "anthropic/claude-sonnet-4-20250514",
  "anthropic/claude-sonnet-4-5-20250929",
  "google/gemini-2.5-computer-use-preview-10-2025",
  "google/gemini-3-flash-preview",
  "google/gemini-3-pro-preview",
  "microsoft/fara-7b",
] as const;
/** Union of the string literals in `AVAILABLE_CUA_MODELS`. */
export type AvailableCuaModel = (typeof AVAILABLE_CUA_MODELS)[number];

/**
 * Envelope pairing execute options with a logger and an optional retry count.
 * `TOptions` defaults to `AgentExecuteOptions` and must extend it.
 */
export interface AgentExecutionOptions<
  TOptions extends AgentExecuteOptions = AgentExecuteOptions,
> {
  options: TOptions;
  /** Sink for structured log lines. */
  logger: (message: LogLine) => void;
  // NOTE(review): retry semantics are defined by the consumer, not visible here.
  retries?: number;
}

/**
 * Construction options for an agent handler.
 * NOTE(review): field descriptions are inferred from names — confirm against the handler.
 */
export interface AgentHandlerOptions {
  modelName: string;
  clientOptions?: ClientOptions;
  /** Extra instructions supplied by the user. */
  userProvidedInstructions?: string;
  experimental?: boolean;
}

/** Outcome of executing one action: a success flag plus optional error text and optional untyped data. */
export interface ActionExecutionResult {
  success: boolean;
  error?: string;
  /** Untyped payload; callers must narrow before use. */
  data?: unknown;
}

/**
 * Represents a safety check that requires user confirmation before proceeding.
 * These are issued by CUA providers (OpenAI, Google) when the agent attempts
 * potentially risky actions.
 *
 * Structurally identical to the entries of `ComputerCallItem.pending_safety_checks`
 * and `acknowledged_safety_checks` in `ResponseInputItem`.
 */
export interface SafetyCheck {
  /** Unique identifier for this safety check */
  id: string;
  /** Code identifying the type of safety concern */
  code: string;
  /** Human-readable description of the safety concern */
  message: string;
}

/**
 * Response from the user for a safety confirmation request.
 * This is the value a `SafetyConfirmationHandler` resolves with.
 */
export interface SafetyConfirmationResponse {
  /** Whether the user acknowledged/approved the safety checks */
  acknowledged: boolean;
}

/**
 * Callback for handling safety confirmation requests.
 * Called when the CUA provider issues safety checks that require user confirmation.
 * The callback should return a promise that resolves when the user has made a decision.
 *
 * Accepted only through `AgentExecuteCallbacks.onSafetyConfirmation` (non-streaming);
 * the streaming callbacks type rejects it at compile time.
 *
 * @param safetyChecks - Array of safety checks requiring confirmation
 * @returns Promise resolving to the user's response
 *
 * @example
 * ```typescript
 * const agent = stagehand.agent({
 *   mode: "cua",
 * });
 * await agent.execute({
 *   instruction: "...",
 *   callbacks: {
 *     onSafetyConfirmation: async (checks) => {
 *       console.log("Safety checks:", checks);
 *       const userApproved = await showConfirmationDialog(checks);
 *       return { acknowledged: userApproved };
 *     },
 *   },
 * });
 * ```
 */
export type SafetyConfirmationHandler = (
  safetyChecks: SafetyCheck[],
) => Promise<SafetyConfirmationResponse>;

// Anthropic types:

/**
 * A `tool_use` item. Extends `ResponseItem` (declared further down in this file),
 * so it also inherits that interface's open index signature.
 */
export interface ToolUseItem extends ResponseItem {
  type: "tool_use";
  id: string; // This is the correct property name from Anthropic's API
  name: string; // Name of the tool being used
  /** Tool arguments as an untyped string-keyed object. */
  input: Record<string, unknown>;
}

/** A message whose content is either plain text or an array of content blocks. */
export interface AnthropicMessage {
  role: string;
  content: string | Array<AnthropicContentBlock>;
}

/**
 * Generic content block: a `type` tag plus arbitrary further fields.
 * Base interface for more specific blocks such as `AnthropicTextBlock`.
 */
export interface AnthropicContentBlock {
  type: string;
  // Open-ended: block-specific fields are untyped here; narrow before use.
  [key: string]: unknown;
}

/** Content block narrowed to `type: "text"` with its text payload. */
export interface AnthropicTextBlock extends AnthropicContentBlock {
  type: "text";
  text: string;
}

/**
 * A `tool_result` entry: references a tool use by id and carries its result
 * as plain text or as an array of content blocks.
 */
export interface AnthropicToolResult {
  type: "tool_result";
  // NOTE(review): presumably the `id` of the matching ToolUseItem — confirm.
  tool_use_id: string;
  content: string | Array<AnthropicContentBlock>;
}

// OpenAI types:

/**
 * Generic response item: a `type` tag, an `id`, and arbitrary further fields.
 * Base interface for `ToolUseItem`, `ComputerCallItem` and `FunctionCallItem`.
 */
export interface ResponseItem {
  type: string;
  id: string;
  // Open-ended: item-specific fields are untyped here; narrow before use.
  [key: string]: unknown;
}

/** Response item narrowed to `type: "computer_call"`: a requested computer action. */
export interface ComputerCallItem extends ResponseItem {
  type: "computer_call";
  /** Id of this call; `computer_call_output` entries of `ResponseInputItem` carry a `call_id` too. */
  call_id: string;
  /** The requested action: a `type` tag plus action-specific untyped fields. */
  action: {
    type: string;
    [key: string]: unknown;
  };
  /** Safety checks attached to this call, if any (same shape as `SafetyCheck`). */
  pending_safety_checks?: Array<{
    id: string;
    code: string;
    message: string;
  }>;
}

/** Response item narrowed to `type: "function_call"`: a requested function invocation. */
export interface FunctionCallItem extends ResponseItem {
  type: "function_call";
  call_id: string;
  /** Name of the function to call. */
  name: string;
  // NOTE(review): typed as a string — presumably JSON-encoded arguments; confirm before parsing.
  arguments: string;
}

/**
 * An input item, one of three shapes:
 * 1. a plain `{ role, content }` message (no `type` field),
 * 2. a `computer_call_output` carrying an `input_image` object or a string,
 *    optionally with acknowledged safety checks,
 * 3. a `function_call_output` carrying a string result.
 */
export type ResponseInputItem =
  | { role: string; content: string }
  | {
      type: "computer_call_output";
      call_id: string;
      output:
        | {
            type: "input_image";
            image_url: string;
            current_url?: string;
            error?: string;
            [key: string]: unknown;
          }
        | string;
      // Same shape as `SafetyCheck`.
      acknowledged_safety_checks?: Array<{
        id: string;
        code: string;
        message: string;
      }>;
    }
  | {
      type: "function_call_output";
      call_id: string;
      output: string;
    };

/**
 * Minimal agent surface: `execute` takes either a bare instruction string or
 * full `AgentExecuteOptions` and resolves with an `AgentResult`.
 * Has the same shape as `NonStreamingAgentInstance`.
 */
export interface AgentInstance {
  execute: (
    instructionOrOptions: string | AgentExecuteOptions,
  ) => Promise<AgentResult>;
}

/** Alias of `AgentType`. */
export type AgentProviderType = AgentType;

/**
 * Object form of a model setting: a required `modelName` plus any additional
 * string-keyed properties (typed `unknown`).
 * `TModelName` lets callers constrain `modelName` to specific literals.
 */
export type AgentModelConfig<TModelName extends string = string> = {
  modelName: TModelName;
} & Record<string, unknown>;

/**
 * Agent tool mode determines which set of tools are available to the agent.
 * - 'dom': Uses DOM-based tools (act, fillForm) - better for structured page interactions
 * - 'hybrid': Uses coordinate-based tools (click, type, dragAndDrop, etc.) - better for visual/screenshot-based interactions
 * - 'cua': Uses Computer Use Agent (CUA) providers like Anthropic Claude or Google Gemini for screenshot-based automation
 *
 * Set through `AgentConfig.mode`, where 'dom' is documented as the default.
 */
export type AgentToolMode = "dom" | "hybrid" | "cua";

/**
 * Configuration used to create an agent. Every field is optional.
 */
export type AgentConfig = {
  /**
   * Custom system prompt to provide to the agent. Overrides the default system prompt.
   */
  systemPrompt?: string;
  /**
   * MCP integrations - array whose entries are MCP `Client` objects or strings.
   * NOTE(review): string entries are presumably MCP server URLs — confirm.
   */
  integrations?: (Client | string)[];
  /**
   * Tools passed to the agent client
   */
  tools?: ToolSet;
  /**
   * @deprecated Use `mode: "cua"` instead. This option will be removed in a future version.
   * Enables Computer Use Agent (CUA) mode.
   */
  cua?: boolean;
  /**
   * The model to use for agent functionality.
   * Either a model string or an `AgentModelConfig` object.
   */
  model?: string | AgentModelConfig<string>;
  /**
   * The model to use for tool execution (observe/act calls within agent tools).
   * If not specified, inherits from the main model configuration.
   * Format: "provider/model" (e.g., "openai/gpt-4o-mini", "google/gemini-2.0-flash-exp")
   */
  executionModel?: string | AgentModelConfig<string>;
  /**
   * Enable streaming mode for the agent.
   * When true, execute() returns AgentStreamResult with textStream for incremental output.
   * When false (default), execute() returns AgentResult after completion.
   */
  stream?: boolean;
  /**
   * Tool mode for the agent. Determines which set of tools are available.
   * - 'dom' (default): Uses DOM-based tools (act, fillForm) for structured interactions
   * - 'hybrid': Uses coordinate-based tools (click, type, dragAndDrop, clickAndHold, fillFormVision)
   *             for visual/screenshot-based interactions
   * - 'cua': Uses Computer Use Agent (CUA) providers for screenshot-based automation
   */
  mode?: AgentToolMode;
};

/**
 * Agent instance returned when stream: true is set in AgentConfig.
 * execute() returns a streaming result that can be consumed incrementally.
 * Accepts AgentStreamExecuteOptions with streaming-specific callbacks.
 * A bare instruction string is accepted in place of the options object.
 */
export interface StreamingAgentInstance {
  execute: (
    instructionOrOptions: string | AgentStreamExecuteOptions,
  ) => Promise<AgentStreamResult>;
}

/**
 * Agent instance returned when stream is false or not set in AgentConfig.
 * execute() returns a result after the agent completes.
 * Accepts AgentExecuteOptions with non-streaming callbacks only.
 * A bare instruction string is accepted in place of the options object.
 */
export interface NonStreamingAgentInstance {
  execute: (
    instructionOrOptions: string | AgentExecuteOptions,
  ) => Promise<AgentResult>;
}

// =============================================================================
// Vision Action Tool Result Types
// =============================================================================

/**
 * Content item type for toModelOutput return values.
 * Used in tool definitions to return text and/or media to the model.
 *
 * Discriminated on `type`: "text" carries `text`; "media" carries a
 * `mediaType` and `data` (both strings).
 */
export type ModelOutputContentItem =
  | { type: "text"; text: string }
  | { type: "media"; mediaType: string; data: string };

/** Result shape for the click tool. Only `success` is always present. */
export interface ClickToolResult {
  success: boolean;
  /** Description of the clicked target. */
  describe?: string;
  // NOTE(review): presumably [x, y] — the array length is not enforced by the type.
  coordinates?: number[];
  error?: string;
  /** Screenshot as a base64 string, when one is attached. */
  screenshotBase64?: string;
}

/** Result shape for the type tool. Only `success` is always present. */
export interface TypeToolResult {
  success: boolean;
  /** Description of the typing target. */
  describe?: string;
  // NOTE(review): presumably the text that was typed — confirm.
  text?: string;
  error?: string;
  /** Screenshot as a base64 string, when one is attached. */
  screenshotBase64?: string;
}

/** Result shape for the dragAndDrop tool. Only `success` is always present. */
export interface DragAndDropToolResult {
  success: boolean;
  describe?: string;
  error?: string;
  /** Screenshot as a base64 string, when one is attached. */
  screenshotBase64?: string;
}

/** One field entry of a vision-based form fill: what to do, the value, and where. */
export interface FillFormField {
  action: string;
  value: string;
  /** Target position as x/y numbers. */
  coordinates: { x: number; y: number };
}

/** Result shape for the fillFormVision tool. Only `success` is always present. */
export interface FillFormVisionToolResult {
  success: boolean;
  /** The field entries associated with this fill, when provided. */
  playwrightArguments?: FillFormField[];
  error?: string;
  /** Screenshot as a base64 string, when one is attached. */
  screenshotBase64?: string;
}

/** Result shape for the scroll tool. `message` and `scrolledPixels` are required alongside `success`. */
export interface ScrollToolResult {
  success: boolean;
  message: string;
  scrolledPixels: number;
  error?: string;
}

/** `ScrollToolResult` plus an optional base64 screenshot. */
export interface ScrollVisionToolResult extends ScrollToolResult {
  screenshotBase64?: string;
}

/** Result shape for the wait tool. */
export interface WaitToolResult {
  success: boolean;
  // NOTE(review): presumably the waited duration in milliseconds (cf. `AgentAction.timeMs`) — confirm.
  waited: number;
  /** Screenshot as a base64 string, when one is attached. */
  screenshotBase64?: string;
  error?: string;
}


================================================
FILE: packages/core/lib/v3/types/public/api.ts
================================================
/**
 * Centralized Zod schemas for Stagehand Server API
 *
 * Naming conventions:
 * - `*RequestSchema` - Request body schemas (zod4), `*Request` is the inferred type
 * - `*ResultSchema` - Inner response data (unwrapped), `*Result` is the inferred type
 * - `*ResponseSchema` - Full response with success wrapper: { success: true, data: *Result }, `*Response` is the inferred type
 *
 * All TypeScript types are inferred from the Zod4 *Schemas using z.infer<>
 */
import { z } from "zod/v4";
import type Browserbase from "@browserbasehq/sdk";

// =============================================================================
// Shared Components
// =============================================================================

/**
 * Browser launch options for local browsers.
 *
 * Every field is optional. The object is `.strict()`, so unrecognized keys
 * fail validation. Metadata id: "LocalBrowserLaunchOptions".
 */
export const LocalBrowserLaunchOptionsSchema = z
  .object({
    args: z.array(z.string()).optional(),
    executablePath: z.string().optional(),
    port: z.number().optional(),
    userDataDir: z.string().optional(),
    preserveUserDataDir: z.boolean().optional(),
    headless: z.boolean().optional(),
    devtools: z.boolean().optional(),
    chromiumSandbox: z.boolean().optional(),
    // Either a boolean or an explicit list of argument strings.
    ignoreDefaultArgs: z.union([z.boolean(), z.array(z.string())]).optional(),
    // When a proxy is given, only `server` is required.
    proxy: z
      .object({
        server: z.string(),
        bypass: z.string().optional(),
        username: z.string().optional(),
        password: z.string().optional(),
      })
      .optional(),
    locale: z.string().optional(),
    // When a viewport is given, both dimensions are required.
    viewport: z.object({ width: z.number(), height: z.number() }).optional(),
    deviceScaleFactor: z.number().optional(),
    hasTouch: z.boolean().optional(),
    ignoreHTTPSErrors: z.boolean().optional(),
    cdpUrl: z.string().optional(),
    cdpHeaders: z.record(z.string(), z.string()).optional(),
    connectTimeoutMs: z.number().optional(),
    downloadsPath: z.string().optional(),
    acceptDownloads: z.boolean().optional(),
  })
  .strict()
  .meta({ id: "LocalBrowserLaunchOptions" });

/**
 * Detailed model configuration object.
 *
 * Only `modelName` is required; `provider`, `apiKey` and `baseURL` are optional.
 * `baseURL` must be a URL-formatted string. Metadata id: "ModelConfigObject".
 */
export const ModelConfigObjectSchema = z
  .object({
    provider: z
      .enum(["openai", "anthropic", "google", "microsoft", "bedrock"])
      .optional()
      .meta({
        description:
          "AI provider for the model (or provide a baseURL endpoint instead)",
        example: "openai",
      }),
    modelName: z.string().meta({
      description:
        "Model name string with provider prefix (e.g., 'openai/gpt-5-nano')",
      example: "openai/gpt-5-nano",
    }),
    apiKey: z.string().optional().meta({
      description: "API key for the model provider",
      example: "sk-some-openai-api-key",
    }),
    baseURL: z.string().url().optional().meta({
      description: "Base URL for the model provider",
      example: "https://api.openai.com/v1",
    }),
  })
  .meta({ id: "ModelConfigObject" });

/**
 * Model configuration.
 * Same validation as `ModelConfigObjectSchema`, re-tagged with the metadata id "ModelConfig".
 */
export const ModelConfigSchema = ModelConfigObjectSchema.meta({
  id: "ModelConfig",
});

/**
 * Action object returned by observe and used by act.
 *
 * `selector` and `description` are required; `backendNodeId`, `method` and
 * `arguments` are optional. Metadata id: "Action".
 */
export const ActionSchema = z
  .object({
    selector: z.string().meta({
      description: "CSS selector or XPath for the element",
      example: "[data-testid='submit-button']",
    }),
    description: z.string().meta({
      description: "Human-readable description of the action",
      example: "Click the submit button",
    }),
    backendNodeId: z.number().optional().meta({
      description: "Backend node ID for the element",
    }),
    method: z.string().optional().meta({
      description: "The method to execute (click, fill, etc.)",
      example: "click",
    }),
    // Arguments are validated as strings only.
    arguments: z
      .array(z.string())
      .optional()
      .meta({
        description: "Arguments to pass to the method",
        example: ["Hello World"],
      }),
  })
  .meta({
    id: "Action",
    description: "Action object returned by observe and used by act",
  });

/**
 * Session ID path parameter.
 * Strict object with a single required string `id`; unrecognized keys fail
 * validation. Metadata id: "SessionIdParams".
 */
export const SessionIdParamsSchema = z
  .object({
    id: z.string().meta({
      description: "Unique session identifier",
      example: "c4dbf3a9-9a58-4b22-8a1c-9f20f9f9e123",
    }),
  })
  .strict()
  .meta({ id: "SessionIdParams" });

/**
 * Browser configuration for session start.
 * All fields are optional. Unlike `LocalBrowserLaunchOptionsSchema`, this object
 * is not `.strict()`. Metadata id: "BrowserConfig".
 */
export const BrowserConfigSchema = z
  .object({
    type: z.enum(["local", "browserbase"]).optional().meta({
      description: "Browser type to use",
      example: "local",
    }),
    cdpUrl: z.string().optional().meta({
      description:
        "Chrome DevTools Protocol URL for connecting to existing browser",
      example: "ws://localhost:9222",
    }),
    // Nested launch options are validated by the strict local-launch schema.
    launchOptions: LocalBrowserLaunchOptionsSchema.optional(),
  })
  .meta({ id: "BrowserConfig" });

// =============================================================================
// Request Headers (operational only - auth headers are in security schemes)
// =============================================================================

/**
 * Operational headers for all session requests (auth handled via security schemes).
 * `x-stream-response` is optional and validated as the string "true" or "false"
 * (not a boolean). Metadata id: "SessionHeaders".
 */
export const SessionHeadersSchema = z
  .object({
    "x-stream-response": z.enum(["true", "false"]).optional().meta({
      description: "Whether to stream the response via SSE",
      example: "true",
    }),
  })
  .meta({ id: "SessionHeaders" });

// =============================================================================
// Response Wrapper Helper
// =============================================================================

/**
 * Builds the standard response envelope around a result schema.
 *
 * @param resultSchema - Schema validating the `data` payload.
 * @param name - Metadata id assigned to the resulting envelope schema.
 * @returns An object schema `{ success: boolean, data: <resultSchema> }` tagged with `name`.
 */
const wrapResponse = <T extends z.ZodTypeAny>(resultSchema: T, name: string) => {
  // Assemble the envelope first, then attach the id as a separate step.
  const envelope = z.object({
    success: z.boolean().meta({
      description: "Indicates whether the request was successful",
    }),
    data: resultSchema,
  });
  return envelope.meta({ id: name });
};

/**
 * Standard error response.
 * `success` must be the literal `false`; `error` is required and `code` is optional.
 * Strict: unrecognized keys fail validation. Metadata id: "ErrorResponse".
 */
export const ErrorResponseSchema = z
  .object({
    success: z.literal(false),
    error: z.string(),
    code: z.string().optional(),
  })
  .strict()
  .meta({ id: "ErrorResponse" });

// =============================================================================
// Browserbase Session Create Params (Zod + hints duplicate of Browserbase.Sessions.SessionCreateParams)
// =============================================================================

/**
 * Browserbase viewport configuration.
 * Both dimensions are optional here (the local-launch viewport requires both).
 * Metadata id: "BrowserbaseViewport".
 */
export const BrowserbaseViewportSchema = z
  .object({
    width: z.number().optional(),
    height: z.number().optional(),
  })
  .meta({ id: "BrowserbaseViewport" });

/**
 * Browserbase fingerprint screen configuration.
 * Four optional numeric bounds (min/max width and height).
 * Metadata id: "BrowserbaseFingerprintScreen".
 */
export const BrowserbaseFingerprintScreenSchema = z
  .object({
    maxHeight: z.number().optional(),
    maxWidth: z.number().optional(),
    minHeight: z.number().optional(),
    minWidth: z.number().optional(),
  })
  .meta({ id: "BrowserbaseFingerprintScreen" });

/**
 * Browserbase fingerprint configuration for stealth mode.
 * All fields are optional; enumerated fields accept only the listed literals.
 * Metadata id: "BrowserbaseFingerprint".
 */
export const BrowserbaseFingerprintSchema = z
  .object({
    browsers: z
      .array(z.enum(["chrome", "edge", "firefox", "safari"]))
      .optional(),
    devices: z.array(z.enum(["desktop", "mobile"])).optional(),
    // Validated as the string "1" or "2", not a number.
    httpVersion: z.enum(["1", "2"]).optional(),
    locales: z.array(z.string()).optional(),
    operatingSystems: z
      .array(z.enum(["android", "ios", "linux", "macos", "windows"]))
      .optional(),
    screen: BrowserbaseFingerprintScreenSchema.optional(),
  })
  .meta({ id: "BrowserbaseFingerprint" });

/**
 * Browserbase context configuration for session persistence.
 * `id` is required; `persist` is optional. Metadata id: "BrowserbaseContext".
 */
export const BrowserbaseContextSchema = z
  .object({
    id: z.string(),
    persist: z.boolean().optional(),
  })
  .meta({ id: "BrowserbaseContext" });

/**
 * Browserbase browser settings for session creation.
 * All fields are optional; `context`, `fingerprint` and `viewport` reuse the
 * dedicated schemas declared in this file. Metadata id: "BrowserbaseBrowserSettings".
 */
export const BrowserbaseBrowserSettingsSchema = z
  .object({
    advancedStealth: z.boolean().optional(),
    blockAds: z.boolean().optional(),
    context: BrowserbaseContextSchema.optional(),
    extensionId: z.string().optional(),
    fingerprint: BrowserbaseFingerprintSchema.optional(),
    logSession: z.boolean().optional(),
    recordSession: z.boolean().optional(),
    solveCaptchas: z.boolean().optional(),
    viewport: BrowserbaseViewportSchema.optional(),
  })
  .meta({ id: "BrowserbaseBrowserSettings" });

/**
 * Browserbase managed proxy geolocation configuration.
 * `country` is required; `city` and `state` are optional.
 * Metadata id: "BrowserbaseProxyGeolocation".
 */
export const BrowserbaseProxyGeolocationSchema = z
  .object({
    country: z.string(),
    city: z.string().optional(),
    state: z.string().optional(),
  })
  .meta({ id: "BrowserbaseProxyGeolocation" });

/**
 * Browserbase managed proxy configuration.
 * The literal `type: "browserbase"` is the discriminator used by `ProxyConfigSchema`.
 * Metadata id: "BrowserbaseProxyConfig".
 */
export const BrowserbaseProxyConfigSchema = z
  .object({
    type: z.literal("browserbase"),
    domainPattern: z.string().optional(),
    geolocation: BrowserbaseProxyGeolocationSchema.optional(),
  })
  .meta({ id: "BrowserbaseProxyConfig" });

/**
 * External proxy configuration.
 * The literal `type: "external"` is the discriminator used by `ProxyConfigSchema`.
 * `server` is required; credentials and `domainPattern` are optional.
 * Metadata id: "ExternalProxyConfig".
 */
export const ExternalProxyConfigSchema = z
  .object({
    type: z.literal("external"),
    server: z.string(),
    domainPattern: z.string().optional(),
    username: z.string().optional(),
    password: z.string().optional(),
  })
  .meta({ id: "ExternalProxyConfig" });

/**
 * Union of proxy configuration types.
 * Discriminated on `type` ("browserbase" | "external"), which selects the
 * member schema used for validation. Metadata id: "ProxyConfig".
 */
export const ProxyConfigSchema = z
  .discriminatedUnion("type", [
    BrowserbaseProxyConfigSchema,
    ExternalProxyConfigSchema,
  ])
  .meta({ id: "ProxyConfig" });

/**
 * Browserbase region identifier for multi-region support.
 *
 * Only the four region strings listed in the enum below are accepted.
 */
export const BrowserbaseRegionSchema = z
  .enum(["us-west-2", "us-east-1", "eu-central-1", "ap-southeast-1"])
  .meta({ id: "BrowserbaseRegion" });

/**
 * Browserbase session creation parameters.
 *
 * All fields are optional. `proxies` accepts either a boolean or an array of
 * proxy configurations; `userMetadata` is a free-form record with string keys
 * and unvalidated values.
 */
export const BrowserbaseSessionCreateParamsSchema = z
  .object({
    projectId: z.string().optional(),
    browserSettings: BrowserbaseBrowserSettingsSchema.optional(),
    extensionId: z.string().optional(),
    keepAlive: z.boolean().optional(),
    proxies: z.union([z.boolean(), z.array(ProxyConfigSchema)]).optional(),
    region: BrowserbaseRegionSchema.optional(),
    timeout: z.number().optional(),
    userMetadata: z.record(z.string(), z.unknown()).optional(),
  })
  .meta({ id: "BrowserbaseSessionCreateParams" });

// =============================================================================
// Session Start
// =============================================================================

/**
 * Request body for starting a session.
 *
 * `modelName` is the only required field; everything else is optional.
 * The trailing fields (`experimental`, `waitForCaptchaSolves`, `actTimeoutMs`)
 * exist only for type-sharing / V2 compatibility, as noted inline.
 */
export const SessionStartRequestSchema = z
  .object({
    modelName: z.string().meta({
      description: "Model name to use for AI operations",
      example: "openai/gpt-4o",
    }),
    domSettleTimeoutMs: z.number().optional().meta({
      description: "Timeout in ms to wait for DOM to settle",
      example: 5000,
    }),
    verbose: z
      .union([z.literal(0), z.literal(1), z.literal(2)])
      .optional()
      .meta({
        description: "Logging verbosity level (0=quiet, 1=normal, 2=debug)",
        example: 1,
        // Rewrite the generated JSON Schema in place: drop any composite
        // keywords produced for the union of literals and emit a flat
        // `type: "number"` with `enum: [0, 1, 2]` instead.
        override: ({ jsonSchema }: { jsonSchema: Record<string, unknown> }) => {
          delete jsonSchema.anyOf;
          delete jsonSchema.allOf;
          delete jsonSchema.oneOf;
          jsonSchema.type = "number";
          jsonSchema.enum = [0, 1, 2];
        },
      }),
    systemPrompt: z.string().optional().meta({
      description: "Custom system prompt for AI operations",
    }),
    browserbaseSessionCreateParams:
      BrowserbaseSessionCreateParamsSchema.optional(),
    browser: BrowserConfigSchema.optional(),
    selfHeal: z.boolean().optional().meta({
      description: "Enable self-healing for failed actions",
      example: true,
    }),
    browserbaseSessionID: z.string().optional().meta({
      description: "Existing Browserbase session ID to resume",
    }),
    // experimental is a V3 field but doesn't need to go over the wire - included because wire type imports options type
    experimental: z.boolean().optional(),
    // V2 compatibility fields - only included because the server imports this type and supports V2
    // should never be used in v3 clients or v3-only server implementations
    waitForCaptchaSolves: z.boolean().optional().meta({
      description: "Wait for captcha solves (deprecated, v2 only)",
    }),
    actTimeoutMs: z.number().optional().meta({
      description: "Timeout in ms for act operations (deprecated, v2 only)",
    }),
  })
  .meta({ id: "SessionStartRequest" });

/**
 * Result payload of a session start.
 *
 * `sessionId` and `available` are required. `cdpUrl` is nullish: it may be a
 * string, `null`, or omitted entirely.
 */
export const SessionStartResultSchema = z
  .object({
    sessionId: z.string().meta({
      description: "Unique Browserbase session identifier",
      example: "c4dbf3a9-9a58-4b22-8a1c-9f20f9f9e123",
    }),
    cdpUrl: z.string().nullish().meta({
      description:
        "CDP WebSocket URL for connecting to the Browserbase cloud browser (present when available)",
      example: "wss://connect.browserbase.com/?signingKey=abc123",
    }),
    available: z.boolean(),
  })
  .meta({ id: "SessionStartResult" });

/**
 * Session start response: `SessionStartResultSchema` passed through the
 * file's `wrapResponse` helper and registered as "SessionStartResponse".
 */
export const SessionStartResponseSchema = wrapResponse(
  SessionStartResultSchema,
  "SessionStartResponse",
);

// =============================================================================
// Session End
// =============================================================================

/**
 * Session end request - no request body.
 *
 * Modelled as a strict empty object (unknown keys are rejected) that is also
 * optional, so the body may be omitted altogether.
 */
export const SessionEndRequestSchema = z
  .object({})
  .strict()
  .optional()
  .meta({ id: "SessionEndRequest" });

/** Session end result: a strict empty object (no fields, unknown keys rejected). */
export const SessionEndResultSchema = z
  .object({})
  .strict()
  .meta({ id: "SessionEndResult" });

/**
 * Session end response - just success flag, no data wrapper.
 *
 * Unlike the other responses in this file this one is declared directly rather
 * than via `wrapResponse`, and is strict: `success` is the only permitted key.
 */
export const SessionEndResponseSchema = z
  .object({
    success: z.boolean().meta({
      description: "Indicates whether the request was successful",
    }),
  })
  .strict()
  .meta({ id: "SessionEndResponse" });

// =============================================================================
// Act
// =============================================================================

/**
 * Options for an act request.
 *
 * The whole object is optional, and so is each field inside it. `model` may be
 * either a model configuration object or a bare model-name string; `variables`
 * is a string-to-string record.
 */
export const ActOptionsSchema = z
  .object({
    model: z.union([ModelConfigSchema, z.string()]).optional().meta({
      description:
        "Model configuration object or model name string (e.g., 'openai/gpt-5-nano')",
    }),
    variables: z
      .record(z.string(), z.string())
      .optional()
      .meta({
        description: "Variables to substitute in the action instruction",
        example: { username: "john_doe" },
      }),
    timeout: z.number().optional().meta({
      description: "Timeout in ms for the action",
      example: 30000,
    }),
  })
  .optional()
  .meta({ id: "ActOptions" });

/**
 * Request body for the act endpoint.
 *
 * `input` is required and is either a natural-language string or an Action
 * object. `options`, `frameId` (nullish) and `streamResponse` may be omitted.
 */
export const ActRequestSchema = z
  .object({
    input: z.string().or(ActionSchema).meta({
      description: "Natural language instruction or Action object",
      example: "Click the login button",
    }),
    options: ActOptionsSchema,
    frameId: z.string().nullish().meta({
      description: "Target frame ID for the action",
    }),
    streamResponse: z.boolean().optional().meta({
      description: "Whether to stream the response via SSE",
      example: true,
    }),
  })
  .meta({ id: "ActRequest" });

/**
 * Inner act result data.
 *
 * All four fields are required: the success flag, a human-readable message,
 * a description of the performed action, and the list of executed actions.
 */
export const ActResultDataSchema = z
  .object({
    success: z.boolean().meta({
      description: "Whether the action completed successfully",
      example: true,
    }),
    message: z.string().meta({
      description: "Human-readable result message",
      example: "Successfully clicked the login button",
    }),
    actionDescription: z.string().meta({
      description: "Description of the action that was performed",
      example: "Clicked button with text 'Login'",
    }),
    actions: z.array(ActionSchema).meta({
      description: "List of actions that were executed",
    }),
  })
  .meta({ id: "ActResultData" });

/** Act result: the required inner `result` data plus an optional tracking `actionId`. */
export const ActResultSchema = z
  .object({
    result: ActResultDataSchema,
    actionId: z.string().optional().meta({
      description: "Action ID for tracking",
    }),
  })
  .meta({ id: "ActResult" });

/** Act response: `ActResultSchema` passed through `wrapResponse` and registered as "ActResponse". */
export const ActResponseSchema = wrapResponse(ActResultSchema, "ActResponse");

// =============================================================================
// Extract
// =============================================================================

/**
 * Options for an extract request.
 *
 * The whole object is optional, and so is each field inside it: a model
 * (configuration object or name string), a timeout in ms, and a selector
 * string used to scope the extraction.
 */
export const ExtractOptionsSchema = z
  .object({
    model: z.union([ModelConfigSchema, z.string()]).optional().meta({
      description:
        "Model configuration object or model name string (e.g., 'openai/gpt-5-nano')",
    }),
    timeout: z.number().optional().meta({
      description: "Timeout in ms for the extraction",
      example: 30000,
    }),
    selector: z.string().optional().meta({
      description: "CSS selector to scope extraction to a specific element",
      example: "#main-content",
    }),
  })
  .optional()
  .meta({ id: "ExtractOptions" });

/**
 * Request body for the extract endpoint.
 *
 * No field is required. `schema` is accepted as an arbitrary record (its
 * contents are not validated here); `frameId` is nullish.
 */
export const ExtractRequestSchema = z
  .object({
    instruction: z.string().optional().meta({
      description: "Natural language instruction for what to extract",
      example: "Extract all product names and prices from the page",
    }),
    schema: z.record(z.string(), z.unknown()).optional().meta({
      description: "JSON Schema defining the structure of data to extract",
    }),
    options: ExtractOptionsSchema,
    frameId: z.string().nullish().meta({
      description: "Target frame ID for the extraction",
    }),
    streamResponse: z.boolean().optional().meta({
      description: "Whether to stream the response via SSE",
      example: true,
    }),
  })
  .meta({ id: "ExtractRequest" });

/**
 * Extract result: an untyped `result` value plus an optional tracking
 * `actionId`.
 */
export const ExtractResultSchema = z
  .object({
    result: z.unknown().meta({
      description: "Extracted data matching the requested schema",
      // Adds the `x-stainless-any` extension to the generated JSON Schema.
      // NOTE(review): presumably tells the Stainless generator to treat this
      // as an "any" value - confirm against the Stainless docs.
      override: ({ jsonSchema }: { jsonSchema: Record<string, unknown> }) => {
        jsonSchema["x-stainless-any"] = true;
      },
    }),
    actionId: z.string().optional().meta({
      description: "Action ID for tracking",
    }),
  })
  .meta({ id: "ExtractResult" });

/**
 * Extract response: `ExtractResultSchema` passed through `wrapResponse` and
 * registered as "ExtractResponse".
 */
export const ExtractResponseSchema = wrapResponse(
  ExtractResultSchema,
  "ExtractResponse",
);

// =============================================================================
// Observe
// =============================================================================

/**
 * Options for an observe request.
 *
 * The whole object is optional, and so is each field inside it: a model
 * (configuration object or name string), a timeout in ms, and a selector
 * string used to scope the observation.
 */
export const ObserveOptionsSchema = z
  .object({
    model: z.union([ModelConfigSchema, z.string()]).optional().meta({
      description:
        "Model configuration object or model name string (e.g., 'openai/gpt-5-nano')",
    }),
    timeout: z.number().optional().meta({
      description: "Timeout in ms for the observation",
      example: 30000,
    }),
    selector: z.string().optional().meta({
      description: "CSS selector to scope observation to a specific element",
      example: "nav",
    }),
  })
  .optional()
  .meta({ id: "ObserveOptions" });

/**
 * Request body for the observe endpoint.
 *
 * No field is required; `frameId` is nullish and the rest are optional.
 */
export const ObserveRequestSchema = z
  .object({
    instruction: z.string().optional().meta({
      description: "Natural language instruction for what actions to find",
      example: "Find all clickable navigation links",
    }),
    options: ObserveOptionsSchema,
    frameId: z.string().nullish().meta({
      description: "Target frame ID for the observation",
    }),
    streamResponse: z.boolean().optional().meta({
      description: "Whether to stream the response via SSE",
      example: true,
    }),
  })
  .meta({ id: "ObserveRequest" });

/** Observe result: a required array of Action objects plus an optional tracking `actionId`. */
export const ObserveResultSchema = z
  .object({
    result: z.array(ActionSchema),
    actionId: z.string().optional().meta({
      description: "Action ID for tracking",
    }),
  })
  .meta({ id: "ObserveResult" });

/**
 * Observe response: `ObserveResultSchema` passed through `wrapResponse` and
 * registered as "ObserveResponse".
 */
export const ObserveResponseSchema = wrapResponse(
  ObserveResultSchema,
  "ObserveResponse",
);

// =============================================================================
// Agent Execute
// =============================================================================

/**
 * Agent configuration for an agent-execute request.
 *
 * Every field is optional. `provider` and `cua` are legacy/deprecated inputs
 * (see their descriptions); `model` and `executionModel` each accept either a
 * model configuration object or a model-name string.
 */
export const AgentConfigSchema = z
  .object({
    provider: z // cloud accepts provider: at the top level for legacy reasons, in the future we should remove it
      .enum(["openai", "anthropic", "google", "microsoft", "bedrock"])
      .optional()
      .meta({
        description:
          "AI provider for the agent (legacy, use model: openai/gpt-5-nano instead)",
        example: "openai",
      }),
    model: z.union([ModelConfigSchema, z.string()]).optional().meta({
      description:
        "Model configuration object or model name string (e.g., 'openai/gpt-5-nano')",
    }),
    systemPrompt: z.string().optional().meta({
      description: "Custom system prompt for the agent",
    }),
    cua: z.boolean().optional().meta({
      description:
        "Deprecated. Use mode: 'cua' instead. If both are provided, mode takes precedence.",
      example: true,
    }),
    mode: z.enum(["dom", "hybrid", "cua"]).optional().meta({
      description:
        "Tool mode for the agent (dom, hybrid, cua). If set, overrides cua.",
      example: "cua",
    }),
    executionModel: z.union([ModelConfigSchema, z.string()]).optional().meta({
      description:
        "Model configuration object or model name string (e.g., 'openai/gpt-5-nano') for tool execution (observe/act calls within agent tools). If not specified, inherits from the main model configuration.",
    }),
  })
  .meta({ id: "AgentConfig" });

/**
 * Action taken by the agent during execution.
 *
 * Only `type` is required. The schema is `.passthrough()`, so keys beyond the
 * ones declared here are kept on the parsed value instead of being stripped.
 */
export const AgentActionSchema = z
  .object({
    type: z.string().meta({
      description: "Type of action taken",
      example: "click",
    }),
    reasoning: z.string().optional().meta({
      description: "Agent's reasoning for taking this action",
    }),
    taskCompleted: z.boolean().optional(),
    action: z.string().optional(),
    timeMs: z.number().optional().meta({
      description: "Time taken for this action in ms",
    }),
    pageText: z.string().optional(),
    pageUrl: z.string().optional(),
    instruction: z.string().optional(),
  })
  .passthrough()
  .meta({ id: "AgentAction" });

/**
 * Token usage statistics for agent execution.
 *
 * Keys are snake_case. `input_tokens`, `output_tokens` and `inference_time_ms`
 * are required; `reasoning_tokens` and `cached_input_tokens` are optional.
 */
export const AgentUsageSchema = z
  .object({
    input_tokens: z.number().meta({ example: 1500 }),
    output_tokens: z.number().meta({ example: 250 }),
    reasoning_tokens: z.number().optional(),
    cached_input_tokens: z.number().optional(),
    inference_time_ms: z.number().meta({ example: 2500 }),
  })
  .meta({ id: "AgentUsage" });

/**
 * Result data from agent execution.
 *
 * `success`, `message`, `actions` and `completed` are required; `metadata`
 * (free-form record) and `usage` are optional.
 */
export const AgentResultDataSchema = z
  .object({
    success: z.boolean().meta({
      description: "Whether the agent completed successfully",
      example: true,
    }),
    message: z.string().meta({
      description: "Summary of what the agent accomplished",
      example: "Successfully logged in and navigated to dashboard",
    }),
    actions: z.array(AgentActionSchema),
    completed: z.boolean().meta({
      description: "Whether the agent finished its task",
      example: true,
    }),
    metadata: z.record(z.string(), z.unknown()).optional(),
    usage: AgentUsageSchema.optional(),
  })
  .meta({ id: "AgentResultData" });

/**
 * Cache entry returned alongside an agent result.
 *
 * Pairs a string `cacheKey` with an `entry` payload whose shape is not
 * validated by this schema.
 */
export const AgentCacheEntrySchema = z
  .object({
    cacheKey: z.string().meta({
      description:
        "Opaque cache identifier computed from instruction, URL, options, and config",
    }),
    entry: z.unknown().meta({
      description: "Serialized cache entry that can be written to disk",
    }),
  })
  .meta({ id: "AgentCacheEntry" });

/**
 * Per-run options for agent execution.
 *
 * `instruction` is required; the step limit, cursor highlighting, search
 * toggle and per-tool timeout are optional.
 */
export const AgentExecuteOptionsSchema = z
  .object({
    instruction: z.string().meta({
      description: "Natural language instruction for the agent",
      example:
        "Log in with username 'demo' and password 'test123', then navigate to settings",
    }),
    maxSteps: z.number().optional().meta({
      description: "Maximum number of steps the agent can take",
      example: 20,
    }),
    highlightCursor: z.boolean().optional().meta({
      description: "Whether to visually highlight the cursor during execution",
      example: true,
    }),
    useSearch: z.boolean().optional().meta({
      description:
        "Whether to enable the web search tool powered by Browserbase Search API",
      example: true,
    }),
    toolTimeout: z.number().optional().meta({
      description: "Timeout in milliseconds for each agent tool call",
      example: 30000,
    }),
  })
  .meta({ id: "AgentExecuteOptions" });

/**
 * Request body for the agent-execute endpoint.
 *
 * `agentConfig` and `executeOptions` are both required objects (unlike the
 * `options` field of the act/extract/observe requests, neither schema is
 * marked optional). `frameId` is nullish; the two boolean flags are optional.
 */
export const AgentExecuteRequestSchema = z
  .object({
    agentConfig: AgentConfigSchema,
    executeOptions: AgentExecuteOptionsSchema,
    frameId: z.string().nullish().meta({
      description: "Target frame ID for the agent",
    }),
    streamResponse: z.boolean().optional().meta({
      description: "Whether to stream the response via SSE",
      example: true,
    }),
    shouldCache: z.boolean().optional().meta({
      description:
        "If true, the server captures a cache entry and returns it to the client",
    }),
  })
  .meta({ id: "AgentExecuteRequest" });

/** Agent-execute result: the required agent `result` data plus an optional `cacheEntry`. */
export const AgentExecuteResultSchema = z
  .object({
    result: AgentResultDataSchema,
    cacheEntry: AgentCacheEntrySchema.optional(),
  })
  .meta({ id: "AgentExecuteResult" });

/**
 * Agent-execute response: `AgentExecuteResultSchema` passed through
 * `wrapResponse` and registered as "AgentExecuteResponse".
 */
export const AgentExecuteResponseSchema = wrapResponse(
  AgentExecuteResultSchema,
  "AgentExecuteResponse",
);

// =============================================================================
// Navigate
// =============================================================================

/**
 * Options for a navigate request.
 *
 * The whole object is optional, and so is each field inside it. `waitUntil`
 * is restricted to "load", "domcontentloaded" or "networkidle".
 */
export const NavigateOptionsSchema = z
  .object({
    referer: z.string().optional().meta({
      description: "Referer header to send with the request",
    }),
    timeout: z.number().optional().meta({
      description: "Timeout in ms for the navigation",
      example: 30000,
    }),
    waitUntil: z
      .enum(["load", "domcontentloaded", "networkidle"])
      .optional()
      .meta({
        description: "When to consider navigation complete",
        example: "networkidle",
      }),
  })
  .optional()
  .meta({ id: "NavigateOptions" });

/**
 * Request body for the navigate endpoint.
 *
 * `url` is required (validated only as a string, not as a URL). `options`,
 * `frameId` (nullish) and `streamResponse` may be omitted.
 */
export const NavigateRequestSchema = z
  .object({
    url: z.string().meta({
      description: "URL to navigate to",
      example: "https://example.com",
    }),
    options: NavigateOptionsSchema,
    frameId: z.string().nullish().meta({
      description: "Target frame ID for the navigation",
    }),
    streamResponse: z.boolean().optional().meta({
      description: "Whether to stream the response via SSE",
      example: true,
    }),
  })
  .meta({ id: "NavigateRequest" });

/**
 * Navigate result: an untyped, nullable `result` plus an optional tracking
 * `actionId`.
 */
export const NavigateResultSchema = z
  .object({
    // SerializableResponse from types/private/api.ts - no Zod schema available
    // as it wraps complex devtools-protocol types (Protocol.Network.Response)
    result: z
      .unknown()
      .nullable()
      .meta({
        description: "Navigation response (Playwright Response object or null)",
        // Adds the `x-stainless-any` extension to the generated JSON Schema.
        override: ({ jsonSchema }: { jsonSchema: Record<string, unknown> }) => {
          jsonSchema["x-stainless-any"] = true;
        },
      }),
    actionId: z.string().optional().meta({
      description: "Action ID for tracking",
    }),
  })
  .meta({ id: "NavigateResult" });

/**
 * Navigate response: `NavigateResultSchema` passed through `wrapResponse` and
 * registered as "NavigateResponse".
 */
export const NavigateResponseSchema = wrapResponse(
  NavigateResultSchema,
  "NavigateResponse",
);

// =============================================================================
// Replay Metrics
// =============================================================================

/**
 * Token usage for a single action.
 *
 * All four numeric fields are optional. Keys are camelCase here, unlike the
 * snake_case keys of `AgentUsageSchema`.
 */
export const TokenUsageSchema = z
  .object({
    inputTokens: z.number().optional(),
    outputTokens: z.number().optional(),
    timeMs: z.number().optional(),
    cost: z.number().optional(),
  })
  .meta({ id: "TokenUsage" });

/**
 * Action entry in replay metrics.
 *
 * `method`, `parameters`, `result` and `timestamp` are required; `endTime`
 * and `tokenUsage` are optional. `parameters` and `result` are free-form
 * records with string keys.
 */
export const ReplayActionSchema = z
  .object({
    method: z.string(),
    parameters: z.record(z.string(), z.unknown()),
    result: z.record(z.string(), z.unknown()),
    timestamp: z.number(),
    endTime: z.number().optional(),
    tokenUsage: TokenUsageSchema.optional(),
  })
  .meta({ id: "ReplayAction" });

/**
 * Page entry in replay metrics.
 *
 * All fields are required: the page `url`, numeric `timestamp` and
 * `duration`, and the list of actions recorded for the page.
 */
export const ReplayPageSchema = z
  .object({
    url: z.string(),
    timestamp: z.number(),
    duration: z.number(),
    actions: z.array(ReplayActionSchema),
  })
  .meta({ id: "ReplayPage" });

/**
 * Inner result data for replay.
 *
 * `pages` is a required array of page entries; `clientLanguage` is an
 * optional string.
 */
export const ReplayResultSchema = z
  .object({
    pages: z.array(ReplayPageSchema),
    clientLanguage: z.string().optional(),
  })
  .meta({ id: "ReplayResult" });

/**
 * Replay response: `ReplayResultSchema` passed through `wrapResponse` and
 * registered as "ReplayResponse".
 */
export const ReplayResponseSchema = wrapResponse(
  ReplayResultSchema,
  "ReplayResponse",
);

// =============================================================================
// SSE Stream Events
// =============================================================================
// These schemas define the Server-Sent Events format for streaming responses.
// Streaming is enabled by setting the `x-stream-response: true` header.

/**
 * Status values for SSE stream events.
 *
 * One of "starting", "connected", "running", "finished" or "error".
 */
export const StreamEventStatusSchema = z
  .enum(["starting", "connected", "running", "finished", "error"])
  .meta({
    id: "StreamEventStatus",
    description: "Current status of the streaming operation",
  });

/**
 * Type discriminator for SSE stream events.
 *
 * Either "system" or "log".
 */
export const StreamEventTypeSchema = z.enum(["system", "log"]).meta({
  id: "StreamEventType",
  description: "Type of stream event - system events or log messages",
});

/**
 * Data payload for system stream events.
 *
 * `status` is required and declared first; `result` (untyped) and `error` are
 * optional. Note that the schema itself does not tie `result`/`error` to a
 * particular status - that pairing is only stated in the field descriptions.
 */
export const StreamEventSystemDataSchema = z
  .object({
    status: StreamEventStatusSchema,
    result: z
      .unknown()
      .optional()
      .meta({
        description: "Operation result (present when status is 'finished')",
        // Adds the `x-stainless-any` extension to the generated JSON Schema.
        override: ({ jsonSchema }: { jsonSchema: Record<string, unknown> }) => {
          jsonSchema["x-stainless-any"] = true;
        },
      }),
    error: z.string().optional().meta({
      description: "Error message (present when status is 'error')",
    }),
  })
  .meta({ id: "StreamEventSystemData" });

/**
 * Data payload for log stream events.
 *
 * `status` is fixed to the literal "running"; `message` is a required string.
 */
export const StreamEventLogDataSchema = z
  .object({
    status: z.literal("running"),
    message: z.string().meta({
      description: "Log message from the operation",
    }),
  })
  .meta({ id: "StreamEventLogData" });

/**
 * SSE stream event sent during streaming responses.
 *
 * IMPORTANT: Key ordering matters for Stainless SDK generation.
 * The `data` field MUST be serialized first, with `status` as the first key within it.
 * This allows Stainless to use `data_starts_with: '{"data":{"status":"finished"'` for event handling.
 *
 * Expected serialization order: {"data":{"status":...},"type":...,"id":...}
 *
 * `data` is a plain (non-discriminated) union of the system and log payloads,
 * `type` is the event-type enum, and `id` must be a UUID string.
 */
export const StreamEventSchema = z
  .object({
    // Keep `data` as the first key - see the ordering note above.
    data: z.union([StreamEventSystemDataSchema, StreamEventLogDataSchema]),
    type: StreamEventTypeSchema,
    id: z.string().uuid().meta({
      description: "Unique identifier for this event",
      example: "c4dbf3a9-9a58-4b22-8a1c-9f20f9f9e123",
    }),
  })
  .meta({
    id: "StreamEvent",
    description:
      "Server-Sent Event emitted during streaming responses. Events are sent as `data: <JSON>\\n\\n`. Key order: data (with status first), type, id.",
  });

// =============================================================================
// OpenAPI Components
// =============================================================================
// These objects are exported for use in gen-openapi.ts to configure the spec.

/**
 * OpenAPI security schemes for authentication.
 *
 * Three header-based `apiKey` schemes: the Browserbase API key
 * (`x-bb-api-key`), the Browserbase project ID (`x-bb-project-id`) and the
 * model provider API key (`x-model-api-key`). Declared `as const` so the
 * literal values are preserved in the type.
 */
export const openApiSecuritySchemes = {
  BrowserbaseApiKey: {
    type: "apiKey",
    in: "header",
    name: "x-bb-api-key",
    description: "Browserbase API key for authentication",
  },
  BrowserbaseProjectId: {
    type: "apiKey",
    in: "header",
    name: "x-bb-project-id",
    description: "Browserbase project ID",
  },
  ModelApiKey: {
    type: "apiKey",
    in: "header",
    name: "x-model-api-key",
    description: "API key for the AI model provider (OpenAI, Anthropic, etc.)",
  },
} as const;

/**
 * OpenAPI links for session operations (used in SessionStart response).
 *
 * Every link maps the `id` parameter of its target operation to the runtime
 * expression `$response.body#/data/sessionId`, i.e. the session ID found
 * under `data` in the response body. Each `operationId` matches the
 * identically named entry in `Operations`.
 */
export const openApiLinks = {
  SessionAct: {
    operationId: "SessionAct",
    parameters: { id: "$response.body#/data/sessionId" },
    description: "Perform an action on the session",
  },
  SessionExtract: {
    operationId: "SessionExtract",
    parameters: { id: "$response.body#/data/sessionId" },
    description: "Extract data from the session",
  },
  SessionObserve: {
    operationId: "SessionObserve",
    parameters: { id: "$response.body#/data/sessionId" },
    description: "Observe available actions on the session",
  },
  SessionNavigate: {
    operationId: "SessionNavigate",
    parameters: { id: "$response.body#/data/sessionId" },
    description: "Navigate to a URL in the session",
  },
  SessionAgentExecute: {
    operationId: "SessionAgentExecute",
    parameters: { id: "$response.body#/data/sessionId" },
    description: "Execute an agent on the session",
  },
  SessionReplay: {
    operationId: "SessionReplay",
    parameters: { id: "$response.body#/data/sessionId" },
    description: "Replay session metrics",
  },
  SessionEnd: {
    operationId: "SessionEnd",
    parameters: { id: "$response.body#/data/sessionId" },
    description: "End the session and release resources",
  },
} as const;

/**
 * OpenAPI operation metadata for each endpoint.
 *
 * One entry per endpoint, keyed by the same string used as its `operationId`,
 * each carrying a short `summary` and a longer `description`. Declared
 * `as const` so the literal values are preserved in the type.
 */
export const Operations = {
  SessionStart: {
    operationId: "SessionStart",
    summary: "Start a new browser session",
    description:
      "Creates a new browser session with the specified configuration. Returns a session ID used for all subsequent operations.",
  },
  SessionEnd: {
    operationId: "SessionEnd",
    summary: "End a browser session",
    description:
      "Terminates the browser session and releases all associated resources.",
  },
  SessionAct: {
    operationId: "SessionAct",
    summary: "Perform an action",
    description:
      "Executes a browser action using natural language instructions or a predefined Action object.",
  },
  SessionExtract: {
    operationId: "SessionExtract",
    summary: "Extract data from the page",
    description:
      "Extracts structured data from the current page using AI-powered analysis.",
  },
  SessionObserve: {
    operationId: "SessionObserve",
    summary: "Observe available actions",
    description:
      "Identifies and returns available actions on the current page that match the given instruction.",
  },
  SessionNavigate: {
    operationId: "SessionNavigate",
    summary: "Navigate to a URL",
    description: "Navigates the browser to the specified URL.",
  },
  SessionAgentExecute: {
    operationId: "SessionAgentExecute",
    summary: "Execute an AI agent",
    description:
      "Runs an autonomous AI agent that can perform complex multi-step browser tasks.",
  },
  SessionReplay: {
    operationId: "SessionReplay",
    summary: "Replay session metrics",
    description: "Retrieves replay metrics for a session.",
  },
} as const;

// =============================================================================
// Type Exports (inferred from schemas)
// =============================================================================

// Shared types
// Each alias below is the static type zod infers from the schema of the same
// name (minus the `Schema` suffix), so the types cannot diverge from validation.
export type Action = z.infer<typeof ActionSchema>;
export type ModelConfig = z.infer<typeof ModelConfigSchema>;
export type BrowserConfig = z.infer<typeof BrowserConfigSchema>;
export type SessionIdParams = z.infer<typeof SessionIdParamsSchema>;

// Header types
export type SessionHeaders = z.infer<typeof SessionHeadersSchema>;

// Browserbase types
export type BrowserbaseViewport = z.infer<typeof BrowserbaseViewportSchema>;
export type BrowserbaseFingerprintScreen = z.infer<
  typeof BrowserbaseFingerprintScreenSchema
>;
export type BrowserbaseFingerprint = z.infer<
  typeof BrowserbaseFingerprintSchema
>;
export type BrowserbaseContext = z.infer<typeof BrowserbaseContextSchema>;
export type BrowserbaseBrowserSettings = z.infer<
  typeof BrowserbaseBrowserSettingsSchema
>;
export type BrowserbaseProxyGeolocation = z.infer<
  typeof BrowserbaseProxyGeolocationSchema
>;
export type BrowserbaseProxyConfig = z.infer<
  typeof BrowserbaseProxyConfigSchema
>;
export type ExternalProxyConfig = z.infer<typeof ExternalProxyConfigSchema>;
export type BrowserbaseRegion = z.infer<typeof BrowserbaseRegionSchema>;
export type BrowserbaseSessionCreateParams = z.infer<
  typeof BrowserbaseSessionCreateParamsSchema
>;

// Type check: ensure our schema-derived type is assignable to the SDK type.
//
// A bare conditional type (`A extends B ? true : never`) never fails to
// compile: when the schema drifts it silently resolves to `never`. Routing the
// check through a generic constraint instead makes the compiler reject the
// alias below ("Type ... does not satisfy the constraint ...") as soon as
// BrowserbaseSessionCreateParams stops being assignable to the SDK type.
type _AssertAssignable<Target, Source extends Target> = Source;
// eslint-disable-next-line @typescript-eslint/no-unused-vars
type _BrowserbaseSessionCreateParamsCheck = _AssertAssignable<
  Browserbase.Sessions.SessionCreateParams,
  BrowserbaseSessionCreateParams
>;

// Per-endpoint types, each inferred from the schema of the same name.

// /sessions/start
export type SessionStartRequest = z.infer<typeof SessionStartRequestSchema>;
export type SessionStartResult = z.infer<typeof SessionStartResultSchema>;
export type SessionStartResponse = z.infer<typeof SessionStartResponseSchema>;

// /sessions/{id}/end
// NOTE(review): SessionEndRequestSchema has no inferred alias here, unlike the
// other endpoints - confirm the omission is intentional.
export type SessionEndResult = z.infer<typeof SessionEndResultSchema>;
export type SessionEndResponse = z.infer<typeof SessionEndResponseSchema>;

// /sessions/{id}/act
export type ActRequest = z.infer<typeof ActRequestSchema>;
export type ActResultData = z.infer<typeof ActResultDataSchema>;
export type ActResult = z.infer<typeof ActResultSchema>;
export type ActResponse = z.infer<typeof ActResponseSchema>;

// /sessions/{id}/extract
export type ExtractRequest = z.infer<typeof ExtractRequestSchema>;
export type ExtractResult = z.infer<typeof ExtractResultSchema>;
export type ExtractResponse = z.infer<typeof ExtractResponseSchema>;

// /sessions/{id}/observe
export type ObserveRequest = z.infer<typeof ObserveRequestSchema>;
export type ObserveResult = z.infer<typeof ObserveResultSchema>;
export type ObserveResponse = z.infer<typeof ObserveResponseSchema>;

// /sessions/{id}/agentExecute
export type AgentAction = z.infer<typeof AgentActionSchema>;
export type AgentUsage = z.infer<typeof AgentUsageSchema>;
export type AgentResultData = z.infer<typeof AgentResultDataSchema>;
export type AgentExecuteRequest = z.infer<typeof AgentExecuteRequestSchema>;
export type AgentExecuteResult = z.infer<typeof AgentExecuteResultSchema>;
export type AgentExecuteResponse = z.infer<typeof AgentExecuteResponseSchema>;

// /sessions/{id}/navigate
export type NavigateRequest = z.infer<typeof NavigateRequestSchema>;
export type NavigateResult = z.infer<typeof NavigateResultSchema>;
export type NavigateResponse = z.infer<typeof NavigateResponseSchema>;

// /sessions/{id}/replay
export type TokenUsage = z.infer<typeof TokenUsageSchema>;
export type ReplayAction = z.infer<typeof ReplayActionSchema>;
export type ReplayPage = z.infer<typeof ReplayPageSchema>;
export type ReplayResult = z.infer<typeof ReplayResultSchema>;
export type ReplayResponse = z.infer<typeof ReplayResponseSchema>;

// SSE Stream Events
export type StreamEventStatus = z.infer<typeof StreamEventStatusSchema>;
export type StreamEventType = z.infer<typeof StreamEventTypeSchema>;
export type StreamEventSystemData = z.infer<typeof StreamEventSystemDataSchema>;
export type StreamEventLogData = z.infer<typeof StreamEventLogDataSchema>;
export type StreamEvent = z.infer<typeof StreamEventSchema>;


================================================
FILE: packages/core/lib/v3/types/public/apiErrors.ts
================================================
/**
 * Base class for errors raised while talking to the Stagehand API.
 *
 * The error's `name` is taken from the constructor of the concrete instance,
 * so subclasses report their own class name without any extra code.
 */
export class StagehandAPIError extends Error {
  /** @param message Human-readable description of the failure. */
  constructor(message: string) {
    super(message);
    const { name: concreteClassName } = this.constructor;
    this.name = concreteClassName;
  }
}

/** API error for unauthorized requests. */
export class StagehandAPIUnauthorizedError extends StagehandAPIError {
  /**
   * @param message Optional override; any falsy value (omitted or an empty
   *   string) falls back to "Unauthorized request".
   */
  constructor(message?: string) {
    super(message ? message : "Unauthorized request");
  }
}

/**
 * API error subtype named for HTTP failures.
 *
 * Adds nothing to the base class; the inherited constructor takes the message
 * and the instance's `name` resolves to "StagehandHttpError".
 */
export class StagehandHttpError extends StagehandAPIError {}

/**
 * API error subtype named for server-side failures.
 *
 * Adds nothing to the base class; the inherited constructor takes the message
 * and the instance's `name` resolves to "StagehandServerError".
 */
export class StagehandServerError extends StagehandAPIError {}

/**
 * API error for a missing response body.
 *
 * Takes no arguments; the message is always "Response body is null".
 */
export class StagehandResponseBodyError extends StagehandAPIError {
  constructor() {
    super("Response body is null");
  }
}

/**
 * API error subtype named for response parsing failures.
 *
 * Adds nothing to the base class; the inherited constructor takes the message
 * and the instance's `name` resolves to "StagehandResponseParseError".
 */
export class StagehandResponseParseError extends StagehandAPIError {}


================================================
FILE: packages/core/lib/v3/types/public/context.ts
================================================
/**
 * A cookie as returned by the browser.
 *
 * Every field is required on this shape (contrast with `CookieParam`, where
 * most are optional).
 */
export interface Cookie {
  name: string;
  value: string;
  domain: string;
  path: string;
  /** Unix time in seconds. -1 means session cookie. */
  expires: number;
  httpOnly: boolean;
  secure: boolean;
  /** One of the three SameSite policies, capitalised exactly as shown. */
  sameSite: "Strict" | "Lax" | "None";
}

/**
 * Parameters for setting a cookie. Provide `url` OR `domain`+`path`, not both.
 *
 * Only `name` and `value` are required by the type; the "url or domain+path"
 * rule is not expressed in the type itself.
 */
export interface CookieParam {
  name: string;
  value: string;
  /** Convenience: if provided, domain/path/secure are derived from this URL. */
  url?: string;
  domain?: string;
  path?: string;
  /** Unix timestamp in seconds. -1 or omitted = session cookie. */
  expires?: number;
  httpOnly?: boolean;
  secure?: boolean;
  sameSite?: "Strict" | "Lax" | "None";
}

/**
 * Filter options for clearing cookies selectively.
 *
 * Each filter is optional and accepts either a string or a RegExp.
 * NOTE(review): presumably strings match exactly and RegExps are tested
 * against the cookie field - confirm against the implementation.
 */
export interface ClearCookieOptions {
  name?: string | RegExp;
  domain?: string | RegExp;
  path?: string | RegExp;
}


================================================
FILE: packages/core/lib/v3/types/public/index.ts
================================================
export * from "./agent.js";
// Export api.ts under namespace to avoid conflicts with methods.ts types
export * as Api from "./api.js";
// Also export BrowserbaseRegion directly for convenience
export type { BrowserbaseRegion } from "./api.js";
export * from "./apiErrors.js";
export * from "./logs.js";
export * from "./methods.js";
export * from "./metrics.js";
export * from "./model.js";
export * from "./options.js";
export * from "./page.js";
export * from "./sdkErrors.js";
export * from "./context.js";
export { AISdkClient } from "../../external_clients/aisdk.js";
export { CustomOpenAIClient } from "../../external_clients/customOpenAI.js";


================================================
FILE: packages/core/lib/v3/types/public/locator.ts
================================================
import { Buffer } from "buffer";

/** Mouse button identifier: one of "left", "right" or "middle". */
export type MouseButton = "left" | "right" | "middle";

/**
 * In-memory description of a file: a required `name` and `buffer`, plus
 * optional `mimeType` and `lastModified`.
 */
export interface SetInputFilePayload {
  name: string;
  mimeType?: string;
  /** File content as binary data (ArrayBuffer, Uint8Array, Buffer) or a string. */
  buffer: ArrayBuffer | Uint8Array | Buffer | string;
  /** NOTE(review): presumably an epoch timestamp; unit not visible here — confirm. */
  lastModified?: number;
}

/**
 * Accepted input shapes: a single string, an array of strings, a single
 * `SetInputFilePayload`, or an array of payloads.
 * NOTE(review): strings are presumably file paths — confirm against the consumer.
 */
export type SetInputFilesArgument =
  | string
  | string[]
  | SetInputFilePayload
  | SetInputFilePayload[];


================================================
FILE: packages/core/lib/v3/types/public/logs.ts
================================================
/** Numeric log level; `LOG_LEVEL_NAMES` maps each value to its name. */
export type LogLevel = 0 | 1 | 2;

/**
 * Mapping between numeric log levels and their names
 *
 * 0 - error/warn - Critical issues or important warnings
 * 1 - info - Standard information messages
 * 2 - debug - Detailed information for debugging
 *
 * Note that level 0 covers both errors and warnings but is named "error" here.
 */
export const LOG_LEVEL_NAMES: Record<LogLevel, string> = {
  0: "error",
  1: "info",
  2: "debug",
};

/**
 * A single structured log record. Only `message` is required.
 */
export type LogLine = {
  id?: string;
  category?: string;
  message: string;
  level?: LogLevel;
  /** NOTE(review): string timestamp; exact format is not visible here — confirm. */
  timestamp?: string;
  /**
   * Extra key/value data. Every value is carried as a string, and `type`
   * names how that string should be interpreted.
   */
  auxiliary?: {
    [key: string]: {
      value: string;
      type: "object" | "string" | "html" | "integer" | "float" | "boolean";
    };
  };
};

/** Callback that receives one `LogLine` and returns nothing. */
export type Logger = (logLine: LogLine) => void;


================================================
FILE: packages/core/lib/v3/types/public/methods.ts
================================================
import { Page as PatchrightPage } from "patchright-core";
import { Page as PlaywrightPage } from "playwright-core";
import { Page as PuppeteerPage } from "puppeteer-core";
import { z } from "zod";
import type {
  InferStagehandSchema,
  StagehandZodSchema,
} from "../../zodCompat.js";
import { Page } from "../../understudy/page.js";
import { ModelConfiguration } from "../public/model.js";
import type { Variables } from "./agent.js";

/** Per-call options for act(). Every field is optional. */
export interface ActOptions {
  /** Model to use, as a model name or a full configuration object. */
  model?: ModelConfiguration;
  variables?: Variables;
  /** NOTE(review): presumably milliseconds — confirm against the handler. */
  timeout?: number;
  /** Target page: a Playwright, Puppeteer or Patchright page, or Stagehand's own `Page`. */
  page?: PlaywrightPage | PuppeteerPage | PatchrightPage | Page;
  /**
   * Override the instance-level serverCache setting for this request.
   * When true, enables server-side caching.
   * When false, disables server-side caching.
   */
  serverCache?: boolean;
}

/** Result shape for act(). */
export interface ActResult {
  success: boolean;
  message: string;
  actionDescription: string;
  actions: Action[];
  /**
   * "HIT" or "MISS" when present.
   * NOTE(review): presumably set from the server cache header, as documented
   * on `ObserveResult` — confirm.
   */
  cacheStatus?: "HIT" | "MISS";
}

/**
 * The type inferred from schema `T`, intersected with an optional
 * `cacheStatus` of "HIT" or "MISS".
 */
export type ExtractResult<T extends StagehandZodSchema> =
  InferStagehandSchema<T> & {
    cacheStatus?: "HIT" | "MISS";
  };

/**
 * A single candidate or executed action: a required `selector` and
 * `description`, plus an optional `method` name and string `arguments`.
 */
export interface Action {
  selector: string;
  description: string;
  method?: string;
  arguments?: string[];
}

/**
 * One recorded call. `parameters` and `result` are typed `unknown`, so
 * readers must narrow them before use.
 */
export interface HistoryEntry {
  /** Which primitive was called. */
  method: "act" | "extract" | "observe" | "navigate" | "agent";
  parameters: unknown;
  result: unknown;
  /** NOTE(review): string timestamp; exact format is not visible here — confirm. */
  timestamp: string;
}

/** Per-call options for extract(). Every field is optional. */
export interface ExtractOptions {
  /** Model to use, as a model name or a full configuration object. */
  model?: ModelConfiguration;
  /** NOTE(review): presumably milliseconds — confirm against the handler. */
  timeout?: number;
  /** NOTE(review): presumably limits extraction to the matched element — confirm. */
  selector?: string;
  /** Target page: a Playwright, Puppeteer or Patchright page, or Stagehand's own `Page`. */
  page?: PlaywrightPage | PuppeteerPage | PatchrightPage | Page;
  /**
   * Override the instance-level serverCache setting for this request.
   * When true, enables server-side caching.
   * When false, disables server-side caching.
   */
  serverCache?: boolean;
}

/** Zod object schema with a single string field, `extraction`. */
export const defaultExtractSchema = z.object({
  extraction: z.string(),
});

/** Zod object schema with a single string field, `pageText`. */
export const pageTextSchema = z.object({
  pageText: z.string(),
});

/** Per-call options for observe(). Every field is optional. */
export interface ObserveOptions {
  /** Model to use, as a model name or a full configuration object. */
  model?: ModelConfiguration;
  /** NOTE(review): presumably milliseconds — confirm against the handler. */
  timeout?: number;
  /** NOTE(review): presumably limits observation to the matched element — confirm. */
  selector?: string;
  /** Target page: a Playwright, Puppeteer or Patchright page, or Stagehand's own `Page`. */
  page?: PlaywrightPage | PuppeteerPage | PatchrightPage | Page;
  /**
   * Override the instance-level serverCache setting for this request.
   * When true, enables server-side caching.
   * When false, disables server-side caching.
   */
  serverCache?: boolean;
}

/**
 * Observe returns an array of candidate actions. The optional `cacheStatus`
 * property is attached when the server responds with a
 * `browserbase-cache-status` header so callers can tell whether the result
 * was served from the server-side cache.
 *
 * Because `cacheStatus` is a property on the array object itself, copying the
 * array (spread, `map`, `filter`, …) produces a plain array without it.
 */
export type ObserveResult = Action[] & { cacheStatus?: "HIT" | "MISS" };

/** String enum of function names; each member's value equals its own name. */
export enum V3FunctionName {
  ACT = "ACT",
  EXTRACT = "EXTRACT",
  OBSERVE = "OBSERVE",
  AGENT = "AGENT",
}


================================================
FILE: packages/core/lib/v3/types/public/metrics.ts
================================================
/**
 * Numeric usage counters, grouped by prefix: `act`, `extract`, `observe`,
 * `agent` and `total`. Each group has the same five fields: prompt,
 * completion, reasoning and cached-input token counts, and an inference time
 * in milliseconds.
 * NOTE(review): the `total*` fields presumably aggregate the four groups — confirm
 * where the metrics are updated.
 */
export interface StagehandMetrics {
  actPromptTokens: number;
  actCompletionTokens: number;
  actReasoningTokens: number;
  actCachedInputTokens: number;
  actInferenceTimeMs: number;
  extractPromptTokens: number;
  extractCompletionTokens: number;
  extractReasoningTokens: number;
  extractCachedInputTokens: number;
  extractInferenceTimeMs: number;
  observePromptTokens: number;
  observeCompletionTokens: number;
  observeReasoningTokens: number;
  observeCachedInputTokens: number;
  observeInferenceTimeMs: number;
  agentPromptTokens: number;
  agentCompletionTokens: number;
  agentReasoningTokens: number;
  agentCachedInputTokens: number;
  agentInferenceTimeMs: number;
  totalPromptTokens: number;
  totalCompletionTokens: number;
  totalReasoningTokens: number;
  totalCachedInputTokens: number;
  totalInferenceTimeMs: number;
}


================================================
FILE: packages/core/lib/v3/types/public/model.ts
================================================
import type { ClientOptions as AnthropicClientOptionsBase } from "@anthropic-ai/sdk";
import type { GoogleVertexProviderSettings as GoogleVertexProviderSettingsBase } from "@ai-sdk/google-vertex";
import type { LanguageModelV2 } from "@ai-sdk/provider";
import type { ClientOptions as OpenAIClientOptionsBase } from "openai";
import type { AgentProviderType } from "./agent.js";

/** The `baseURL` and `apiKey` fields of the OpenAI SDK's `ClientOptions`. */
export type OpenAIClientOptions = Pick<
  OpenAIClientOptionsBase,
  "baseURL" | "apiKey"
>;

/** The `baseURL` and `apiKey` fields of the Anthropic SDK's `ClientOptions`. */
export type AnthropicClientOptions = Pick<
  AnthropicClientOptionsBase,
  "baseURL" | "apiKey"
>;

/**
 * Credential fields, all optional strings, using snake_case key names.
 * NOTE(review): the keys look like those of a Google service-account JSON key
 * file — confirm before relying on that.
 */
export interface GoogleServiceAccountCredentials {
  type?: string;
  project_id?: string;
  private_key_id?: string;
  private_key?: string;
  client_email?: string;
  client_id?: string;
  auth_uri?: string;
  token_uri?: string;
  auth_provider_x509_cert_url?: string;
  client_x509_cert_url?: string;
  universe_domain?: string;
}

/**
 * The `project`, `location` and `headers` fields of the upstream Vertex
 * provider settings, plus an optional `googleAuthOptions.credentials` object.
 */
export type GoogleVertexProviderSettings = Pick<
  GoogleVertexProviderSettingsBase,
  "project" | "location" | "headers"
> & {
  googleAuthOptions?: {
    credentials?: GoogleServiceAccountCredentials;
  };
};

/**
 * Loose JSON-schema-like shape. `properties` and `required` may appear at the
 * top level and/or under `definitions.MySchema`; any other key is allowed
 * with an `unknown` value.
 */
export type AnthropicJsonSchemaObject = {
  definitions?: {
    MySchema?: {
      properties?: Record<string, unknown>;
      required?: string[];
    };
  };
  properties?: Record<string, unknown>;
  required?: string[];
} & Record<string, unknown>;

/**
 * Description of a tool offered to a model. `type` is always "function";
 * `parameters` is an untyped key/value record.
 * NOTE(review): `parameters` is presumably a JSON schema — confirm against the LLM clients.
 */
export interface LLMTool {
  type: "function";
  name: string;
  description: string;
  parameters: Record<string, unknown>;
}

/** Function that maps a model name to a `LanguageModelV2` instance. */
export type AISDKProvider = (modelName: string) => LanguageModelV2;
// Represents a function that takes options (like apiKey) and returns an AISDKProvider
export type AISDKCustomProvider = (options: ClientOptions) => AISDKProvider;

/**
 * Model identifier.
 *
 * The trailing `| string` member means any string is accepted by the type
 * checker; the literal members act as a list of known names rather than a
 * restriction.
 */
export type AvailableModel =
  | "gpt-4.1"
  | "gpt-4.1-mini"
  | "gpt-4.1-nano"
  | "o4-mini"
  | "o3"
  | "o3-mini"
  | "o1"
  | "o1-mini"
  | "gpt-4o"
  | "gpt-4o-mini"
  | "gpt-4o-2024-08-06"
  | "gpt-4.5-preview"
  | "o1-preview"
  | "cerebras-llama-3.3-70b"
  | "cerebras-llama-3.1-8b"
  | "groq-llama-3.3-70b-versatile"
  | "groq-llama-3.3-70b-specdec"
  | "gemini-1.5-flash"
  | "gemini-1.5-pro"
  | "gemini-1.5-flash-8b"
  | "gemini-2.0-flash-lite"
  | "gemini-2.0-flash"
  | "gemini-2.5-flash-preview-04-17"
  | "gemini-2.5-pro-preview-03-25"
  | string;

/** Closed set of provider identifiers (unlike `AvailableModel`, no `string` fallback). */
export type ModelProvider =
  | "openai"
  | "anthropic"
  | "cerebras"
  | "groq"
  | "google"
  | "aisdk";

/**
 * Options passed to a model client: one of the provider-specific option
 * shapes, intersected with a set of optional fields shared by all providers.
 */
export type ClientOptions = (
  | OpenAIClientOptions
  | AnthropicClientOptions
  | GoogleVertexProviderSettings
) & {
  apiKey?: string;
  provider?: AgentProviderType;
  baseURL?: string;
  /** OpenAI organization ID */
  organization?: string;
  /** Delay between agent actions in ms */
  waitBetweenActions?: number;
  /** Anthropic thinking budget for extended thinking */
  thinkingBudget?: number;
  /** Environment type for CUA agents (browser, mac, windows, ubuntu) */
  environment?: string;
  /** Max images for Microsoft FARA agent */
  maxImages?: number;
  /** Temperature for model inference */
  temperature?: number;
  /** Custom headers sent with every request to the provider */
  headers?: Record<string, string>;
};

/**
 * Either a bare model name, or a `ClientOptions` object that also carries a
 * required `modelName`.
 */
export type ModelConfiguration =
  | AvailableModel
  | (ClientOptions & { modelName: AvailableModel });


================================================
FILE: packages/core/lib/v3/types/public/options.ts
================================================
import { z } from "zod";
import { LLMClient } from "../../llm/LLMClient.js";
import { ModelConfiguration } from "./model.js";
import { LogLine } from "./logs.js";
import {
  type BrowserbaseSessionCreateParams,
  LocalBrowserLaunchOptionsSchema,
} from "./api.js";

/** Where the browser runs: "LOCAL" or "BROWSERBASE". */
export type V3Env = "LOCAL" | "BROWSERBASE";

// Re-export for backwards compatibility (camelCase alias)
// This is the same schema object as `LocalBrowserLaunchOptionsSchema`, not a copy.
export const localBrowserLaunchOptionsSchema = LocalBrowserLaunchOptionsSchema;

/** Static type inferred from `LocalBrowserLaunchOptionsSchema`. */
export type LocalBrowserLaunchOptions = z.infer<
  typeof LocalBrowserLaunchOptionsSchema
>;

/**
 * Constructor options for V3.
 *
 * Only `env` is required by the type. The Browserbase fields are marked
 * "required when env = BROWSERBASE" in a comment below, but that rule is not
 * enforced by this interface.
 */
export interface V3Options {
  env: V3Env;
  /**
   * Optional external session identifier to use for flow logging/event storage.
   * When omitted, Stagehand falls back to its internal instance id.
   * This currently ends up 1:1 with the Browserbase session id when one exists,
   * but callers should not rely on that remaining a permanent invariant.
   */
  sessionId?: string;
  // Browserbase (required when env = "BROWSERBASE")
  apiKey?: string;
  projectId?: string;
  /**
   * Optional: fine-tune Browserbase session creation or resume an existing session.
   */
  browserbaseSessionCreateParams?: BrowserbaseSessionCreateParams;
  browserbaseSessionID?: string;
  /**
   * Controls browser keepalive behavior. When set, it overrides any value in
   * browserbaseSessionCreateParams.keepAlive.
   */
  keepAlive?: boolean;

  // Local Chromium (optional)
  localBrowserLaunchOptions?: LocalBrowserLaunchOptions;

  /** Default model, as a model name or a full configuration object. */
  model?: ModelConfiguration;
  llmClient?: LLMClient; // allow user to pass their own
  systemPrompt?: string;
  logInferenceToFile?: boolean;
  experimental?: boolean;
  /** Same value range (0, 1, 2) as the `LogLevel` type in logs.ts. */
  verbose?: 0 | 1 | 2;
  selfHeal?: boolean;
  // V2 compatibility fields - only included because the server imports this type and supports V2
  waitForCaptchaSolves?: boolean;
  actTimeoutMs?: number;
  /** Disable pino logging backend (useful for tests or minimal environments). */
  disablePino?: boolean;
  /** Optional external logger hook for integrating with host apps. */
  logger?: (line: LogLine) => void;
  /** Directory used to persist cached actions for act(). */
  cacheDir?: string;
  /** NOTE(review): presumably milliseconds — confirm against the consumer. */
  domSettleTimeout?: number;
  disableAPI?: boolean;
  /**
   * When true, enables server-side caching for API requests.
   * When false, disables server-side caching.
   * Defaults to true (caching enabled).
   * Can be overridden per-method in act(), extract(), and observe() options.
   */
  serverCache?: boolean;
}


================================================
FILE: packages/core/lib/v3/types/public/page.ts
================================================
import { Page } from "../../understudy/page.js";
import { Page as PlaywrightPage } from "playwright-core";
import { Page as PatchrightPage } from "patchright-core";
import { Page as PuppeteerPage } from "puppeteer-core";

export type { PlaywrightPage, PatchrightPage, PuppeteerPage, Page };
/** Any supported page object: Playwright, Puppeteer, Patchright, or Stagehand's own `Page`. */
export type AnyPage = PlaywrightPage | PuppeteerPage | PatchrightPage | Page;

export { ConsoleMessage } from "../../understudy/consoleMessage.js";
export type { ConsoleListener } from "../../understudy/consoleMessage.js";

/** Page load milestone name: "load", "domcontentloaded" or "networkidle". */
export type LoadState = "load" | "domcontentloaded" | "networkidle";
export { Response } from "../../understudy/response.js";

/**
 * Result of a page snapshot: a formatted tree string plus two string-to-string
 * lookup maps.
 * NOTE(review): the maps are presumably keyed by element id — confirm against
 * the snapshot producer.
 */
export type SnapshotResult = {
  formattedTree: string;
  xpathMap: Record<string, string>;
  urlMap: Record<string, string>;
};

/** Options for taking a page snapshot. */
export type PageSnapshotOptions = {
  /** NOTE(review): default when omitted is not visible here — confirm. */
  includeIframes?: boolean;
};


================================================
FILE: packages/core/lib/v3/types/public/screenshotTypes.ts
================================================
import type { Locator } from "../../understudy/locator.js";

/** Allowed values for `ScreenshotOptions.animations`. */
export type ScreenshotAnimationsOption = "disabled" | "allow";
/** Allowed values for `ScreenshotOptions.caret`. */
export type ScreenshotCaretOption = "hide" | "initial";
/** Allowed values for `ScreenshotOptions.scale`. */
export type ScreenshotScaleOption = "css" | "device";

/**
 * Rectangle given by an origin (`x`, `y`) and a size (`width`, `height`).
 * NOTE(review): units and coordinate space are not visible here — confirm.
 */
export interface ScreenshotClip {
  x: number;
  y: number;
  width: number;
  height: number;
}

/**
 * Options for taking a screenshot. Every field is optional.
 * NOTE(review): defaults and the interaction between fields (for example
 * `clip` with `fullPage`, or `quality` with `type`) are decided by the
 * screenshot implementation — confirm there.
 */
export interface ScreenshotOptions {
  animations?: ScreenshotAnimationsOption;
  caret?: ScreenshotCaretOption;
  clip?: ScreenshotClip;
  fullPage?: boolean;
  /** Locators to mask in the image. */
  mask?: Locator[];
  maskColor?: string;
  omitBackground?: boolean;
  path?: string;
  quality?: number;
  scale?: ScreenshotScaleOption;
  style?: string;
  timeout?: number;
  /** Image format. */
  type?: "png" | "jpeg";
}


================================================
FILE: packages/core/lib/v3/types/public/sdkErrors.ts
================================================
import { ZodError } from "zod";
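// NOTE(review): an earlier note here said to avoid the ".js" extension so bundlers resolve the TS source, but the import below uses ".js" — confirm which is intended.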
import { STAGEHAND_VERSION } from "../../../version.js";

/**
 * Base class for Stagehand SDK errors.
 *
 * `name` is taken from the runtime constructor, so subclasses report their
 * own class name. `cause` is only assigned when a value other than
 * `undefined` is supplied.
 */
export class StagehandError extends Error {
  public readonly cause?: unknown;

  constructor(message: string, cause?: unknown) {
    super(message);
    this.name = this.constructor.name;
    if (cause !== undefined) {
      this.cause = cause;
    }
  }
}

/**
 * Generic wrapper that turns any thrown value into a user-facing error with
 * the Stagehand version and support links in the message.
 *
 * @param error The value that was caught. `Error` instances contribute their
 *   `message`; strings are used as-is; `null`/`undefined` become
 *   "Unknown error"; anything else is JSON-serialised, falling back to
 *   `String(error)` when serialisation fails or yields nothing.
 */
export class StagehandDefaultError extends StagehandError {
  constructor(error?: unknown) {
    // A derived constructor must always reach super(). Previously super() was
    // only called for Error instances, so wrapping a string, a plain object or
    // nothing at all threw a ReferenceError instead of producing this error.
    let detail: string;
    if (error instanceof Error) {
      detail = error.message;
    } else if (typeof error === "string") {
      detail = error;
    } else if (error === undefined || error === null) {
      detail = "Unknown error";
    } else {
      try {
        detail = JSON.stringify(error) ?? String(error);
      } catch {
        // Circular structures, BigInt values, etc.
        detail = String(error);
      }
    }

    super(
      `\nHey! We're sorry you ran into an error. \nStagehand version: ${STAGEHAND_VERSION} \nIf you need help, please open a Github issue or reach out to us on Discord: https://stagehand.dev/discord\n\nFull error:\n${detail}`,
    );
  }
}

/**
 * Error whose message names the current environment, the environment that is
 * required, and the feature that needs it.
 *
 * @param currentEnvironment Environment value interpolated as "current".
 * @param requiredEnvironment Environment value interpolated as "required".
 * @param feature Feature name interpolated at the end of the message.
 */
export class StagehandEnvironmentError extends StagehandError {
  constructor(
    currentEnvironment: string,
    requiredEnvironment: string,
    feature: string,
  ) {
    super(
      // The trailing space keeps the two sentences from running together
      // ("…LOCAL.Ensure…") once the literals are concatenated.
      `You seem to be setting the current environment to ${currentEnvironment}. ` +
        `Ensure the environment is set to ${requiredEnvironment} if you want to use ${feature}.`,
    );
  }
}

/**
 * Error whose message says which environment variable is required for which
 * feature, and asks for it to be set.
 *
 * @param missingEnvironmentVariable Variable name interpolated into the message (twice).
 * @param feature Feature name interpolated into the message.
 */
export class MissingEnvironmentVariableError extends StagehandError {
  constructor(missingEnvironmentVariable: string, feature: string) {
    super(
      // The trailing space keeps the two sentences from running together
      // once the literals are concatenated.
      `${missingEnvironmentVariable} is required to use ${feature}. ` +
        `Please set ${missingEnvironmentVariable} in your environment.`,
    );
  }
}

/**
 * Error explaining that a model is unsupported and pointing at the
 * provider/model naming format and the docs.
 *
 * @param supportedModels Accepted for signature compatibility; it is not used
 *   when building the message.
 * @param feature When truthy, the message starts with
 *   "<feature> requires a valid model." instead of "Unsupported model.".
 */
export class UnsupportedModelError extends StagehandError {
  constructor(supportedModels: string[], feature?: string) {
    let headline: string;
    if (feature) {
      headline = `${feature} requires a valid model.`;
    } else {
      headline = `Unsupported model.`;
    }

    const formatHint = `\n\nPlease use the provider/model format (e.g., "openai/gpt-4o", "anthropic/claude-sonnet-4-5", "google/gemini-3-flash-preview").`;
    const docsHint = `\n\nFor a complete list of supported models and providers, see: https://docs.stagehand.dev/v3/configuration/models#configuration-setup`;

    super(headline + formatHint + docsHint);
  }
}

/**
 * Error listing the supported model providers.
 *
 * @param supportedProviders Interpolated directly into the message, so the
 *   entries appear comma-separated without spaces.
 * @param feature When truthy, the message names the feature that requires
 *   one of the providers.
 */
export class UnsupportedModelProviderError extends StagehandError {
  constructor(supportedProviders: string[], feature?: string) {
    let message: string;
    if (feature) {
      message = `${feature} requires one of the following model providers: ${supportedProviders}`;
    } else {
      message = `please use one of the supported model providers: ${supportedProviders}`;
    }
    super(message);
  }
}

/**
 * Error stating that `provider` is not supported for aiSDK, followed by the
 * list of supported providers (comma-separated without spaces).
 */
export class UnsupportedAISDKModelProviderError extends StagehandError {
  constructor(provider: string, supportedProviders: string[]) {
    const message = `${provider} is not currently supported for aiSDK. please use one of the supported model providers: ${supportedProviders}`;
    super(message);
  }
}

/**
 * Error stating that `modelName` does not follow the 'provider/model-name'
 * format, with an example of a valid value.
 */
export class InvalidAISDKModelFormatError extends StagehandError {
  constructor(modelName: string) {
    const message = `${modelName} does not follow correct format for specifying aiSDK models. Please define your model as 'provider/model-name'. For example: \`model: 'openai/gpt-4o-mini'\``;
    super(message);
  }
}

/**
 * Error telling the caller to run `await stagehand.init()` first.
 *
 * @param prop Name of the member that was accessed; quoted in the message.
 */
export class StagehandNotInitializedError extends StagehandError {
  constructor(prop: string) {
    const whatHappened = `You seem to be calling \`${prop}\` on a page in an uninitialized \`Stagehand\` object. `;
    const howToFix =
      `Ensure you are running \`await stagehand.init()\` on the Stagehand object before ` +
      `referencing the \`page\` object.`;
    super(whatHappened + howToFix);
  }
}

/** Error carrying the fixed message "No Browserbase session ID found". */
export class BrowserbaseSessionNotFoundError extends StagehandError {
  constructor() {
    const message = "No Browserbase session ID found";
    super(message);
  }
}

/** Error carrying the fixed message "Captcha timeout". */
export class CaptchaTimeoutError extends StagehandError {
  constructor() {
    const message = "Captcha timeout";
    super(message);
  }
}

/**
 * Error with a fixed message stating that an LLM API key or a custom LLM
 * client is required to use act, extract, or observe.
 */
export class MissingLLMConfigurationError extends StagehandError {
  constructor() {
    const message =
      "No LLM API key or LLM Client configured. An LLM API key or a custom LLM Client " +
      "is required to use act, extract, or observe.";
    super(message);
  }
}

/** Error with the message "<handlerType> handler not initialized". */
export class HandlerNotInitializedError extends StagehandError {
  constructor(handlerType: string) {
    const message = `${handlerType} handler not initialized`;
    super(message);
  }
}

/** Error whose message is `message` prefixed with "InvalidArgumentError: ". */
export class StagehandInvalidArgumentError extends StagehandError {
  constructor(message: string) {
    const prefixed = `InvalidArgumentError: ${message}`;
    super(prefixed);
  }
}

/**
 * Error subtype that forwards `message` unchanged to `StagehandError`.
 * NOTE(review): presumably raised when cookie parameters fail validation — confirm at call sites.
 */
export class CookieValidationError extends StagehandError {
  constructor(message: string) {
    super(message);
  }
}

/**
 * Error subtype that forwards `message` unchanged to `StagehandError`.
 * NOTE(review): presumably raised when setting a cookie fails — confirm at call sites.
 */
export class CookieSetError extends StagehandError {
  constructor(message: string) {
    super(message);
  }
}

/**
 * Error listing the XPath(s) for which no element was found.
 *
 * @param xpaths Interpolated directly into the message, so the entries appear
 *   comma-separated without spaces.
 */
export class StagehandElementNotFoundError extends StagehandError {
  constructor(xpaths: string[]) {
    const message = `Could not find an element for the given xPath(s): ${xpaths}`;
    super(message);
  }
}

/** Error whose message is `message` prefixed with "ScreenshotProviderError: ". */
export class AgentScreenshotProviderError extends StagehandError {
  constructor(message: string) {
    const prefixed = `ScreenshotProviderError: ${message}`;
    super(prefixed);
  }
}

/** Error whose message is `message` prefixed with "MissingArgumentError: ". */
export class StagehandMissingArgumentError extends StagehandError {
  constructor(message: string) {
    const prefixed = `MissingArgumentError: ${message}`;
    super(prefixed);
  }
}

/** Error whose message is `message` prefixed with "CreateChatCompletionResponseError: ". */
export class CreateChatCompletionResponseError extends StagehandError {
  constructor(message: string) {
    const prefixed = `CreateChatCompletionResponseError: ${message}`;
    super(prefixed);
  }
}

/** Error whose message is `message` prefixed with "StagehandEvalError: ". */
export class StagehandEvalError extends StagehandError {
  constructor(message: string) {
    const prefixed = `StagehandEvalError: ${message}`;
    super(prefixed);
  }
}

/** Error whose message is `message` prefixed with "Error Processing Dom: ". */
export class StagehandDomProcessError extends StagehandError {
  constructor(message: string) {
    const prefixed = `Error Processing Dom: ${message}`;
    super(prefixed);
  }
}

/**
 * Error describing a failed locator action.
 *
 * @param action Verb inserted after "Error " in the message.
 * @param selector Selector the action targeted.
 * @param message Reason text appended after "Reason: ".
 */
export class StagehandLocatorError extends StagehandError {
  constructor(action: string, selector: string, message: string) {
    const text = `Error ${action} Element with selector: ${selector} Reason: ${message}`;
    super(text);
  }
}

/**
 * Error describing a failed click.
 *
 * Note the parameter order: the reason comes first, the selector second.
 *
 * @param message Reason text appended after "Reason: ".
 * @param selector Selector the click targeted.
 */
export class StagehandClickError extends StagehandError {
  constructor(message: string, selector: string) {
    const text = `Error Clicking Element with selector: ${selector} Reason: ${message}`;
    super(text);
  }
}

/** Error with the message "<primitive> LLM response error: <message>". */
export class LLMResponseError extends StagehandError {
  constructor(primitive: string, message: string) {
    const text = `${primitive} LLM response error: ${message}`;
    super(text);
  }
}

/**
 * Error stating that the frameId for an iframe URL could not be resolved.
 *
 * @param frameUrl URL of the iframe, included in the message.
 * @param message Underlying error text appended after "Full error: ".
 */
export class StagehandIframeError extends StagehandError {
  constructor(frameUrl: string, message: string) {
    const text = `Unable to resolve frameId for iframe with URL: ${frameUrl} Full error: ${message}`;
    super(text);
  }
}

/** Error stating that no content frame could be obtained for `selector`. */
export class ContentFrameNotFoundError extends StagehandError {
  constructor(selector: string) {
    const text = `Unable to obtain a content frame for selector: ${selector}`;
    super(text);
  }
}

/** Error stating that `xpath` does not resolve in the current page or frames. */
export class XPathResolutionError extends StagehandError {
  constructor(xpath: string) {
    const text = `XPath "${xpath}" does not resolve in the current page or frames`;
    super(text);
  }
}

/**
 * Error with a fixed message explaining that `experimental` mode and the
 * Stagehand API cannot be combined, and which constructor flags to set for
 * either choice.
 */
export class ExperimentalApiConflictError extends StagehandError {
  constructor() {
    const problem =
      "`experimental` mode cannot be used together with the Stagehand API. ";
    const useExperimental =
      "To use experimental features, set experimental: true and disableAPI: true in the stagehand constructor. ";
    const useApi =
      "To use the Stagehand API, set experimental: false and disableAPI: false (or omit it) in the stagehand constructor.";
    super(problem + useExperimental + useApi);
  }
}

/**
 * Error stating that `featureName` is experimental and cannot be configured
 * while `disableAPI` is false, with instructions for both alternatives.
 *
 * The message is a multi-line template literal, so the line breaks and the
 * leading spaces of its continuation lines are part of the message text.
 */
export class ExperimentalNotConfiguredError extends StagehandError {
  constructor(featureName: string) {
    super(`Feature "${featureName}" is an experimental feature, and cannot be configured when disableAPI: false.
    Please set experimental: true and disableAPI: true in the stagehand constructor to use this feature.
    If you wish to use the Stagehand API, please ensure ${featureName} is not defined in your function call,
    and set experimental: false, disableAPI: false (or omit it) in the Stagehand constructor.`);
  }
}

/**
 * Error asking for a CUA model to be provided.
 *
 * @param availableModels Model names listed in the message, joined with ", ".
 */
export class CuaModelRequiredError extends StagehandError {
  constructor(availableModels: readonly string[]) {
    const request = `To use the computer use agent (CUA), please provide a CUA model in the agent constructor or stagehand config. `;
    const suggestion = `Try one of our supported CUA models: ${availableModels.join(", ")}`;
    super(request + suggestion);
  }
}

/**
 * Error raised for a failed Zod schema validation.
 *
 * Extends `Error` directly. The message embeds both the received value and
 * the formatted issues as pretty-printed JSON (2-space indent); both are also
 * kept on the instance as `received` and `issues`.
 */
export class ZodSchemaValidationError extends Error {
  public readonly received: unknown;
  public readonly issues: ReturnType<ZodError["format"]>;

  constructor(received: unknown, issues: ReturnType<ZodError["format"]>) {
    super(`Zod schema validation failed

— Received —
${JSON.stringify(received, null, 2)}

— Issues —
${JSON.stringify(issues, null, 2)}`);
    this.received = received;
    this.issues = issues;
    this.name = "ZodSchemaValidationError";
  }
}

/**
 * Error subtype that forwards `message` unchanged to `StagehandError`.
 * NOTE(review): presumably raised when initialization fails — confirm at call sites.
 */
export class StagehandInitError extends StagehandError {
  constructor(message: string) {
    super(message);
  }
}

/**
 * Error for a failed connection to an MCP server.
 *
 * The message includes the server URL and the text of the underlying failure.
 * The underlying value is available both as `originalError` and, when it is
 * not `undefined`, as the `cause` inherited from `StagehandError`, so it
 * shows up in cause chains.
 *
 * @param serverUrl URL of the server, quoted in the message.
 * @param originalError The value that was caught; `Error` instances
 *   contribute their `message`, anything else is converted with `String()`.
 */
export class MCPConnectionError extends StagehandError {
  public readonly serverUrl: string;
  public readonly originalError: unknown;

  constructor(serverUrl: string, originalError: unknown) {
    const errorMessage =
      originalError instanceof Error
        ? originalError.message
        : String(originalError);

    super(
      `Failed to connect to MCP server at "${serverUrl}". ${errorMessage}. ` +
        `Please verify the server URL is correct and the server is running.`,
      // Pass the wrapped value as `cause`, as other wrapping errors in this
      // file do.
      originalError,
    );

    this.serverUrl = serverUrl;
    this.originalError = originalError;
  }
}

/**
 * Error stating that the resolved host has no shadow root.
 *
 * @param detail When truthy, appended to the message after ": ".
 */
export class StagehandShadowRootMissingError extends StagehandError {
  constructor(detail?: string) {
    let message = `No shadow root present on the resolved host`;
    if (detail) {
      message += `: ${detail}`;
    }
    super(message);
  }
}

/** Error with a fixed message about an empty selector segment after a shadow-DOM hop ("//"). */
export class StagehandShadowSegmentEmptyError extends StagehandError {
  constructor() {
    const message = `Empty selector segment after shadow-DOM hop ("//")`;
    super(message);
  }
}

/**
 * Error stating that a shadow segment matched nothing inside the shadow root.
 *
 * @param segment Segment text, quoted in the message.
 * @param hint When truthy, appended to the message after a single space.
 */
export class StagehandShadowSegmentNotFoundError extends StagehandError {
  constructor(segment: string, hint?: string) {
    let message = `Shadow segment '${segment}' matched no element inside shadow root`;
    if (hint) {
      message += ` ${hint}`;
    }
    super(message);
  }
}

/** Error with the message "Element not visible (no box model): <selector>". */
export class ElementNotVisibleError extends StagehandError {
  constructor(selector: string) {
    const message = `Element not visible (no box model): ${selector}`;
    super(message);
  }
}

/** Error whose message is `message` prefixed with "Failed to retrieve response body: ". */
export class ResponseBodyError extends StagehandError {
  constructor(message: string) {
    const prefixed = `Failed to retrieve response body: ${message}`;
    super(prefixed);
  }
}

/** Error whose message is `message` prefixed with "Failed to parse response: ". */
export class ResponseParseError extends StagehandError {
  constructor(message: string) {
    const prefixed = `Failed to parse response: ${message}`;
    super(prefixed);
  }
}

/**
 * Error with the message "<operation> timed out after <timeoutMs>ms".
 *
 * @param operation Label of the operation that timed out.
 * @param timeoutMs Timeout in milliseconds, as printed in the message.
 */
export class TimeoutError extends StagehandError {
  constructor(operation: string, timeoutMs: number) {
    const message = `${operation} timed out after ${timeoutMs}ms`;
    super(message);
  }
}

/** `TimeoutError` for the "act()" operation; `name` is set explicitly to "ActTimeoutError". */
export class ActTimeoutError extends TimeoutError {
  constructor(timeoutMs: number) {
    const operation = "act()";
    super(operation, timeoutMs);
    this.name = "ActTimeoutError";
  }
}

/** `TimeoutError` for the "extract()" operation; `name` is set explicitly to "ExtractTimeoutError". */
export class ExtractTimeoutError extends TimeoutError {
  constructor(timeoutMs: number) {
    const operation = "extract()";
    super(operation, timeoutMs);
    this.name = "ExtractTimeoutError";
  }
}

/** `TimeoutError` for the "observe()" operation; `name` is set explicitly to "ObserveTimeoutError". */
export class ObserveTimeoutError extends TimeoutError {
  constructor(timeoutMs: number) {
    const operation = "observe()";
    super(operation, timeoutMs);
    this.name = "ObserveTimeoutError";
  }
}

/** Error with the message "No Page found for <identifier>". */
export class PageNotFoundError extends StagehandError {
  constructor(identifier: string) {
    const message = `No Page found for ${identifier}`;
    super(message);
  }
}

/** Error whose message is `message` prefixed with "Connection timeout: ". */
export class ConnectionTimeoutError extends StagehandError {
  constructor(message: string) {
    const prefixed = `Connection timeout: ${message}`;
    super(prefixed);
  }
}

/**
 * Error stating that streaming-only callbacks were supplied in non-streaming
 * mode.
 *
 * The callback names are listed in the message, each in double quotes, and
 * are also kept on the instance as `invalidCallbacks`.
 */
export class StreamingCallbacksInNonStreamingModeError extends StagehandError {
  public readonly invalidCallbacks: string[];

  constructor(invalidCallbacks: string[]) {
    const problem = `Streaming-only callback(s) "${invalidCallbacks.join('", "')}" cannot be used in non-streaming mode. `;
    const remedy = `Set 'stream: true' in AgentConfig to use these callbacks.`;
    super(problem + remedy);
    this.invalidCallbacks = invalidCallbacks;
  }
}

/**
 * Error for an aborted agent execution.
 *
 * @param reason When truthy, appended to the message and stored as `reason`.
 *   Otherwise the message has no suffix and `reason` is "aborted".
 */
export class AgentAbortError extends StagehandError {
  public readonly reason: string;

  constructor(reason?: string) {
    let message = "Agent execution was aborted";
    if (reason) {
      message = `Agent execution was aborted: ${reason}`;
    }
    super(message);
    this.reason = reason ? reason : "aborted";
  }
}

/** Error carrying the fixed message "Stagehand session was closed". */
export class StagehandClosedError extends StagehandError {
  constructor() {
    const message = "Stagehand session was closed";
    super(message);
  }
}

/** Error whose message is `reason` prefixed with "CDP connection closed: ". */
export class CdpConnectionClosedError extends StagehandError {
  constructor(reason: string) {
    const message = `CDP connection closed: ${reason}`;
    super(message);
  }
}

/**
 * Error reporting that `setExtraHTTPHeaders` failed for one or more sessions.
 *
 * The message states the number of failures and lists them joined with ", ";
 * the same array is kept on the instance as `failures`.
 */
export class StagehandSetExtraHTTPHeadersError extends StagehandError {
  public readonly failures: string[];

  constructor(failures: string[]) {
    const message = `setExtraHTTPHeaders failed for ${failures.length} session(s): ${failures.join(", ")}`;
    super(message);
    this.failures = failures;
  }
}

/**
 * Error for a failed snapshot.
 *
 * The message is "error taking snapshot", followed by ": <detail>" when
 * `cause` is an `Error` (its `message`) or any other truthy value
 * (`String(cause)`). `cause` is also forwarded to `StagehandError`.
 */
export class StagehandSnapshotError extends StagehandError {
  constructor(cause?: unknown) {
    let suffix = "";
    if (cause instanceof Error) {
      suffix = `: ${cause.message}`;
    } else if (cause) {
      suffix = `: ${String(cause)}`;
    }
    super(`error taking snapshot${suffix}`, cause);
  }
}

/**
 * Error subtype that forwards `message` and `cause` unchanged to
 * `StagehandError` and sets `name` explicitly to "UnderstudyCommandException".
 */
export class UnderstudyCommandException extends StagehandError {
  constructor(message: string, cause?: unknown) {
    super(message, cause);
    this.name = "UnderstudyCommandException";
  }
}


================================================
FILE: packages/core/lib/v3/understudy/a11y/snapshot/a11yTree.ts
================================================
import type { Protocol } from "devtools-protocol";
import type { CDPSessionLike } from "../../cdp.js";
import type {
  A11yNode,
  A11yOptions,
  AccessibilityTreeResult,
} from "../../../types/private/snapshot.js";
import {
  resolveObjectIdForCss,
  resolveObjectIdForXPath,
} from "./focusSelectors.js";
import { formatTreeLine, normaliseSpaces } from "./treeFormatUtils.js";

/**
 * Fetch and prune the accessibility tree for a frame, optionally scoping the
 * output to a selector root for faster targeted snapshots.
 *
 * Steps:
 *  1. Enable the Accessibility, Runtime and DOM domains (failures ignored).
 *  2. Call `Accessibility.getFullAXTree`, passing `frameId` when given. If
 *     that fails with a frame-scope error, retry once without `frameId`.
 *  3. Build `urlMap` from every node that has a numeric backend node id and a
 *     URL, keyed by `opts.encode(backendDOMNodeId)`.
 *  4. If `opts.focusSelector` resolves to a node present in the tree, keep
 *     only that node and its descendants, and detach it from its parent.
 *  5. Decorate roles, build the hierarchy and format it as an outline.
 *
 * @param session CDP session used for all protocol calls.
 * @param frameId Frame to scope the tree to; `undefined` for no scoping.
 * @param opts Encoding function, lookup maps and optional `focusSelector`.
 * @returns The outline text, the URL map, and `scopeApplied`, which is true
 *   when the focus selector's node was found in the tree.
 * @throws Rethrows a `getFullAXTree` failure that is not a frame-scope error,
 *   or any such failure when no `frameId` was given.
 */
export async function a11yForFrame(
  session: CDPSessionLike,
  frameId: string | undefined,
  opts: A11yOptions,
): Promise<AccessibilityTreeResult> {
  // Best-effort: a failure to enable a domain is ignored.
  await session.send("Accessibility.enable").catch(() => {});
  await session.send("Runtime.enable").catch(() => {});
  await session.send("DOM.enable").catch(() => {});

  let nodes: Protocol.Accessibility.AXNode[] = [];
  try {
    const params = frameId ? ({ frameId } as Record<string, unknown>) : {};
    ({ nodes } = await session.send<{
      nodes: Protocol.Accessibility.AXNode[];
    }>("Accessibility.getFullAXTree", params));
  } catch (e) {
    const msg = String((e as Error)?.message ?? e ?? "");
    const isFrameScopeError =
      msg.includes("Frame with the given") ||
      msg.includes("does not belong to the target") ||
      msg.includes("is not found");
    if (!isFrameScopeError || !frameId) throw e;
    // The frame could not be addressed on this session: retry unscoped.
    ({ nodes } = await session.send<{
      nodes: Protocol.Accessibility.AXNode[];
    }>("Accessibility.getFullAXTree"));
  }

  const urlMap: Record<string, string> = {};
  for (const n of nodes) {
    const be = n.backendDOMNodeId;
    if (typeof be !== "number") continue;
    const url = extractUrlFromAXNode(n);
    if (!url) continue;
    const enc = opts.encode(be);
    urlMap[enc] = url;
  }

  let scopeApplied = false;
  const nodesForOutline = await (async () => {
    const sel = opts.focusSelector?.trim();
    if (!sel) return nodes;
    // Any failure while resolving the selector falls back to the full tree.
    try {
      const looksLikeXPath = /^xpath=/i.test(sel) || sel.startsWith("/");
      const objectId = looksLikeXPath
        ? await resolveObjectIdForXPath(session, sel, frameId)
        : await resolveObjectIdForCss(session, sel, frameId);
      if (!objectId) return nodes;
      const desc = await session.send<{ node?: { backendNodeId?: number } }>(
        "DOM.describeNode",
        { objectId },
      );
      const be = desc.node?.backendNodeId;
      if (typeof be !== "number") return nodes;
      const target = nodes.find((n) => n.backendDOMNodeId === be);
      if (!target) return nodes;
      scopeApplied = true;

      // Index nodes by id once so the subtree walk is linear instead of
      // rescanning `nodes` for every child id. The first occurrence of an id
      // wins, which matches what a linear `find` would return.
      const byId = new Map<string, Protocol.Accessibility.AXNode>();
      for (const n of nodes) {
        if (!byId.has(n.nodeId)) byId.set(n.nodeId, n);
      }

      // Breadth-first walk from the target. A cursor is advanced over the
      // queue instead of calling `shift()`, which is linear per call.
      const keep = new Set<string>([target.nodeId]);
      const queue: Protocol.Accessibility.AXNode[] = [target];
      for (let head = 0; head < queue.length; head++) {
        const cur = queue[head]!;
        for (const id of cur.childIds ?? []) {
          if (keep.has(id)) continue;
          keep.add(id);
          const child = byId.get(id);
          if (child) queue.push(child);
        }
      }

      // Keep document order, and make the target a root by dropping its parent link.
      return nodes
        .filter((n) => keep.has(n.nodeId))
        .map((n) =>
          n.nodeId === target.nodeId ? { ...n, parentId: undefined } : n,
        );
    } catch {
      return nodes;
    }
  })();

  const decorated = decorateRoles(nodesForOutline, opts);
  const { tree } = await buildHierarchicalTree(decorated, opts);

  const simplified = tree.map((n) => formatTreeLine(n)).join("\n");
  return { outline: simplified.trimEnd(), urlMap, scopeApplied };
}

/**
 * Convert raw AX nodes into `A11yNode`s, attaching an encoded id and marking
 * scrollable elements in the role text.
 *
 * For each node:
 *  - `encodedId` is `opts.encode(backendDOMNodeId)` when the backend id is a
 *    number; if `encode` throws, `encodedId` stays `undefined`.
 *  - The role becomes "scrollable, <tag>" when the node is flagged in
 *    `opts.scrollableMap` or its tag is "html", unless the tag is
 *    "#document". A leading "#" is stripped from the tag. With no usable tag
 *    the role is "scrollable, <role>", or just "scrollable" if the role is empty.
 *
 * @param nodes Raw accessibility nodes.
 * @param opts Provides `encode`, `scrollableMap` and `tagNameMap`.
 * @returns One `A11yNode` per input node, in the same order.
 */
export function decorateRoles(
  nodes: Protocol.Accessibility.AXNode[],
  opts: A11yOptions,
): A11yNode[] {
  const decorated: A11yNode[] = [];

  for (const axNode of nodes) {
    const backendId = axNode.backendDOMNodeId;

    let encodedId: string | undefined;
    if (typeof backendId === "number") {
      try {
        encodedId = opts.encode(backendId);
      } catch {
        // Encoding is best-effort: leave encodedId undefined on failure.
      }
    }

    let role = String(axNode.role?.value ?? "");

    const domIsScrollable = encodedId
      ? opts.scrollableMap[encodedId] === true
      : false;
    const tag = encodedId ? opts.tagNameMap[encodedId] : undefined;

    const shouldMark =
      tag !== "#document" && (domIsScrollable || tag === "html");
    if (shouldMark) {
      const tagLabel = tag && tag.startsWith("#") ? tag.slice(1) : tag;
      if (tagLabel) {
        role = `scrollable, ${tagLabel}`;
      } else if (role) {
        role = `scrollable, ${role}`;
      } else {
        role = "scrollable";
      }
    }

    decorated.push({
      role,
      name: axNode.name?.value,
      description: axNode.description?.value,
      value: axNode.value?.value,
      nodeId: axNode.nodeId,
      backendDOMNodeId: backendId,
      parentId: axNode.parentId,
      childIds: axNode.childIds,
      encodedId,
    });
  }

  return decorated;
}

/**
 * Assemble a flat list of decorated accessibility nodes into a pruned tree.
 *
 * 1. Keep a copy of every node that has a non-blank name, declares child ids,
 *    or has a non-structural role.
 * 2. Attach each kept node to its kept parent (in input order).
 * 3. Starting from kept nodes without a parent, prune recursively:
 *    - nodes with a negative numeric nodeId are dropped;
 *    - structural leaves are dropped;
 *    - structural nodes with exactly one surviving child collapse into it,
 *      and with none are dropped;
 *    - `generic`/`none` roles are replaced by the DOM tag name when known,
 *      and a `combobox` backed by a `<select>` is labelled `select`.
 *
 * @param nodes Decorated nodes for a single frame.
 * @param opts  Supplies `tagNameMap`, keyed by encoded id.
 * @returns The surviving root nodes wrapped as `{ tree }`.
 */
export async function buildHierarchicalTree(
  nodes: A11yNode[],
  opts: A11yOptions,
): Promise<{ tree: A11yNode[] }> {
  // Pass 1: shallow-copy every node worth keeping, indexed by nodeId.
  const byId = new Map<string, A11yNode>();
  for (const candidate of nodes) {
    const named = Boolean(candidate.name && candidate.name.trim());
    const declaresChildren = Boolean(
      candidate.childIds && candidate.childIds.length,
    );
    if (named || declaresChildren || !isStructural(candidate.role)) {
      byId.set(candidate.nodeId, { ...candidate });
    }
  }

  // Pass 2: wire kept copies under their kept parents.
  for (const original of nodes) {
    if (!original.parentId) continue;
    const parentCopy = byId.get(original.parentId);
    const selfCopy = byId.get(original.nodeId);
    if (!parentCopy || !selfCopy) continue;
    if (!parentCopy.children) parentCopy.children = [];
    parentCopy.children.push(selfCopy);
  }

  // Recursive pruning; returns null when the node should disappear.
  const prune = async (node: A11yNode): Promise<A11yNode | null> => {
    if (Number(node.nodeId) < 0) return null;

    const kids = node.children ?? [];
    if (kids.length === 0) {
      return isStructural(node.role) ? null : node;
    }

    const prunedKids = await Promise.all(kids.map((kid) => prune(kid)));
    const survivingKids = prunedKids.filter(
      (kid): kid is A11yNode => Boolean(kid),
    );
    const keptKids = removeRedundantStaticTextChildren(node, survivingKids);

    if (isStructural(node.role)) {
      // A structural wrapper adds nothing: hoist its only child or vanish.
      if (keptKids.length === 1) return keptKids[0]!;
      if (keptKids.length === 0) return null;
    }

    const tagName = node.encodedId
      ? opts.tagNameMap[node.encodedId]
      : undefined;
    let role = node.role;
    if ((role === "generic" || role === "none") && tagName) {
      role = tagName;
    }
    if (role === "combobox" && tagName === "select") {
      role = "select";
    }

    return { ...node, role, children: keptKids };
  };

  const roots: A11yNode[] = [];
  for (const original of nodes) {
    if (original.parentId) continue;
    const rootCopy = byId.get(original.nodeId);
    if (rootCopy) roots.push(rootCopy);
  }

  const prunedRoots = await Promise.all(roots.map((root) => prune(root)));
  const tree = prunedRoots.filter((root): root is A11yNode => Boolean(root));
  return { tree };
}

/**
 * Report whether a role is purely structural, i.e. `generic`, `none` or
 * `inlinetextbox`, compared case-insensitively. A missing role is not
 * structural.
 */
export function isStructural(role: string): boolean {
  switch (role?.toLowerCase()) {
    case "generic":
    case "none":
    case "inlinetextbox":
      return true;
    default:
      return false;
  }
}

/**
 * Read the `url` property of an accessibility node.
 *
 * Only the first property named `url` is considered. Its value is returned
 * trimmed; a non-string or blank value yields `undefined`.
 */
export function extractUrlFromAXNode(
  ax: Protocol.Accessibility.AXNode,
): string | undefined {
  for (const prop of ax.properties ?? []) {
    if (prop.name !== "url") continue;
    const raw = prop.value?.value;
    if (typeof raw !== "string") return undefined;
    const trimmed = raw.trim();
    return trimmed ? trimmed : undefined;
  }
  return undefined;
}

/**
 * Drop `StaticText` children that merely repeat their parent's name.
 *
 * The names of all named `StaticText` children are space-normalised, trimmed
 * and concatenated (no separator). When the result equals the parent's
 * normalised name, every `StaticText` child is removed; otherwise the list is
 * returned untouched. A parent without a name never triggers removal.
 */
export function removeRedundantStaticTextChildren(
  parent: A11yNode,
  children: A11yNode[],
): A11yNode[] {
  if (!parent.name) return children;

  const parentText = normaliseSpaces(parent.name).trim();
  const childText = children.reduce(
    (acc, child) =>
      child.role === "StaticText" && child.name
        ? acc + normaliseSpaces(child.name).trim()
        : acc,
    "",
  );

  return childText === parentText
    ? children.filter((child) => child.role !== "StaticText")
    : children;
}


================================================
FILE: packages/core/lib/v3/understudy/a11y/snapshot/activeElement.ts
================================================
import type { Protocol } from "devtools-protocol";
import { Page } from "../../page.js";
import { executionContexts } from "../../executionContextRegistry.js";
import { buildA11yInvocation } from "../../a11yInvocation.js";
import { a11yScriptSources } from "../../../dom/build/a11yScripts.generated.js";
import {
  absoluteXPathForBackendNode,
  normalizeXPath,
  prefixXPath,
} from "./xpathUtils.js";

/**
 * Compute the absolute XPath for the currently focused element.
 * - Detects which frame has focus by evaluating the `documentHasFocusStrict`
 *   helper in each frame; falls back to the main frame when none reports focus.
 * - Resolves the deepest active element in that frame via the
 *   `resolveDeepActiveElement` helper.
 * - Builds an absolute, cross-frame XPath by prefixing the XPath of every
 *   hosting iframe element, ordered from the outermost frame to the innermost.
 *
 * @param page Page whose focused element should be located.
 * @returns The cross-frame XPath, or `null` when no active element or XPath
 *          could be resolved.
 */
export async function computeActiveElementXpath(
  page: Page,
): Promise<string | null> {
  // Index frameId → parent frameId (null for the root).
  const tree = page.getFullFrameTree();
  const parentByFrame = new Map<string, string | null>();
  (function index(n: Protocol.Page.FrameTree, parent: string | null) {
    parentByFrame.set(n.frame.id, parent);
    for (const c of n.childFrames ?? []) index(c, n.frame.id);
  })(tree, null);

  // Probe frames one at a time; the first frame reporting focus wins.
  const frames = page.listAllFrameIds();
  let focusedFrameId: string | null = null;
  for (const fid of frames) {
    const sess = page.getSessionForFrame(fid);
    try {
      await sess.send("Runtime.enable").catch(() => {});
      const ctxId = await executionContexts
        .waitForMainWorld(sess, fid, 1000)
        .catch(() => {});
      const hasFocusExpr = buildA11yInvocation("documentHasFocusStrict", []);
      const evalParams = ctxId
        ? {
            contextId: ctxId,
            expression: hasFocusExpr,
            returnByValue: true,
          }
        : { expression: hasFocusExpr, returnByValue: true };
      const { result } = await sess.send<Protocol.Runtime.EvaluateResponse>(
        "Runtime.evaluate",
        evalParams,
      );
      if (result?.value === true) {
        focusedFrameId = fid;
        break;
      }
    } catch {
      // Frame could not be probed; try the next one.
    }
  }
  if (!focusedFrameId) focusedFrameId = page.mainFrameId();
  const focusedSession = page.getSessionForFrame(focusedFrameId);

  // Obtain a remote object handle for the deepest active element.
  let objectId: string | undefined;
  try {
    await focusedSession.send("Runtime.enable").catch(() => {});
    const ctxId = await executionContexts
      .waitForMainWorld(focusedSession, focusedFrameId, 1000)
      .catch(() => {});
    const activeExpr = buildA11yInvocation("resolveDeepActiveElement", []);
    const evalParams = ctxId
      ? {
          contextId: ctxId,
          expression: activeExpr,
          returnByValue: false,
        }
      : { expression: activeExpr, returnByValue: false };
    const { result } =
      await focusedSession.send<Protocol.Runtime.EvaluateResponse>(
        "Runtime.evaluate",
        evalParams,
      );
    objectId = result?.objectId as string | undefined;
  } catch {
    objectId = undefined;
  }
  if (!objectId) return null;

  // XPath of the element inside its own frame. The remote handle is released
  // on both the success and the failure path.
  const leafXPath = await (async () => {
    try {
      const { result } = await focusedSession.send<{
        result: { value?: string };
      }>("Runtime.callFunctionOn", {
        objectId,
        functionDeclaration: a11yScriptSources.nodeToAbsoluteXPath,
        returnByValue: true,
      });
      const xp = result?.value || "";
      return typeof xp === "string" && xp ? xp : null;
    } catch {
      return null;
    } finally {
      try {
        await focusedSession.send("Runtime.releaseObject", { objectId });
      } catch {
        // Releasing is best-effort.
      }
    }
  })();

  if (!leafXPath) return null;

  // Walk from the focused frame up to the root, collecting the XPath of each
  // hosting iframe element. The walk visits the innermost host first, so each
  // host is prepended to keep the list ordered outermost → innermost.
  const hostXPaths: string[] = [];
  let cur: string | null | undefined = focusedFrameId;
  while (cur) {
    const parent = parentByFrame.get(cur) ?? null;
    if (!parent) break;
    const parentSess = page.getSessionForFrame(parent);
    try {
      const { backendNodeId } = await parentSess.send<{
        backendNodeId?: number;
      }>("DOM.getFrameOwner", { frameId: cur });
      if (typeof backendNodeId === "number") {
        const xp = await absoluteXPathForBackendNode(parentSess, backendNodeId);
        if (xp) hostXPaths.unshift(xp);
      }
    } catch {
      // Owner lookup failed for this hop; skip it and keep climbing.
    }
    cur = parent;
  }

  // Fold the hosts outer-first so each inner host is appended to the path of
  // the frames that contain it (prefixXPath takes the parent path first).
  let prefix = "";
  for (const xp of hostXPaths) {
    prefix = prefix ? prefixXPath(prefix, xp) : normalizeXPath(xp);
  }

  return prefix ? prefixXPath(prefix, leafXPath) : normalizeXPath(leafXPath);
}


================================================
FILE: packages/core/lib/v3/understudy/a11y/snapshot/capture.ts
================================================
import type { Protocol } from "devtools-protocol";
import type { CDPSessionLike } from "../../cdp.js";
import { Page } from "../../page.js";
import { v3Logger } from "../../../logger.js";
import type {
  FrameContext,
  FrameDomMaps,
  FrameParentIndex,
  HybridSnapshot,
  SnapshotOptions,
  SessionDomIndex,
} from "../../../types/private/index.js";
import { a11yForFrame } from "./a11yTree.js";
import {
  resolveCssFocusFrameAndTail,
  resolveFocusFrameAndTail,
} from "./focusSelectors.js";
import {
  buildSessionDomIndex,
  domMapsForSession,
  relativizeXPath,
} from "./domTree.js";
import { injectSubtrees } from "./treeFormatUtils.js";
import { ownerSession, parentSession } from "./sessions.js";
import { normalizeXPath, prefixXPath } from "./xpathUtils.js";

/**
 * Capture a hybrid DOM + Accessibility snapshot for the provided page.
 *
 * Flow overview:
 * 1. (Optional) Scope directly to a requested selector. We walk iframe hops to
 *    find the owning frame, build just that frame’s DOM + AX tree, and bail out
 *    early when the subtree satisfies the caller.
 * 2. Build DOM indexes for every unique CDP session. DOM.getDocument is called
 *    once per session and hydrated so per-frame slices can share the result.
 * 3. Slice each frame’s DOM data from its session index and fetch its AX tree.
 *    This yields relative XPath/tag/url maps for the document rooted at that frame.
 * 4. Walk the frame tree to compute absolute iframe prefixes. Every child frame
 *    needs the XPath of the iframe element that hosts it so we can prefix maps.
 * 5. Merge all per-frame results into global combined maps and stitch the text
 *    outline. The final payload mirrors the legacy shape but is built in layers.
 *
 * Each numbered block below references the step above for easier debugging.
 */
export async function captureHybridSnapshot(
  page: Page,
  options?: SnapshotOptions,
): Promise<HybridSnapshot> {
  const pierce = options?.pierceShadow ?? true;
  const includeIframes = options?.includeIframes !== false;

  const context = buildFrameContext(page);

  // Step 1: scoped fast-path; returns early when the selector could be applied.
  const scoped = await tryScopedSnapshot(page, options, context, pierce);
  if (scoped) return scoped;

  // The root frame is always in scope and goes first if it was not listed.
  const candidateFrames = includeIframes ? context.frames : [];
  const framesInScope = candidateFrames.includes(context.rootId)
    ? [...candidateFrames]
    : [context.rootId, ...candidateFrames];

  // Step 2: one DOM index per unique CDP session.
  const sessionToIndex = await buildSessionIndexes(page, framesInScope, pierce);

  // Step 3: per-frame DOM maps and accessibility outlines.
  const perFrame = await collectPerFrameMaps(
    page,
    context,
    sessionToIndex,
    options,
    pierce,
    framesInScope,
  );

  // Step 4: absolute iframe prefixes for every frame.
  const prefixes = await computeFramePrefixes(
    page,
    context,
    perFrame.perFrameMaps,
    framesInScope,
  );

  // Step 5: merge everything into the combined snapshot.
  return mergeFramesIntoSnapshot(
    context,
    perFrame.perFrameMaps,
    perFrame.perFrameOutlines,
    prefixes.absPrefix,
    prefixes.iframeHostEncByChild,
    framesInScope,
  );
}

/**
 * Capture the page's frame topology once so later steps can work from a
 * consistent view instead of re-querying the page.
 *
 * @returns The main frame id, a frameId → parent frameId map (the root maps
 *          to `null`), and the list of all frame ids reported by the page.
 */
export function buildFrameContext(page: Page): FrameContext {
  const rootId = page.mainFrameId();
  const frameTree = page.asProtocolFrameTree(rootId);

  const parentByFrame: FrameParentIndex = new Map();
  // Pre-order walk: a frame is recorded before any of its descendants.
  const record = (
    node: Protocol.Page.FrameTree,
    parentId: string | null,
  ): void => {
    parentByFrame.set(node.frame.id, parentId);
    (node.childFrames ?? []).forEach((child) => record(child, node.frame.id));
  };
  record(frameTree, null);

  const frames = page.listAllFrameIds();
  return { rootId, parentByFrame, frames };
}

/**
 * Step 1 – scoped snapshot fast-path. When a focus selector is supplied:
 *  1) resolve it (XPath or CSS) to the frame that owns the match;
 *  2) build DOM maps and the accessibility outline for that frame only;
 *  3) return the single-frame snapshot if the outline was actually scoped.
 *
 * Returns `null` when no selector was given, when resolution or capture
 * throws, or when scoping was not applied, so the caller can fall back to the
 * full multi-frame snapshot. The two failure cases also log a fallback notice.
 */
export async function tryScopedSnapshot(
  page: Page,
  options: SnapshotOptions | undefined,
  context: FrameContext,
  pierce: boolean,
): Promise<HybridSnapshot | null> {
  const requestedFocus = options?.focusSelector?.trim();
  if (!requestedFocus) return null;

  const logScopeFallback = (): void => {
    v3Logger({
      message: `Unable to narrow scope with selector. Falling back to using full DOM`,
      level: 1,
      auxiliary: {
        arguments: {
          value: `selector: ${requestedFocus}`,
          type: "string",
        },
      },
    });
  };

  // Frame-aware encoded id: "<frame ordinal>-<backendNodeId>".
  const encodeFor = (frameId: string, backendNodeId: number): string =>
    `${page.getOrdinal(frameId)}-${backendNodeId}`;

  // Resolve the selector to its owning frame, in-frame tail and iframe prefix.
  const locateTarget = async (): Promise<{
    targetFrameId: string;
    tailSelector: string | undefined;
    absPrefix: string | undefined;
  }> => {
    const isXPath =
      /^xpath=/i.test(requestedFocus) || requestedFocus.startsWith("/");
    if (isXPath) {
      const xpathHit = await resolveFocusFrameAndTail(
        page,
        normalizeXPath(requestedFocus),
        context.parentByFrame,
        context.rootId,
      );
      return {
        targetFrameId: xpathHit.targetFrameId,
        tailSelector: xpathHit.tailXPath || undefined,
        absPrefix: xpathHit.absPrefix,
      };
    }
    const cssHit = await resolveCssFocusFrameAndTail(
      page,
      requestedFocus,
      context.parentByFrame,
      context.rootId,
    );
    return {
      targetFrameId: cssHit.targetFrameId,
      tailSelector: cssHit.tailSelector || undefined,
      absPrefix: cssHit.absPrefix,
    };
  };

  try {
    const { targetFrameId, tailSelector, absPrefix } = await locateTarget();

    const owningSess = ownerSession(page, targetFrameId);
    const parentId = context.parentByFrame.get(targetFrameId);
    const sameSessionAsParent =
      !!parentId &&
      ownerSession(page, parentId) === ownerSession(page, targetFrameId);

    const domMaps = await domMapsForSession(
      owningSess,
      targetFrameId,
      pierce,
      encodeFor,
      sameSessionAsParent,
    );
    const { xpathMap } = domMaps;

    const { outline, urlMap, scopeApplied } = await a11yForFrame(
      owningSess,
      targetFrameId,
      {
        focusSelector: tailSelector,
        tagNameMap: domMaps.tagNameMap,
        experimental: options?.experimental ?? false,
        scrollableMap: domMaps.scrollableMap,
        encode: (backendNodeId: number) =>
          encodeFor(targetFrameId, backendNodeId),
      },
    );

    if (scopeApplied) {
      const abs = absPrefix ?? "";
      const frameIsRoot = !abs || abs === "/";

      const combinedXpathMap: Record<string, string> = {};
      if (frameIsRoot) {
        Object.assign(combinedXpathMap, xpathMap);
      } else {
        // Prefix the frame-relative XPaths to match the global encoding.
        for (const [encId, xp] of Object.entries(xpathMap)) {
          combinedXpathMap[encId] = prefixXPath(abs, xp);
        }
      }

      return {
        combinedTree: outline,
        combinedXpathMap,
        combinedUrlMap: { ...urlMap },
        perFrame: [
          {
            frameId: targetFrameId,
            outline,
            xpathMap,
            urlMap,
          },
        ],
      };
    }

    logScopeFallback();
  } catch {
    logScopeFallback();
  }
  return null;
}

/**
 * Step 2 – build one DOM index per unique CDP session.
 *
 * Frames are grouped by the id of their owning session (sessions without an
 * id share the key `"root"`); the first session seen for a key is the one
 * indexed. Indexes are built one session at a time.
 *
 * @returns Map of session key → DOM index.
 */
export async function buildSessionIndexes(
  page: Page,
  frames: string[],
  pierce: boolean,
): Promise<Map<string, SessionDomIndex>> {
  // Deduplicate sessions first so each is indexed exactly once.
  const uniqueSessions = new Map<string, CDPSessionLike>();
  for (const frameId of frames) {
    const session = ownerSession(page, frameId);
    const key = session.id ?? "root";
    if (uniqueSessions.has(key)) continue;
    uniqueSessions.set(key, session);
  }

  const indexes = new Map<string, SessionDomIndex>();
  for (const [key, session] of uniqueSessions) {
    indexes.set(key, await buildSessionDomIndex(session, pierce));
  }
  return indexes;
}

/**
 * Step 3 – derive DOM maps and an accessibility outline for each frame.
 *
 * For every frame id this:
 *  - looks up (or lazily builds and caches) the DOM index of its session;
 *  - picks the frame's document root: the session root, or, when the frame
 *    shares a session with its parent, the content document of its iframe
 *    owner element when the index knows it;
 *  - collects xpath/tag/scrollability maps for nodes under that document
 *    root, keyed by `<frame ordinal>-<backendNodeId>`, with XPaths made
 *    relative to the document root;
 *  - fetches the frame's accessibility outline and URL map.
 *
 * @returns Per-frame maps plus the outlines in `frameIds` order.
 */
export async function collectPerFrameMaps(
  page: Page,
  context: FrameContext,
  sessionToIndex: Map<string, SessionDomIndex>,
  options: SnapshotOptions | undefined,
  pierce: boolean,
  frameIds: string[],
): Promise<{
  perFrameMaps: Map<string, FrameDomMaps>;
  perFrameOutlines: Array<{ frameId: string; outline: string }>;
}> {
  const perFrameMaps = new Map<string, FrameDomMaps>();
  const perFrameOutlines: Array<{ frameId: string; outline: string }> = [];

  for (const frameId of frameIds) {
    const session = ownerSession(page, frameId);
    const sessionKey = session.id ?? "root";

    let domIndex = sessionToIndex.get(sessionKey);
    if (!domIndex) {
      domIndex = await buildSessionDomIndex(session, pierce);
      sessionToIndex.set(sessionKey, domIndex);
    }

    const parentFrameId = context.parentByFrame.get(frameId);
    const sharesParentSession =
      !!parentFrameId && ownerSession(page, parentFrameId) === session;

    let docRoot = domIndex.rootBackend;
    if (sharesParentSession) {
      try {
        const owner = await session.send<{ backendNodeId?: number }>(
          "DOM.getFrameOwner",
          { frameId },
        );
        if (typeof owner.backendNodeId === "number") {
          const contentRoot = domIndex.contentDocRootByIframe.get(
            owner.backendNodeId,
          );
          if (typeof contentRoot === "number") docRoot = contentRoot;
        }
      } catch {
        // Owner lookup failed; keep the session root as the document root.
      }
    }

    const encode = (backendNodeId: number): string =>
      `${page.getOrdinal(frameId)}-${backendNodeId}`;
    const baseAbs = domIndex.absByBe.get(docRoot) ?? "/";

    const tagNameMap: Record<string, string> = {};
    const xpathMap: Record<string, string> = {};
    const scrollableMap: Record<string, boolean> = {};

    for (const [backendId, absXPath] of domIndex.absByBe.entries()) {
      // Skip nodes that belong to a different document in this session.
      if (domIndex.docRootOf.get(backendId) !== docRoot) continue;

      // Translate the absolute XPath into one relative to this frame's root.
      const relative = relativizeXPath(baseAbs, absXPath);
      const key = encode(backendId);
      xpathMap[key] = relative;

      const tag = domIndex.tagByBe.get(backendId);
      if (tag) tagNameMap[key] = tag;
      if (domIndex.scrollByBe.get(backendId)) scrollableMap[key] = true;
    }

    const { outline, urlMap } = await a11yForFrame(session, frameId, {
      experimental: options?.experimental ?? false,
      tagNameMap,
      scrollableMap,
      encode,
    });

    perFrameOutlines.push({ frameId, outline });
    perFrameMaps.set(frameId, { tagNameMap, xpathMap, scrollableMap, urlMap });
  }

  return { perFrameMaps, perFrameOutlines };
}

/**
 * Step 4 – breadth-first walk of the frame tree, starting at the root, that
 * assigns each in-scope frame an absolute XPath prefix.
 *
 * A child's prefix is its parent's prefix joined with the XPath of the iframe
 * element hosting it (looked up in the parent's xpath map). When the host
 * element cannot be identified, or its XPath is unknown, the child inherits
 * the parent's prefix unchanged.
 *
 * @returns `absPrefix` (frameId → prefix, root is `""`) and
 *          `iframeHostEncByChild` (child frameId → encoded id of its host
 *          iframe element; only set when the host was identified).
 */
export async function computeFramePrefixes(
  page: Page,
  context: FrameContext,
  perFrameMaps: Map<string, FrameDomMaps>,
  frameIds: string[],
): Promise<{
  absPrefix: Map<string, string>;
  iframeHostEncByChild: Map<string, string>;
}> {
  const absPrefix = new Map<string, string>([[context.rootId, ""]]);
  const iframeHostEncByChild = new Map<string, string>();
  const inScope = new Set(frameIds);

  // Ask the parent's session which element hosts `child`; undefined on failure.
  const hostBackendIdOf = async (
    child: string,
  ): Promise<number | undefined> => {
    const hostSession = parentSession(page, context.parentByFrame, child);
    try {
      const { backendNodeId } = await hostSession.send<{
        backendNodeId?: number;
      }>("DOM.getFrameOwner", { frameId: child });
      return backendNodeId;
    } catch {
      return undefined;
    }
  };

  const pending: string[] = inScope.has(context.rootId)
    ? [context.rootId]
    : [];

  while (pending.length > 0) {
    const parent = pending.shift()!;
    const parentAbs = absPrefix.get(parent)!;

    const children = context.frames.filter(
      (frameId) =>
        inScope.has(frameId) && context.parentByFrame.get(frameId) === parent,
    );

    for (const child of children) {
      pending.push(child);

      const hostBackendId = await hostBackendIdOf(child);
      if (!hostBackendId) {
        // OOPIFs resolved via a different session inherit the parent prefix.
        absPrefix.set(child, parentAbs);
        continue;
      }

      const hostEnc = `${page.getOrdinal(parent)}-${hostBackendId}`;
      const hostXPath = perFrameMaps.get(parent)?.xpathMap[hostEnc];

      absPrefix.set(
        child,
        hostXPath ? prefixXPath(parentAbs || "/", hostXPath) : parentAbs,
      );
      iframeHostEncByChild.set(child, hostEnc);
    }
  }

  return { absPrefix, iframeHostEncByChild };
}

/**
 * Step 5 – fold the per-frame results into one snapshot.
 *
 *  - XPath maps are merged, with each non-root frame's relative XPaths
 *    prefixed by the absolute prefix computed in step 4.
 *  - URL maps are merged as-is.
 *  - Outlines are stitched by injecting each child frame's outline under the
 *    encoded id of its hosting iframe element in the root outline.
 *
 * The `perFrame` entries keep the original, un-prefixed maps.
 */
export function mergeFramesIntoSnapshot(
  context: FrameContext,
  perFrameMaps: Map<string, FrameDomMaps>,
  perFrameOutlines: Array<{ frameId: string; outline: string }>,
  absPrefix: Map<string, string>,
  iframeHostEncByChild: Map<string, string>,
  frameIds: string[],
): HybridSnapshot {
  const combinedXpathMap: Record<string, string> = {};
  const combinedUrlMap: Record<string, string> = {};

  for (const frameId of frameIds) {
    const frameMaps = perFrameMaps.get(frameId);
    if (!frameMaps) continue;

    const prefix = absPrefix.get(frameId) ?? "";
    const needsPrefix = prefix !== "" && prefix !== "/";

    if (needsPrefix) {
      for (const [encId, xp] of Object.entries(frameMaps.xpathMap)) {
        combinedXpathMap[encId] = prefixXPath(prefix, xp);
      }
    } else {
      Object.assign(combinedXpathMap, frameMaps.xpathMap);
    }
    Object.assign(combinedUrlMap, frameMaps.urlMap);
  }

  // Keyed by the host iframe's encoded id so injectSubtrees can nest lines.
  const outlineByHostEnc = new Map<string, string>();
  for (const entry of perFrameOutlines) {
    const hostEnc = iframeHostEncByChild.get(entry.frameId);
    if (hostEnc) outlineByHostEnc.set(hostEnc, entry.outline);
  }

  const rootEntry = perFrameOutlines.find(
    (entry) => entry.frameId === context.rootId,
  );
  const rootOutline = rootEntry?.outline ?? perFrameOutlines[0]?.outline ?? "";
  const combinedTree = injectSubtrees(rootOutline, outlineByHostEnc);

  const perFrame = perFrameOutlines.map(({ frameId, outline }) => {
    const frameMaps = perFrameMaps.get(frameId);
    return {
      frameId,
      outline,
      xpathMap: frameMaps?.xpathMap ?? {},
      urlMap: frameMaps?.urlMap ?? {},
    };
  });

  return { combinedTree, combinedXpathMap, combinedUrlMap, perFrame };
}


================================================
FILE: packages/core/lib/v3/understudy/a11y/snapshot/coordinateResolver.ts
================================================
import type { Protocol } from "devtools-protocol";
import type { CDPSessionLike } from "../../cdp.js";
import { Page } from "../../page.js";
import { executionContexts } from "../../executionContextRegistry.js";
import { a11yScriptSources } from "../../../dom/build/a11yScripts.generated.js";
import { buildA11yInvocation } from "../../a11yInvocation.js";
import type { ResolvedLocation } from "../../../types/private/snapshot.js";
import { listChildrenOf } from "./focusSelectors.js";
import { buildAbsoluteXPathFromChain } from "./xpathUtils.js";

/**
 * Resolve the deepest node at a page coordinate and compute its absolute
 * XPath across frames. More efficient than building a full hybrid snapshot
 * when only a single node's XPath is needed.
 *
 * Starting at the main frame, the function hit-tests the point, and whenever
 * the hit node is the owner element of a child frame it records that hop,
 * translates the point by the iframe's bounding-rect offset and repeats inside
 * the child frame. At most 8 frames are visited.
 *
 * @param page Page to hit-test.
 * @param x    X coordinate of the point (relative to the main frame).
 * @param y    Y coordinate of the point (relative to the main frame).
 * @returns The owning frame id, backend node id and absolute XPath of the hit
 *          node, or `null` when hit-testing fails, no XPath can be built, or
 *          the hop limit is exhausted.
 */
export async function resolveXpathForLocation(
  page: Page,
  x: number,
  y: number,
): Promise<ResolvedLocation | null> {
  // Index frameId → parent frameId (null for the root).
  const tree = page.getFullFrameTree();
  const parentByFrame = new Map<string, string | null>();
  (function index(n: Protocol.Page.FrameTree, parent: string | null) {
    parentByFrame.set(n.frame.id, parent);
    for (const c of n.childFrames ?? []) index(c, n.frame.id);
  })(tree, null);

  // One entry per iframe hop descended so far, outermost first.
  const iframeChain: Array<{
    parentSession: CDPSessionLike;
    iframeBackendNodeId: number;
  }> = [];

  let curFrameId = page.mainFrameId();
  let curSession = page.getSessionForFrame(curFrameId);
  let curX = x;
  let curY = y;

  // Hard cap on the number of frames visited.
  for (let depth = 0; depth < 8; depth++) {
    try {
      await curSession.send("DOM.enable").catch(() => {});

      // Scroll offsets of the current frame; left at 0 when they cannot be read.
      let sx = 0;
      let sy = 0;
      try {
        await curSession.send("Runtime.enable").catch(() => {});
        const ctxId = await executionContexts
          .waitForMainWorld(curSession, curFrameId)
          .catch(() => {});
        const scrollExpr = buildA11yInvocation("getScrollOffsets", []);
        const evalParams = ctxId
          ? {
              contextId: ctxId,
              expression: scrollExpr,
              returnByValue: true,
            }
          : { expression: scrollExpr, returnByValue: true };
        const { result } = await curSession.send<{
          result: { value?: { sx?: number; sy?: number } };
        }>("Runtime.evaluate", evalParams);
        sx = Number(result?.value?.sx ?? 0);
        sy = Number(result?.value?.sy ?? 0);
      } catch {
        // Best-effort: fall back to zero scroll offsets.
      }
      // Hit-test at the point shifted by the scroll offsets, clamped to
      // non-negative integers.
      const xi = Math.max(0, Math.floor(curX + sx));
      const yi = Math.max(0, Math.floor(curY + sy));

      let res: { backendNodeId?: number; frameId?: string } | undefined;
      try {
        res = await curSession.send<{
          backendNodeId?: number;
          frameId?: string;
        }>("DOM.getNodeForLocation", {
          x: xi,
          y: yi,
          includeUserAgentShadowDOM: false,
          ignorePointerEventsNone: false,
        });
      } catch {
        return null;
      }

      const be = res?.backendNodeId;
      const reportedFrameId = res?.frameId;
      // The hit test already reported a node in a different frame: treat it as
      // the final answer and attribute it to the reported frame.
      if (
        typeof be === "number" &&
        reportedFrameId &&
        reportedFrameId !== curFrameId
      ) {
        const abs = await buildAbsoluteXPathFromChain(
          iframeChain,
          curSession,
          be,
        );
        return abs
          ? { frameId: reportedFrameId, backendNodeId: be, absoluteXPath: abs }
          : null;
      }

      if (typeof be !== "number") return null;

      // Is the hit node the owner element of one of this frame's children?
      let matchedChild: string | undefined;
      for (const fid of listChildrenOf(parentByFrame, curFrameId)) {
        try {
          const { backendNodeId } = await curSession.send<{
            backendNodeId?: number;
          }>("DOM.getFrameOwner", { frameId: fid });
          if (backendNodeId === be) {
            matchedChild = fid;
            break;
          }
        } catch {
          continue;
        }
      }

      // Not an iframe host: the hit node is the leaf in the current frame.
      if (!matchedChild) {
        const abs = await buildAbsoluteXPathFromChain(
          iframeChain,
          curSession,
          be,
        );
        return abs
          ? { frameId: curFrameId, backendNodeId: be, absoluteXPath: abs }
          : null;
      }

      // Record the hop before descending into the child frame.
      iframeChain.push({
        parentSession: curSession,
        iframeBackendNodeId: be,
      });

      // Offset of the iframe element, used to translate the point into the
      // child frame; stays at 0 when it cannot be measured.
      let left = 0;
      let top = 0;
      try {
        const { object } = await curSession.send<{
          object: { objectId?: string };
        }>("DOM.resolveNode", { backendNodeId: be });
        const objectId = object?.objectId;
        if (objectId) {
          const { result } = await curSession.send<{
            result: { value?: { left: number; top: number } };
          }>("Runtime.callFunctionOn", {
            objectId,
            functionDeclaration: a11yScriptSources.getBoundingRectLite,
            returnByValue: true,
          });
          left = Number(result?.value?.left ?? 0);
          top = Number(result?.value?.top ?? 0);
          await curSession
            .send("Runtime.releaseObject", { objectId })
            .catch(() => {});
        }
      } catch {
        // Best-effort: continue with a zero offset.
      }
      // Continue inside the child frame with the translated, clamped point.
      curX = Math.max(0, curX - left);
      curY = Math.max(0, curY - top);
      curFrameId = matchedChild;
      curSession = page.getSessionForFrame(curFrameId);
    } catch {
      return null;
    }
  }
  // Hop limit reached without resolving a leaf node.
  return null;
}


================================================
FILE: packages/core/lib/v3/understudy/a11y/snapshot/domTree.ts
================================================
import type { Protocol } from "devtools-protocol";
import type { CDPSessionLike } from "../../cdp.js";
import { StagehandDomProcessError } from "../../../types/public/sdkErrors.js";
import type { SessionDomIndex } from "../../../types/private/snapshot.js";
import {
  buildChildXPathSegments,
  joinXPath,
  normalizeXPath,
} from "./xpathUtils.js";

// Depths tried in order for DOM.getDocument: start from infinite depth (-1),
// then shrink exponentially down to 1.
const DOM_DEPTH_ATTEMPTS = [-1, 256, 128, 64, 32, 16, 8, 4, 2, 1];
// Depths tried in order for DOM.describeNode when re-expanding a truncated
// node: infinite depth (-1) first, then shrinking exponentially down to 1.
const DESCRIBE_DEPTH_ATTEMPTS = [-1, 64, 32, 16, 8, 4, 2, 1];

/**
 * Report whether an error message is the CDP "CBOR: stack limit exceeded"
 * failure, which the callers treat as a signal to retry with a smaller depth.
 */
function isCborStackError(message: string): boolean {
  const marker = "CBOR: stack limit exceeded";
  return message.indexOf(marker) !== -1;
}

/**
 * Decide whether a DOM node's children were truncated in the payload.
 *
 * Returns true when the node declares more children (`childNodeCount`) than
 * are actually present in `children`; both default to 0 when absent. Callers
 * use this to decide whether the node must be re-described.
 */
export function shouldExpandNode(node: Protocol.DOM.Node): boolean {
  const present = node.children?.length ?? 0;
  const declared = node.childNodeCount ?? 0;
  return present < declared;
}

/**
 * Copy the structural fields of `source` onto `target` in place.
 *
 * For `childNodeCount`, `children`, `shadowRoots` and `contentDocument`, the
 * source value wins when it is not null/undefined; otherwise the target keeps
 * its current value. All four fields are always (re)assigned on `target`.
 */
export function mergeDomNodes(
  target: Protocol.DOM.Node,
  source: Protocol.DOM.Node,
): void {
  Object.assign(target, {
    childNodeCount: source.childNodeCount ?? target.childNodeCount,
    children: source.children ?? target.children,
    shadowRoots: source.shadowRoots ?? target.shadowRoots,
    contentDocument: source.contentDocument ?? target.contentDocument,
  });
}

/**
 * List every node directly nested under `node`, in traversal order: regular
 * children first, then shadow roots, then the content document (if any).
 * Always returns a fresh array.
 */
export function collectDomTraversalTargets(
  node: Protocol.DOM.Node,
): Protocol.DOM.Node[] {
  return [
    ...(node.children || []),
    ...(node.shadowRoots || []),
    ...(node.contentDocument ? [node.contentDocument] : []),
  ];
}

/**
 * Fill in the missing branches of a truncated DOM tree, in place.
 *
 * The tree is walked depth-first with an explicit stack. Each node is visited
 * at most once (tracked by nodeId when positive, otherwise by backendNodeId).
 * A node whose children were truncated is re-fetched with DOM.describeNode,
 * trying each depth in DESCRIBE_DEPTH_ATTEMPTS until one succeeds; CBOR stack
 * errors move on to the next depth.
 *
 * @throws StagehandDomProcessError when describeNode fails for any non-CBOR
 *         reason, or when every depth attempt hits the CBOR limit.
 */
export async function hydrateDomTree(
  session: CDPSessionLike,
  root: Protocol.DOM.Node,
  pierce: boolean,
): Promise<void> {
  const visitedNodeIds = new Set<number>();
  const visitedBackendIds = new Set<number>();
  const pending: Protocol.DOM.Node[] = [root];

  // Only positive numeric ids are treated as usable identifiers.
  const usableId = (value: unknown): number | undefined =>
    typeof value === "number" && value > 0 ? value : undefined;

  while (pending.length > 0) {
    const current = pending.pop()!;
    const nodeId = usableId(current.nodeId);
    const backendId = usableId(current.backendNodeId);

    // Visit-once guard: nodeId takes precedence over backendNodeId.
    if (nodeId) {
      if (visitedNodeIds.has(nodeId)) continue;
      visitedNodeIds.add(nodeId);
    } else if (backendId) {
      if (visitedBackendIds.has(backendId)) continue;
      visitedBackendIds.add(backendId);
    }

    if (shouldExpandNode(current) && (nodeId || backendId)) {
      const identifier = nodeId ?? backendId ?? "unknown";
      const lookup = nodeId ? { nodeId } : { backendNodeId: backendId! };

      let succeeded = false;
      for (const depth of DESCRIBE_DEPTH_ATTEMPTS) {
        try {
          const response =
            await session.send<Protocol.DOM.DescribeNodeResponse>(
              "DOM.describeNode",
              { ...lookup, depth, pierce },
            );
          mergeDomNodes(current, response.node);
          // Adopt the nodeId from the response when the node had none.
          const describedId = response.node.nodeId;
          if (!nodeId && describedId && describedId > 0) {
            current.nodeId = describedId;
            visitedNodeIds.add(describedId);
          }
          succeeded = true;
          break;
        } catch (err) {
          const message = err instanceof Error ? err.message : String(err);
          if (!isCborStackError(message)) {
            throw new StagehandDomProcessError(
              `Failed to expand DOM node ${identifier}: ${String(err)}`,
            );
          }
          // CBOR stack overflow: retry with the next, shallower depth.
        }
      }

      if (!succeeded) {
        throw new StagehandDomProcessError(
          `Unable to expand DOM node ${identifier} after describeNode depth retries`,
        );
      }
    }

    for (const nested of collectDomTraversalTargets(current)) {
      pending.push(nested);
    }
  }
}

/**
 * Fetch the session's DOM tree, retrying DOM.getDocument with each depth in
 * DOM_DEPTH_ATTEMPTS while CDP reports a CBOR stack-limit error.
 *
 * When a finite depth succeeds, the truncated branches are hydrated before
 * the root is returned. A CBOR error raised during hydration also moves on to
 * the next depth; any other error is rethrown as-is.
 *
 * @throws StagehandDomProcessError when every depth attempt fails with a CBOR
 *         stack-limit error.
 */
export async function getDomTreeWithFallback(
  session: CDPSessionLike,
  pierce: boolean,
): Promise<Protocol.DOM.Node> {
  let lastCborMessage = "";

  for (const depth of DOM_DEPTH_ATTEMPTS) {
    try {
      const response = await session.send<{ root: Protocol.DOM.Node }>(
        "DOM.getDocument",
        { depth, pierce },
      );
      const root = response.root;

      // Any depth other than -1 may have cut branches off; fill them in.
      const possiblyTruncated = depth !== -1;
      if (possiblyTruncated) {
        await hydrateDomTree(session, root, pierce);
      }

      return root;
    } catch (err) {
      const text = err instanceof Error ? err.message : String(err);
      if (!isCborStackError(text)) throw err;
      lastCborMessage = text;
    }
  }

  if (lastCborMessage) {
    throw new StagehandDomProcessError(
      `CDP DOM.getDocument failed after adaptive depth retries: ${lastCborMessage}`,
    );
  }
  throw new StagehandDomProcessError(
    "CDP DOM.getDocument failed after adaptive depth retries.",
  );
}

/**
 * Produce tag-name, XPath and scrollability maps for the document behind one
 * frame, keyed by the id that the caller-supplied `encode` returns.
 *
 * @param session CDP session used for DOM.enable, the tree fetch and
 *   DOM.getFrameOwner.
 * @param frameId Frame being mapped; also handed to `encode` for every node.
 * @param pierce Forwarded to the DOM tree fetch.
 * @param encode Builds the map key from (frameId, backendNodeId).
 * @param attemptOwnerLookup When true, look up the frame's owner element in
 *   the fetched tree and start from its contentDocument if it has one. When
 *   the lookup is disabled or fails, traversal starts at the tree root.
 * @returns Maps keyed by encoded id; `scrollableMap` only contains entries for
 *   nodes whose `isScrollable` is exactly `true`.
 */
export async function domMapsForSession(
  session: CDPSessionLike,
  frameId: string,
  pierce: boolean,
  encode: (fid: string, backendNodeId: number) => string,
  attemptOwnerLookup = true,
): Promise<{
  tagNameMap: Record<string, string>;
  xpathMap: Record<string, string>;
  scrollableMap: Record<string, boolean>;
}> {
  await session.send("DOM.enable").catch(() => {});
  const root = await getDomTreeWithFallback(session, pierce);

  let traversalRoot: Protocol.DOM.Node = root;
  if (attemptOwnerLookup) {
    try {
      const { backendNodeId: ownerBackendId } = await session.send<{
        backendNodeId?: number;
      }>("DOM.getFrameOwner", { frameId });
      const frameDocument =
        typeof ownerBackendId === "number"
          ? findNodeByBackendId(root, ownerBackendId)?.contentDocument
          : undefined;
      if (frameDocument) {
        traversalRoot = frameDocument;
      }
    } catch {
      // OOPIF or race: fall back to traversing from the session root.
    }
  }

  const tagNameMap: Record<string, string> = {};
  const xpathMap: Record<string, string> = {};
  const scrollableMap: Record<string, boolean> = {};

  type Pending = { node: Protocol.DOM.Node; xpath: string };
  const pending: Pending[] = [{ node: traversalRoot, xpath: "" }];

  for (let next = pending.pop(); next; next = pending.pop()) {
    const { node, xpath } = next;

    if (node.backendNodeId) {
      const key = encode(frameId, node.backendNodeId);
      tagNameMap[key] = String(node.nodeName).toLowerCase();
      xpathMap[key] = xpath || "/";
      if (node?.isScrollable === true) {
        scrollableMap[key] = true;
      }
    }

    const children = node.children ?? [];
    if (children.length > 0) {
      const segments = buildChildXPathSegments(children);
      // Push right-to-left so children are popped in document order.
      for (let idx = children.length - 1; idx >= 0; idx -= 1) {
        pending.push({
          node: children[idx]!,
          xpath: joinXPath(xpath, segments[idx]!),
        });
      }
    }

    // Shadow roots hang off their host through a "//" hop.
    for (const shadowRoot of node.shadowRoots ?? []) {
      pending.push({ node: shadowRoot, xpath: joinXPath(xpath, "//") });
    }
  }

  return { tagNameMap, xpathMap, scrollableMap };
}

/**
 * Walk the whole DOM tree of a CDP session once and index every node that has
 * a backendNodeId: its absolute XPath, lowercase tag name, scrollability, and
 * the backend id of the document root it belongs to. Iframe elements that
 * expose a contentDocument are additionally mapped to that document's root.
 *
 * @param session CDP session used for DOM.enable and the tree fetch.
 * @param pierce Forwarded to the DOM tree fetch.
 * @returns The populated index, including the backend id of the tree root.
 */
export async function buildSessionDomIndex(
  session: CDPSessionLike,
  pierce: boolean,
): Promise<SessionDomIndex> {
  await session.send("DOM.enable").catch(() => {});
  const root = await getDomTreeWithFallback(session, pierce);

  const absByBe = new Map<number, string>();
  const tagByBe = new Map<number, string>();
  const scrollByBe = new Map<number, boolean>();
  const docRootOf = new Map<number, number>();
  const contentDocRootByIframe = new Map<number, number>();

  const rootBackend = root.backendNodeId!;

  type Pending = { node: Protocol.DOM.Node; xp: string; docRootBe: number };
  const pending: Pending[] = [{ node: root, xp: "/", docRootBe: rootBackend }];

  for (let next = pending.pop(); next; next = pending.pop()) {
    const { node, xp, docRootBe } = next;

    const backendId = node.backendNodeId;
    if (backendId) {
      absByBe.set(backendId, xp || "/");
      tagByBe.set(backendId, String(node.nodeName).toLowerCase());
      if (node?.isScrollable === true) {
        scrollByBe.set(backendId, true);
      }
      docRootOf.set(backendId, docRootBe);
    }

    const children = node.children ?? [];
    if (children.length > 0) {
      const segments = buildChildXPathSegments(children);
      // Push right-to-left so children are popped in document order.
      for (let idx = children.length - 1; idx >= 0; idx -= 1) {
        pending.push({
          node: children[idx]!,
          xp: joinXPath(xp, segments[idx]!),
          docRootBe,
        });
      }
    }

    for (const shadowRoot of node.shadowRoots ?? []) {
      pending.push({ node: shadowRoot, xp: joinXPath(xp, "//"), docRootBe });
    }

    // A nested document keeps the iframe's XPath as its own and becomes the
    // document root for everything underneath it.
    const frameDocument = node.contentDocument as
      | Protocol.DOM.Node
      | undefined;
    if (frameDocument && typeof frameDocument.backendNodeId === "number") {
      contentDocRootByIframe.set(
        node.backendNodeId!,
        frameDocument.backendNodeId,
      );
      pending.push({
        node: frameDocument,
        xp,
        docRootBe: frameDocument.backendNodeId,
      });
    }
  }

  return {
    rootBackend,
    absByBe,
    tagByBe,
    scrollByBe,
    docRootOf,
    contentDocRootByIframe,
  };
}

/**
 * Relativize an absolute XPath against a document root's absolute path.
 *
 * Both inputs are normalized first. The base is only stripped when it ends on
 * a step boundary of the node path, i.e. the remainder starts with "/" (or
 * "//" for a shadow hop) or the base itself ends with "/". A purely textual
 * prefix match such as base `/a/div[1]` against `/a/div[10]/p` is NOT treated
 * as containment.
 *
 * @param baseAbs Absolute XPath of the document root.
 * @param nodeAbs Absolute XPath of the node.
 * @returns "/" when both paths are equal, the path below the base when the
 *   node lives inside it, otherwise the normalized absolute path as-is.
 */
export function relativizeXPath(baseAbs: string, nodeAbs: string): string {
  const base = normalizeXPath(baseAbs);
  const abs = normalizeXPath(nodeAbs);
  if (abs === base) return "/";

  if (abs.startsWith(base)) {
    // Non-empty here because abs !== base.
    const tail = abs.slice(base.length);
    // The remainder begins a new step ("/x" or "//x"): genuine descendant.
    if (tail.startsWith("/")) return tail;
    // The base already ended on a separator (e.g. "/"), so re-root the tail.
    if (base.endsWith("/")) return `/${tail}`;
    // Otherwise the match ended mid-step (div[1] vs div[10]): not contained.
  }

  return abs;
}

/**
 * Find a node by backendNodeId inside a DOM.getDocument tree.
 *
 * The search covers regular children, shadow roots and the `contentDocument`
 * of frame owner elements, so an element nested inside an iframe that is part
 * of the same tree can be located too.
 *
 * @param root Node to start searching from (inclusive).
 * @param backendNodeId Backend node id to look for.
 * @returns The first matching node, or `undefined` when none is reachable.
 */
export function findNodeByBackendId(
  root: Protocol.DOM.Node,
  backendNodeId: number,
): Protocol.DOM.Node | undefined {
  const stack: Protocol.DOM.Node[] = [root];
  while (stack.length) {
    const n = stack.pop()!;
    if (n.backendNodeId === backendNodeId) return n;
    if (n.children) for (const c of n.children) stack.push(c);
    if (n.shadowRoots) for (const s of n.shadowRoots) stack.push(s);
    // Frame owners carry their nested document here rather than in children.
    if (n.contentDocument) stack.push(n.contentDocument);
  }
  return undefined;
}


================================================
FILE: packages/core/lib/v3/understudy/a11y/snapshot/focusSelectors.ts
================================================
import type { Protocol } from "devtools-protocol";
import type { CDPSessionLike } from "../../cdp.js";
import { Page } from "../../page.js";
import { executionContexts } from "../../executionContextRegistry.js";
import { buildLocatorInvocation } from "../../locatorInvocation.js";
import { StagehandIframeError } from "../../../types/public/sdkErrors.js";
import type {
  Axis,
  FrameParentIndex,
  ResolvedCssFocus,
  ResolvedFocusFrame,
  Step,
} from "../../../types/private/snapshot.js";
import { prefixXPath } from "./xpathUtils.js";

/**
 * Parse a cross-frame XPath into discrete steps. Each step tracks whether it
 * was introduced by a descendant hop ("//") or a single-child hop ("/").
 *
 * Step boundaries are only recognised outside of predicates: a "/" that
 * appears inside `[...]` (including inside a quoted string literal within a
 * predicate, e.g. `a[@href='/docs']`) belongs to the current step.
 *
 * @param path XPath to split; surrounding whitespace is ignored.
 * @returns Steps in order. `raw` is the step text as written, `name` is the
 *   lowercased step with a trailing positional index (`[n]`) removed.
 */
export function parseXPathToSteps(path: string): Step[] {
  const s = path.trim();
  let i = 0;
  const steps: Step[] = [];
  while (i < s.length) {
    let axis: Axis = "child";
    if (s.startsWith("//", i)) {
      axis = "desc";
      i += 2;
    } else if (s[i] === "/") {
      axis = "child";
      i += 1;
    }

    const start = i;
    let depth = 0; // nesting level of '[' ... ']' predicates
    let quote = ""; // active string delimiter while inside a predicate literal
    while (i < s.length) {
      const ch = s[i]!;
      if (quote) {
        if (ch === quote) quote = "";
      } else if (depth > 0 && (ch === '"' || ch === "'")) {
        quote = ch;
      } else if (ch === "[") {
        depth += 1;
      } else if (ch === "]") {
        if (depth > 0) depth -= 1;
      } else if (ch === "/" && depth === 0) {
        break;
      }
      i += 1;
    }

    const raw = s.slice(start, i).trim();
    if (!raw) continue;
    const name = raw.replace(/\[\d+\]\s*$/u, "").toLowerCase();
    steps.push({ axis, raw, name });
  }
  return steps;
}

/**
 * Serialize parsed steps back into an XPath string. Each step contributes its
 * separator ("//" for the descendant axis, "/" otherwise) followed by its raw
 * text; an empty step list yields "/".
 */
export function buildXPathFromSteps(steps: ReadonlyArray<Step>): string {
  const joined = steps
    .map((step) => `${step.axis === "desc" ? "//" : "/"}${step.raw}`)
    .join("");
  return joined || "/";
}

/**
 * Matches a step name that is exactly `frame` or `iframe`, optionally followed
 * by a numeric positional index such as `[2]`. Matching is case-insensitive
 * and anchored to the whole string.
 */
export const IFRAME_STEP_RE = /^i?frame(?:\[\d+])?$/i;

/**
 * Walk a cross-frame XPath step by step, hopping into a child frame every time
 * an iframe step is encountered.
 *
 * @param page Page used to obtain the CDP session that owns each frame.
 * @param absoluteXPath Cross-frame XPath to resolve.
 * @param parentByFrame Frame -> parent frame index used to enumerate children.
 * @param rootId Frame id the walk starts in.
 * @returns The frame id reached after the last iframe hop, the XPath left over
 *   inside that frame, and the accumulated XPath prefix of the iframe elements
 *   that were traversed.
 * @throws StagehandIframeError when an iframe step cannot be resolved to an
 *   element, or the element cannot be matched to a child frame.
 */
export async function resolveFocusFrameAndTail(
  page: Page,
  absoluteXPath: string,
  parentByFrame: FrameParentIndex,
  rootId: string,
): Promise<ResolvedFocusFrame> {
  const allSteps = parseXPathToSteps(absoluteXPath);
  let currentFrameId = rootId;
  let pendingSteps: Step[] = [];
  let absPrefix = "";

  // Resolve the buffered steps to an iframe element in the current frame and
  // move the walk into the child frame that element hosts.
  const enterIframe = async (): Promise<void> => {
    if (pendingSteps.length === 0) return;

    const iframeXPath = buildXPathFromSteps(pendingSteps);
    const hostSession = page.getSessionForFrame(currentFrameId);
    const objectId = await resolveObjectIdForXPath(
      hostSession,
      iframeXPath,
      currentFrameId,
    );
    if (!objectId) {
      throw new StagehandIframeError(
        iframeXPath,
        "Failed to resolve iframe element by XPath",
      );
    }

    try {
      await hostSession.send("DOM.enable").catch(() => {});
      const described =
        await hostSession.send<Protocol.DOM.DescribeNodeResponse>(
          "DOM.describeNode",
          { objectId },
        );
      const iframeBackendNodeId = described.node.backendNodeId;

      // Find the child frame whose owner element is the iframe we resolved.
      let matchedFrameId: string | undefined;
      for (const candidate of listChildrenOf(parentByFrame, currentFrameId)) {
        try {
          const owner = await hostSession.send<{
            backendNodeId: number;
          }>("DOM.getFrameOwner", { frameId: candidate });
          if (owner.backendNodeId === iframeBackendNodeId) {
            matchedFrameId = candidate;
            break;
          }
        } catch {
          continue;
        }
      }
      if (!matchedFrameId) {
        throw new StagehandIframeError(
          iframeXPath,
          "Could not map iframe to child frameId",
        );
      }

      absPrefix = prefixXPath(absPrefix || "/", iframeXPath);
      currentFrameId = matchedFrameId;
    } finally {
      // Always drop the remote handle, even when the mapping failed.
      await hostSession
        .send("Runtime.releaseObject", { objectId })
        .catch(() => {});
    }

    pendingSteps = [];
  };

  for (const step of allSteps) {
    pendingSteps.push(step);
    if (IFRAME_STEP_RE.test(step.name)) {
      await enterIframe();
    }
  }

  return {
    targetFrameId: currentFrameId,
    tailXPath: buildXPathFromSteps(pendingSteps),
    absPrefix,
  };
}

/**
 * Resolve a CSS selector that uses '>>' to hop through iframes.
 *
 * Every segment except the last is resolved to an iframe element in the
 * current frame and then mapped to the child frame it owns; the last segment
 * is returned as the selector to run inside the final frame.
 *
 * @param page Page used to obtain the CDP session that owns each frame.
 * @param rawSelector Selector with optional '>>' separated hops.
 * @param parentByFrame Frame -> parent frame index used to enumerate children.
 * @param rootId Frame id the walk starts in.
 * @returns The final frame id, the tail selector ("*" when the selector has no
 *   non-empty segment) and an `absPrefix` that is always the empty string.
 * @throws StagehandIframeError when a hop cannot be resolved to an element or
 *   matched to a child frame.
 */
export async function resolveCssFocusFrameAndTail(
  page: Page,
  rawSelector: string,
  parentByFrame: FrameParentIndex,
  rootId: string,
): Promise<ResolvedCssFocus> {
  const segments = rawSelector
    .split(">>")
    .map((segment) => segment.trim())
    .filter(Boolean);
  const absPrefix = "";
  let currentFrameId = rootId;

  // All but the last segment are iframe hops.
  for (const hop of segments.slice(0, -1)) {
    const hostSession = page.getSessionForFrame(currentFrameId);
    const objectId = await resolveObjectIdForCss(
      hostSession,
      hop,
      currentFrameId,
    );
    if (!objectId) {
      throw new StagehandIframeError(
        hop,
        "Failed to resolve iframe via CSS hop",
      );
    }

    try {
      await hostSession.send("DOM.enable").catch(() => {});
      const described =
        await hostSession.send<Protocol.DOM.DescribeNodeResponse>(
          "DOM.describeNode",
          { objectId },
        );
      const iframeBackendNodeId = described.node.backendNodeId;

      let matchedFrameId: string | undefined;
      for (const candidate of listChildrenOf(parentByFrame, currentFrameId)) {
        try {
          const owner = await hostSession.send<{
            backendNodeId: number;
          }>("DOM.getFrameOwner", { frameId: candidate });
          if (owner.backendNodeId === iframeBackendNodeId) {
            matchedFrameId = candidate;
            break;
          }
        } catch {
          continue;
        }
      }
      if (!matchedFrameId) {
        throw new StagehandIframeError(
          hop,
          "Could not map CSS iframe hop to child frameId",
        );
      }
      currentFrameId = matchedFrameId;
    } finally {
      // Always drop the remote handle, even when the mapping failed.
      await hostSession
        .send("Runtime.releaseObject", { objectId })
        .catch(() => {});
    }
  }

  const tailSelector = segments[segments.length - 1] ?? "*";
  return { targetFrameId: currentFrameId, tailSelector, absPrefix };
}

/**
 * Evaluate the "resolveXPathMainWorld" locator helper for `xpath` through
 * Runtime.evaluate and return the remote objectId of the result.
 *
 * When `frameId` is given, the frame's main-world execution context is looked
 * up first (waiting up to 800 ms, then falling back to the currently known
 * context); if none can be determined the evaluation runs without a
 * contextId.
 *
 * @returns The objectId, or `null` when the evaluation reported an exception
 *   or produced no object handle.
 */
export async function resolveObjectIdForXPath(
  session: CDPSessionLike,
  xpath: string,
  frameId?: string,
): Promise<string | null> {
  let contextId: number | undefined;
  try {
    if (frameId) {
      contextId = await executionContexts
        .waitForMainWorld(session, frameId, 800)
        .catch(
          () => executionContexts.getMainWorld(session, frameId) ?? undefined,
        );
    }
  } catch {
    // Context lookup is best-effort.
    contextId = undefined;
  }

  const expression = buildLocatorInvocation("resolveXPathMainWorld", [
    JSON.stringify(xpath),
    "0",
  ]);
  const evaluation = await session.send<{
    result: { objectId?: string | undefined };
    exceptionDetails?: Protocol.Runtime.ExceptionDetails;
  }>("Runtime.evaluate", {
    expression,
    returnByValue: false,
    contextId,
    awaitPromise: true,
  });

  if (evaluation.exceptionDetails) {
    return null;
  }
  return evaluation.result?.objectId ?? null;
}

/**
 * Resolve a CSS selector to a Runtime objectId in the given CDP session.
 *
 * The "resolveCssSelector" locator helper is evaluated first; when it yields
 * no object (or reports an exception) the "resolveCssSelectorPierce" helper is
 * evaluated as a fallback. When `frameId` is given, both evaluations run in
 * that frame's main-world execution context if one can be determined (waiting
 * up to 800 ms, then falling back to the currently known context).
 *
 * @returns The objectId, or `null` when neither helper produced a handle.
 */
export async function resolveObjectIdForCss(
  session: CDPSessionLike,
  selector: string,
  frameId?: string,
): Promise<string | null> {
  let contextId: number | undefined;
  try {
    if (frameId) {
      contextId = await executionContexts
        .waitForMainWorld(session, frameId, 800)
        .catch(
          () => executionContexts.getMainWorld(session, frameId) ?? undefined,
        );
    }
  } catch {
    // Context lookup is best-effort.
    contextId = undefined;
  }

  const quotedSelector = JSON.stringify(selector);
  const primaryExpr = buildLocatorInvocation("resolveCssSelector", [
    quotedSelector,
    "0",
  ]);
  const fallbackExpr = buildLocatorInvocation("resolveCssSelectorPierce", [
    quotedSelector,
    "0",
  ]);

  // Run one expression and reduce the outcome to "objectId or null".
  const runExpression = async (expression: string): Promise<string | null> => {
    const evaluation = await session.send<{
      result: { objectId?: string | undefined };
      exceptionDetails?: Protocol.Runtime.ExceptionDetails;
    }>("Runtime.evaluate", {
      expression,
      returnByValue: false,
      contextId,
      awaitPromise: true,
    });
    if (evaluation.exceptionDetails) {
      return null;
    }
    return evaluation.result?.objectId ?? null;
  };

  const fromPrimary = await runExpression(primaryExpr);
  return fromPrimary ? fromPrimary : runExpression(fallbackExpr);
}

/**
 * List the frame ids whose recorded parent is `parentId`, in the iteration
 * order of the index.
 */
export function listChildrenOf(
  parentByFrame: FrameParentIndex,
  parentId: string,
): string[] {
  return Array.from(parentByFrame.entries())
    .filter(([, parent]) => parent === parentId)
    .map(([frameId]) => frameId);
}


================================================
FILE: packages/core/lib/v3/understudy/a11y/snapshot/index.ts
================================================
export { captureHybridSnapshot } from "./capture.js";
export { computeActiveElementXpath } from "./activeElement.js";
export { diffCombinedTrees } from "./treeFormatUtils.js";
export { resolveXpathForLocation } from "./coordinateResolver.js";


================================================
FILE: packages/core/lib/v3/understudy/a11y/snapshot/sessions.ts
================================================
import type { CDPSessionLike } from "../../cdp.js";
import { Page } from "../../page.js";
import type { FrameParentIndex } from "../../../types/private/snapshot.js";

/**
 * Session helpers ensure DOM lookups are always executed against the session
 * that actually owns a frame. Keeping this logic centralized prevents subtle
 * bugs when OOPIF adoption changes session ownership mid-capture.
 */

/** Look up the session the Page has registered for `frameId`. */
export function ownerSession(page: Page, frameId: string): CDPSessionLike {
  const session = page.getSessionForFrame(frameId);
  return session;
}

/**
 * Return the session of the frame's parent, which is the session
 * DOM.getFrameOwner has to be sent on. When the index records no parent for
 * the frame, the frame's own session is returned instead.
 */
export function parentSession(
  page: Page,
  parentByFrame: FrameParentIndex,
  frameId: string,
): CDPSessionLike {
  const parentId = parentByFrame.get(frameId) ?? null;
  const lookupId = parentId ? parentId : frameId;
  return page.getSessionForFrame(lookupId);
}


================================================
FILE: packages/core/lib/v3/understudy/a11y/snapshot/treeFormatUtils.ts
================================================
import type { A11yNode } from "../../../types/private/snapshot.js";

/**
 * Render an accessibility node and its descendants as an indented outline.
 *
 * Each line reads `[id] role` followed by `: name` when the node has a name
 * (cleaned with cleanText). The id is the node's encodedId when present,
 * otherwise its nodeId. Every nesting level adds two spaces of indentation.
 *
 * @param node Node to render.
 * @param level Nesting depth of `node`; 0 for the outline root.
 */
export function formatTreeLine(node: A11yNode, level = 0): string {
  const padding = "  ".repeat(level);
  const id = node.encodedId ?? node.nodeId;
  const nameSuffix = node.name ? `: ${cleanText(node.name)}` : "";
  const ownLine = `${padding}[${id}] ${node.role}${nameSuffix}`;

  const childLines = (node.children ?? []).map((child) =>
    formatTreeLine(child, level + 1),
  );
  const childBlock = childLines.join("\n");

  return childBlock ? `${ownLine}\n${childBlock}` : ownLine;
}

/**
 * Inject each child frame outline under the parent's iframe node line.
 * Keys in `idToTree` are the parent's iframe encoded ids.
 *
 * Every line that starts (after indentation) with `[id]` and whose id has an
 * outline in `idToTree` gets that outline, itself fully expanded, inserted
 * right below it with two extra spaces of indentation. Within one outline an
 * id is expanded at most once. An id is never expanded inside its own
 * expansion, so a self-referencing or cyclic `idToTree` terminates instead of
 * recursing without bound.
 *
 * @param rootOutline Outline of the top-level frame.
 * @param idToTree Child outlines keyed by the encoded id of the hosting node.
 * @returns The combined outline.
 */
export function injectSubtrees(
  rootOutline: string,
  idToTree: Map<string, string>,
): string {
  return injectSubtreesGuarded(rootOutline, idToTree, new Set<string>());
}

/**
 * Expand one outline; `ancestors` holds the ids currently being expanded
 * further up the recursion so cycles can be cut.
 */
function injectSubtreesGuarded(
  outline: string,
  idToTree: Map<string, string>,
  ancestors: Set<string>,
): string {
  const out: string[] = [];
  const visited = new Set<string>();

  for (const raw of outline.split("\n")) {
    out.push(raw);

    const indent = raw.match(/^(\s*)/)?.[1] ?? "";
    const content = raw.slice(indent.length);

    const m = content.match(/^\[([^\]]+)]/);
    if (!m) continue;

    const encId = m[1]!;
    const childOutline = idToTree.get(encId);
    if (!childOutline || visited.has(encId) || ancestors.has(encId)) continue;

    visited.add(encId);

    // Mark the id as "in progress" only for the duration of its expansion so
    // unrelated occurrences elsewhere in the tree are still expanded.
    ancestors.add(encId);
    const fullyInjectedChild = injectSubtreesGuarded(
      childOutline,
      idToTree,
      ancestors,
    );
    ancestors.delete(encId);

    out.push(indentBlock(fullyInjectedChild.trimEnd(), indent + "  "));
  }

  return out.join("\n");
}

/**
 * Prefix every line of `block` (including empty ones) with `indent`.
 * An empty block is returned as the empty string.
 */
export function indentBlock(block: string, indent: string): string {
  if (!block) return "";
  const indented: string[] = [];
  for (const line of block.split("\n")) {
    indented.push(`${indent}${line}`);
  }
  return indented.join("\n");
}

/**
 * Compute the lines of `nextTree` that do not occur in `prevTree`.
 *
 * Lines are compared after trimming, so indentation differences alone do not
 * count as a change; blank lines are ignored. The surviving lines keep their
 * original order and are shifted left by the smallest indentation found among
 * them. Returns the empty string when nothing was added.
 */
export function diffCombinedTrees(prevTree: string, nextTree: string): string {
  const known = new Set<string>();
  for (const line of (prevTree || "").split("\n")) {
    const core = line.trim();
    if (core.length > 0) known.add(core);
  }

  const added = (nextTree || "").split("\n").filter((line) => {
    const core = line.trim();
    return core.length > 0 && !known.has(core);
  });
  if (added.length === 0) return "";

  const smallestIndent = added.reduce((smallest, line) => {
    const indentLen = (line.match(/^\s*/)?.[0] ?? "").length;
    return indentLen < smallest ? indentLen : smallest;
  }, Infinity);
  const shift = isFinite(smallestIndent) ? smallestIndent : 0;

  return added
    .map((line) => (line.length >= shift ? line.slice(shift) : line))
    .join("\n");
}

/**
 * Sanitize a name before rendering it.
 *
 * Code units in the BMP private-use range (U+E000..U+F8FF) are dropped.
 * U+00A0, U+202F, U+2007 and U+FEFF are each turned into a regular space,
 * unless the previously emitted character already was a space, in which case
 * they are dropped. Everything else is copied through, and the result is
 * trimmed.
 */
export function cleanText(input: string): string {
  const isPrivateUse = (code: number): boolean =>
    code >= 0xe000 && code <= 0xf8ff;
  const spaceLike = new Set<number>([0x00a0, 0x202f, 0x2007, 0xfeff]);

  let cleaned = "";
  let lastWasSpace = false;
  for (const ch of input) {
    const code = ch.codePointAt(0)!;
    if (isPrivateUse(code)) continue;

    if (spaceLike.has(code)) {
      if (!lastWasSpace) {
        cleaned += " ";
        lastWasSpace = true;
      }
      continue;
    }

    cleaned += ch;
    lastWasSpace = ch === " ";
  }
  return cleaned.trim();
}

/**
 * Replace every run of whitespace characters with a single space. Leading and
 * trailing whitespace is collapsed as well but not removed.
 * Exported for pruning routines that need the same normalization.
 */
export function normaliseSpaces(s: string): string {
  return s.replace(/\s+/g, " ");
}


================================================
FILE: packages/core/lib/v3/understudy/a11y/snapshot/xpathUtils.ts
================================================
import type { Protocol } from "devtools-protocol";
import type { CDPSessionLike } from "../../cdp.js";
import { a11yScriptSources } from "../../../dom/build/a11yScripts.generated.js";

/**
 * Compose an absolute, cross-frame XPath for a leaf node.
 *
 * The XPath of every iframe host in `chain` is resolved in its parent session
 * and appended in order; hosts whose XPath cannot be resolved are skipped.
 * The leaf's own XPath (resolved in `leafSession`) is appended last.
 *
 * @returns The combined XPath. When the leaf cannot be resolved, the prefix
 *   built from the chain is returned, or "/" if that is empty too.
 */
export async function buildAbsoluteXPathFromChain(
  chain: Array<{
    parentSession: CDPSessionLike;
    iframeBackendNodeId: number;
  }>,
  leafSession: CDPSessionLike,
  leafBackendNodeId: number,
): Promise<string | null> {
  let prefix = "";
  // Append a fragment to whatever has been accumulated so far.
  const extend = (fragment: string): string =>
    prefix ? prefixXPath(prefix, fragment) : normalizeXPath(fragment);

  for (const { parentSession, iframeBackendNodeId } of chain) {
    const hostXPath = await absoluteXPathForBackendNode(
      parentSession,
      iframeBackendNodeId,
    );
    if (hostXPath) {
      prefix = extend(hostXPath);
    }
  }

  const leafXPath = await absoluteXPathForBackendNode(
    leafSession,
    leafBackendNodeId,
  );
  if (leafXPath) {
    return extend(leafXPath);
  }
  return prefix || "/";
}

/**
 * Resolve a backend node to an absolute XPath within the provided session.
 *
 * The node is resolved to a remote object with DOM.resolveNode and the
 * `nodeToAbsoluteXPath` helper script is invoked on it through
 * Runtime.callFunctionOn. The remote object handle is released in a `finally`
 * block, so it is not leaked when the helper call fails.
 *
 * @param session CDP session that owns the node.
 * @param backendNodeId Backend id of the node to describe.
 * @returns The XPath, or `null` when the node cannot be resolved, the helper
 *   returns no non-empty string, or any CDP call fails.
 */
export async function absoluteXPathForBackendNode(
  session: CDPSessionLike,
  backendNodeId: number,
): Promise<string | null> {
  try {
    const { object } = await session.send<{ object: { objectId?: string } }>(
      "DOM.resolveNode",
      { backendNodeId },
    );
    const objectId = object?.objectId;
    if (!objectId) return null;

    try {
      const { result } = await session.send<{ result: { value?: string } }>(
        "Runtime.callFunctionOn",
        {
          objectId,
          functionDeclaration: a11yScriptSources.nodeToAbsoluteXPath,
          returnByValue: true,
        },
      );
      return typeof result?.value === "string" && result.value
        ? result.value
        : null;
    } finally {
      // Best-effort release; runs on success and on failure alike.
      await session.send("Runtime.releaseObject", { objectId }).catch(() => {});
    }
  } catch {
    return null;
  }
}

/**
 * Put the absolute iframe path `parentAbs` in front of the `child` XPath.
 *
 * A parent of "/" counts as empty and a single trailing "/" on the parent is
 * dropped. An empty or "/" child yields the parent alone ("/" if that is
 * empty). A child starting with "//" keeps its descendant hop; otherwise the
 * two parts are joined with a single "/".
 */
export function prefixXPath(parentAbs: string, child: string): string {
  const parent = parentAbs === "/" ? "" : parentAbs.replace(/\/$/, "");
  if (!child || child === "/") {
    return parent || "/";
  }

  const isDescendantHop = child.startsWith("//");
  const separator = isDescendantHop ? "//" : "/";
  const remainder = isDescendantHop ? child.slice(2) : child.replace(/^\//, "");
  return `${parent}${separator}${remainder}`;
}

/**
 * Normalize an XPath: trim it, drop a leading `xpath=` (any case), make sure
 * it starts with '/', and remove one trailing '/' unless the path is just "/".
 * A missing or empty input yields the empty string.
 */
export function normalizeXPath(x?: string): string {
  if (!x) return "";
  const stripped = x.trim().replace(/^xpath=/i, "");
  const rooted = stripped.startsWith("/") ? stripped : `/${stripped}`;
  const hasTrailingSlash = rooted.length > 1 && rooted.endsWith("/");
  return hasTrailingSlash ? rooted.slice(0, -1) : rooted;
}

/**
 * Compute one XPath step per sibling, in input order.
 *
 * Siblings are numbered (1-based) per combination of node type and lowercase
 * node name. Text nodes (type 3) become `text()[n]`, comments (type 8)
 * `comment()[n]`, names containing ':' become `*[name()='tag'][n]`, and
 * everything else `tag[n]`.
 */
export function buildChildXPathSegments(kids: Protocol.DOM.Node[]): string[] {
  const seen = new Map<string, number>();

  return kids.map((child) => {
    const tag = String(child.nodeName).toLowerCase();
    const counterKey = `${child.nodeType}:${tag}`;
    const position = (seen.get(counterKey) ?? 0) + 1;
    seen.set(counterKey, position);

    switch (child.nodeType) {
      case 3:
        return `text()[${position}]`;
      case 8:
        return `comment()[${position}]`;
      default:
        return tag.includes(":")
          ? `*[name()='${tag}'][${position}]`
          : `${tag}[${position}]`;
    }
  });
}

/**
 * Append `step` to `base`.
 *
 * The special step "//" marks a shadow-root hop: it turns an empty or "/"
 * base into "//" and otherwise makes the base end in "//" (adding only one
 * slash when the base already ends with one). For regular steps, a base that
 * ends in "//" takes the step directly, an empty step leaves the base
 * unchanged, and everything else is joined with a single "/".
 */
export function joinXPath(base: string, step: string): string {
  const atRoot = !base || base === "/";

  if (step === "//") {
    if (atRoot) return "//";
    const hop = base.endsWith("/") ? "/" : "//";
    return `${base}${hop}`;
  }

  if (atRoot) {
    return step ? `/${step}` : "/";
  }
  if (base.endsWith("//")) {
    return `${base}${step}`;
  }
  return step ? `${base}/${step}` : base;
}


================================================
FILE: packages/core/lib/v3/understudy/a11yInvocation.ts
================================================
import {
  a11yScriptBootstrap,
  a11yScriptGlobalRefs,
  type A11yScriptName,
} from "../dom/build/a11yScripts.generated.js";

/**
 * Build a self-invoking expression string that runs the a11y bootstrap and
 * then returns the result of calling the helper registered under `name`
 * (looked up in `a11yScriptGlobalRefs`) with `args`.
 *
 * @param name Key of the generated a11y script to call.
 * @param args Already-serialized argument expressions; joined with ", ".
 */
export function buildA11yInvocation(
  name: A11yScriptName,
  args: string[],
): string {
  const callee = a11yScriptGlobalRefs[name];
  const argumentList = args.join(", ");
  return `(() => { ${a11yScriptBootstrap}; return ${callee}(${argumentList}); })()`;
}


================================================
FILE: packages/core/lib/v3/understudy/cdp.ts
================================================
// lib/v3/understudy/cdp.ts
import WebSocket from "ws";
import type { Protocol } from "devtools-protocol";
import { STAGEHAND_VERSION } from "../../version.js";
import {
  FlowLogger,
  type FlowEvent,
  type FlowLoggerContext,
} from "../flowlogger/FlowLogger.js";
import {
  CdpConnectionClosedError,
  PageNotFoundError,
} from "../types/public/sdkErrors.js";

/**
 * CDP transport & session multiplexer
 *
 * Owns the browser WebSocket and multiplexes flattened Target sessions.
 * Tracks inflight CDP calls, routes responses to the right session, and forwards events.
 *
 * This does not interpret Page/DOM/Runtime semantics — callers own that logic.
 */
export interface CDPSessionLike {
  /** Send a CDP method with optional params; resolves with the result typed as `R`. */
  send<R = unknown>(method: string, params?: object): Promise<R>;
  /** Register `handler` for the named event. */
  on<P = unknown>(event: string, handler: (params: P) => void): void;
  /** Remove a handler previously registered with `on`. */
  off<P = unknown>(event: string, handler: (params: P) => void): void;
  /** Close the session. */
  close(): Promise<void>;
  /** Session id; `null` for the root connection (see `CdpConnection.id`). */
  readonly id: string | null;
}

/**
 * Bookkeeping record for one outstanding CDP request, stored in
 * `CdpConnection.inflight` under the request's numeric id.
 */
type Inflight = {
  // Settle the promise handed back to the caller of the request.
  resolve: (v: unknown) => void;
  reject: (e: Error) => void;
  // Session the request was sent on. NOTE(review): presumably null/undefined for the root connection — confirm.
  sessionId?: string | null;
  // The CDP method and params the request was sent with.
  method: string;
  params?: object;
  // NOTE(review): presumably a call-site stack captured at send time for diagnostics — confirm.
  stack?: string;
  // NOTE(review): presumably the send timestamp — confirm unit against `_sendViaSession()`.
  ts: number;
  flowLoggerContext?: FlowLoggerContext | null; // Snapshot of the flow context captured when the request was sent; response handling re-enters this if ALS is gone.
  cdpCallEvent?: Pick<FlowEvent, "eventId" | "eventParentIds"> | null; // The emitted CdpCallEvent identity; later response/error events attach under this exact parent.
};

/** Callback invoked with the (untyped) params of a CDP event. */
type EventHandler = (params: unknown) => void;
/**
 * A pending wait on a session, stored in `CdpConnection.sessionDispatchWaiters`.
 * NOTE(review): presumably settled when `method` is dispatched on `sessionId`
 * and the optional `match` predicate accepts its params — confirm against the
 * code that consumes these waiters.
 */
type SessionDispatchWaiter = {
  sessionId: string;
  method: string;
  // Optional filter over the dispatched params.
  match?: (params?: object) => boolean;
  resolve: () => void;
  reject: (error: Error) => void;
};

/**
 * Shape of a message on the wire. The first variant carries a numeric `id`
 * together with a `result` or an `error`; the second carries a `method` name
 * with optional `params`. Both may be tagged with the `sessionId` they belong
 * to. NOTE(review): the `id` variant presumably is the reply to a request and
 * the `method` variant an unsolicited event — confirm in `onMessage()`.
 */
type RawMessage =
  | {
      id: number;
      result?: unknown;
      error?: { code: number; message: string; data?: unknown };
      sessionId?: string;
    }
  | { method: string; params?: unknown; sessionId?: string };

/**
 * Root CDP connection.
 *
 * Wraps the browser WebSocket, assigns request ids, keeps the table of
 * in-flight requests, and routes responses/events to the root listeners or to
 * the flattened child sessions (`CdpSession`) that share this socket.
 */
export class CdpConnection implements CDPSessionLike {
  private ws: WebSocket;
  private nextId = 1;
  private inflight = new Map<number, Inflight>(); // Outstanding request records; `send()`/`_sendViaSession()` insert and `onMessage()` removes/resolves them.
  private latestCdpCallEvent = new Map<
    // Most recent CDP call per session/root; `_sendViaSession()` refreshes it and later unsolicited messages reuse it as their parent anchor.
    string | null,
    {
      flowLoggerContext: FlowLoggerContext; // Flow context captured when the latest call on this session/root was emitted.
      cdpCallEvent: Pick<FlowEvent, "eventId" | "eventParentIds">; // Identity of that latest call event; unsolicited messages reuse it as their parent.
    }
  >();
  // Root listeners are keyed by event name; session listeners by `${sessionId}:${event}`.
  private eventHandlers = new Map<string, Set<EventHandler>>();
  private sessions = new Map<string, CdpSession>();
  /** Maps sessionId -> targetId (each session belongs to exactly one target) */
  private sessionToTarget = new Map<string, string>();
  private sessionDispatchWaiters = new Set<SessionDispatchWaiter>();
  public readonly id: string | null = null; // root
  private transportCloseHandlers = new Set<(why: string) => void>();

  public flowLoggerContext?: FlowLoggerContext; // Instance-owned fallback flow context; V3 sets this once and later sends/callbacks re-enter it when ALS is absent.

  /** Register a callback that fires when the underlying socket closes or errors. */
  public onTransportClosed(handler: (why: string) => void): void {
    this.transportCloseHandlers.add(handler);
  }

  /** Remove a callback registered with `onTransportClosed`. */
  public offTransportClosed(handler: (why: string) => void): void {
    this.transportCloseHandlers.delete(handler);
  }

  /** Notify every transport-close listener; a throwing listener never blocks the others. */
  private emitTransportClosed(why: string) {
    for (const h of this.transportCloseHandlers) {
      try {
        h(why);
      } catch {
        //
      }
    }
  }

  private constructor(ws: WebSocket) {
    this.ws = ws;
    this.ws.on("close", (code, reason) => {
      // Reason is a Buffer in ws; stringify defensively
      const why = `socket-close code=${code} reason=${String(reason || "")}`;
      this.rejectAllInflight(why);
      this.emitTransportClosed(why);
    });

    this.ws.on("error", (err) => {
      const why = `socket-error ${err?.message ?? String(err)}`;
      this.rejectAllInflight(why);
      this.emitTransportClosed(why);
    });
    this.ws.on("message", (data) => this.onMessage(data.toString()));
  }

  /**
   * Open a WebSocket to `wsUrl` and wrap it in a `CdpConnection`.
   *
   * @param wsUrl   Browser DevTools WebSocket endpoint.
   * @param options Optional extra handshake headers; they override the defaults.
   * @returns The connected root connection.
   * @throws Whatever error the socket emits before it opens.
   */
  static async connect(
    wsUrl: string,
    options?: { headers?: Record<string, string> },
  ): Promise<CdpConnection> {
    // Include User-Agent header for server-side observability and version tracking
    // Merge user-provided headers, letting them override defaults
    const headers = {
      "User-Agent": `Stagehand/${STAGEHAND_VERSION}`,
      ...options?.headers,
    };
    const ws = new WebSocket(wsUrl, { headers });
    await new Promise<void>((resolve, reject) => {
      ws.once("open", () => resolve());
      ws.once("error", (e) => reject(e));
    });
    return new CdpConnection(ws);
  }

  /** Enable flattened auto-attach (paused on start) and target discovery on the root. */
  async enableAutoAttach(): Promise<void> {
    await this.send("Target.setAutoAttach", {
      autoAttach: true,
      flatten: true,
      waitForDebuggerOnStart: true,
    });
    await this.send("Target.setDiscoverTargets", { discover: true });
  }

  /**
   * Send a root-level (browser) CDP command.
   *
   * @param method CDP method name.
   * @param params Optional method parameters.
   * @returns Promise settled with the response `result`; rejects on a protocol
   *          error, on transport close, or when the frame cannot be sent.
   */
  async send<R = unknown>(method: string, params?: object): Promise<R> {
    const id = this.nextId++;
    const payload = { id, method, params };
    const stack = new Error().stack?.split("\n").slice(1, 4).join("\n");
    const flowLoggerContext = FlowLogger.resolveContext(this.flowLoggerContext);
    const cdpCallEvent = flowLoggerContext
      ? FlowLogger.logCdpCallEvent(flowLoggerContext, {
          method,
          params,
          targetId: null,
        })
      : null;
    if (flowLoggerContext && cdpCallEvent) {
      this.latestCdpCallEvent.set(null, {
        flowLoggerContext,
        cdpCallEvent,
      });
    }
    const p = new Promise<R>((resolve, reject) => {
      this.inflight.set(id, {
        resolve,
        reject,
        sessionId: null,
        method,
        params,
        stack,
        ts: Date.now(),
        flowLoggerContext,
        cdpCallEvent,
      });
    });
    // Prevent unhandledRejection if a session detaches before the caller awaits.
    void p.catch(() => {});
    this.transmit(id, payload);
    return p;
  }

  /** Register a root-level event handler. */
  on<P = unknown>(event: string, handler: (params: P) => void): void {
    const set = this.eventHandlers.get(event) ?? new Set<EventHandler>();
    set.add(handler as EventHandler);
    this.eventHandlers.set(event, set);
  }

  /** Remove a root-level event handler. */
  off<P = unknown>(event: string, handler: (params: P) => void): void {
    const set = this.eventHandlers.get(event);
    if (set) set.delete(handler as EventHandler);
  }

  /** Close the socket and wait for its `close` event (no-op when already closed). */
  async close(): Promise<void> {
    if (this.ws.readyState === WebSocket.CLOSED) return;
    await new Promise<void>((resolve) => {
      this.ws.once("close", () => resolve());
      this.ws.close();
    });
  }

  /** Fail every pending request and dispatch waiter because the transport is gone. */
  private rejectAllInflight(why: string): void {
    for (const [id, entry] of this.inflight.entries()) {
      entry.reject(new CdpConnectionClosedError(why));
      this.inflight.delete(id);
    }
    this.latestCdpCallEvent.clear();
    for (const waiter of Array.from(this.sessionDispatchWaiters)) {
      waiter.reject(new CdpConnectionClosedError(why));
    }
  }

  /**
   * Serialize `payload` and write it to the socket, failing the matching
   * in-flight record if that is impossible.
   *
   * Without this, a frame handed to a socket that is no longer open is dropped
   * silently and the caller's promise would never settle; the record would also
   * stay in `inflight` forever.
   */
  private transmit(id: number, payload: object): void {
    const fail = (error: Error): void => {
      const rec = this.inflight.get(id);
      if (!rec) return; // already settled (e.g. by rejectAllInflight)
      this.inflight.delete(id);
      rec.reject(error);
    };

    let frame: string;
    try {
      frame = JSON.stringify(payload);
    } catch (err) {
      // Unserializable params (cycles, BigInt, ...): surface the original error.
      fail(err instanceof Error ? err : new Error(String(err)));
      return;
    }

    try {
      // The callback receives an error when the frame could not be written,
      // including when the socket has already left the OPEN state.
      this.ws.send(frame, (err) => {
        if (err) {
          fail(
            new CdpConnectionClosedError(`socket-send-failed ${err.message}`),
          );
        }
      });
    } catch (err) {
      const detail = err instanceof Error ? err.message : String(err);
      fail(new CdpConnectionClosedError(`socket-send-failed ${detail}`));
    }
  }

  /**
   * Resolve the target id used when logging traffic for `sessionId`.
   * Root traffic maps to `null`; an unmapped session falls back to its own id.
   */
  private targetIdForSession(sessionId?: string | null): string | null {
    if (!sessionId) return null;
    return this.sessionToTarget.get(sessionId) || sessionId;
  }

  /** Drop every handler set registered for a session that no longer exists. */
  private dropSessionHandlers(sessionId: string): void {
    const prefix = `${sessionId}:`;
    for (const key of Array.from(this.eventHandlers.keys())) {
      if (key.startsWith(prefix)) this.eventHandlers.delete(key);
    }
  }

  /** Look up a known child session by id. */
  getSession(sessionId: string): CdpSession | undefined {
    return this.sessions.get(sessionId);
  }

  /**
   * Wait until a command named `method` (optionally matching `match`) is about
   * to be sent on `sessionId`.
   *
   * @returns Promise that resolves on the first matching send and rejects when
   *          the session detaches or the transport closes first.
   */
  waitForSessionDispatch(
    sessionId: string,
    method: string,
    match?: (params?: object) => boolean,
  ): Promise<void> {
    return new Promise<void>((resolve, reject) => {
      const waiter: SessionDispatchWaiter = {
        sessionId,
        method,
        match,
        resolve: () => {
          this.sessionDispatchWaiters.delete(waiter);
          resolve();
        },
        reject: (error: Error) => {
          this.sessionDispatchWaiters.delete(waiter);
          reject(error);
        },
      };
      this.sessionDispatchWaiters.add(waiter);
    });
  }

  /** Attach (flattened) to `targetId` and return the session object for it. */
  async attachToTarget(targetId: string): Promise<CdpSession> {
    const { sessionId } = (await this.send<{ sessionId: string }>(
      "Target.attachToTarget",
      { targetId, flatten: true },
    )) as { sessionId: string };

    // The attachedToTarget event may already have created the session object.
    let session = this.sessions.get(sessionId);
    if (!session) {
      session = new CdpSession(this, sessionId);
      this.sessions.set(sessionId, session);
    }
    this.sessionToTarget.set(sessionId, targetId);
    return session;
  }

  /** Fetch the browser's current target list. */
  async getTargets(): Promise<Protocol.Target.TargetInfo[]> {
    const res = await this.send<{
      targetInfos: Protocol.Target.TargetInfo[];
    }>("Target.getTargets");
    return res.targetInfos;
  }

  /**
   * Handle one raw frame from the socket: settle the matching in-flight
   * request, or update session bookkeeping and fan the event out to listeners.
   */
  private onMessage(json: string): void {
    let msg: RawMessage;
    try {
      const parsed: unknown = JSON.parse(json);
      // `"id" in x` throws for primitives/null, so only objects may proceed.
      if (typeof parsed !== "object" || parsed === null) return;
      msg = parsed as RawMessage;
    } catch {
      // A frame that is not valid JSON cannot be routed; ignore it instead of
      // letting the exception escape the socket's event listener.
      return;
    }

    if ("id" in msg) {
      const rec = this.inflight.get(msg.id);
      if (!rec) return;

      this.inflight.delete(msg.id);

      if ("error" in msg && msg.error) {
        // Response/error events only make sense if the original send captured
        // both a flow context to re-enter and the emitted CdpCallEvent to hang
        // the terminal edge under.
        if (rec.flowLoggerContext && rec.cdpCallEvent) {
          const targetId = this.targetIdForSession(rec.sessionId);
          FlowLogger.logCdpResponseEvent(
            rec.flowLoggerContext,
            rec.cdpCallEvent,
            {
              method: rec.method,
              error: `${msg.error.code} ${msg.error.message}`,
              targetId,
            },
          );
        }
        rec.reject(new Error(`${msg.error.code} ${msg.error.message}`));
      } else {
        // Successful responses reuse the same cached call context so the
        // response lands under the exact CdpCallEvent emitted at send time.
        if (rec.flowLoggerContext && rec.cdpCallEvent) {
          const targetId = this.targetIdForSession(rec.sessionId);
          FlowLogger.logCdpResponseEvent(
            rec.flowLoggerContext,
            rec.cdpCallEvent,
            {
              method: rec.method,
              result: (msg as { result?: unknown }).result,
              targetId,
            },
          );
        }
        rec.resolve((msg as { result?: unknown }).result);
      }
      return;
    }

    if ("method" in msg) {
      if (msg.method === "Target.attachedToTarget") {
        const p = (msg as { params: Protocol.Target.AttachedToTargetEvent })
          .params;
        if (!this.sessions.has(p.sessionId)) {
          this.sessions.set(p.sessionId, new CdpSession(this, p.sessionId));
        }
        this.sessionToTarget.set(p.sessionId, p.targetInfo.targetId);
      } else if (msg.method === "Target.detachedFromTarget") {
        const p = (msg as { params: Protocol.Target.DetachedFromTargetEvent })
          .params;
        // Requests still waiting on the detached session can never be answered.
        for (const [id, entry] of this.inflight.entries()) {
          if (entry.sessionId === p.sessionId) {
            entry.reject(
              new PageNotFoundError(
                `target closed before CDP response (sessionId=${p.sessionId}, targetId=${p.targetId})`,
              ),
            );
            this.inflight.delete(id);
          }
        }
        for (const waiter of Array.from(this.sessionDispatchWaiters)) {
          if (waiter.sessionId === p.sessionId) {
            waiter.reject(
              new PageNotFoundError(
                `target closed before CDP send (sessionId=${p.sessionId}, targetId=${p.targetId})`,
              ),
            );
          }
        }
        this.sessions.delete(p.sessionId);
        this.sessionToTarget.delete(p.sessionId);
        this.latestCdpCallEvent.delete(p.sessionId);
        // Events are only routed to sessions present in `sessions`, so these
        // handlers are unreachable from now on; release them.
        this.dropSessionHandlers(p.sessionId);
      } else if (msg.method === "Target.targetDestroyed") {
        const p = (msg as { params: { targetId: string } }).params;
        // Remove any session mapping for this target
        for (const [sessionId, targetId] of this.sessionToTarget.entries()) {
          if (targetId === p.targetId) {
            this.sessionToTarget.delete(sessionId);
            this.latestCdpCallEvent.delete(sessionId);
            break;
          }
        }
      }

      const { method, params, sessionId } = msg;
      const latestCdpCallEvent =
        this.latestCdpCallEvent.get(sessionId ?? null) ??
        (sessionId ? this.latestCdpCallEvent.get(null) : null);
      const targetId = this.targetIdForSession(sessionId);

      // Unsolicited protocol messages are attached under the most recent call on
      // that session/root when one is known, so later callbacks still show up
      // in the same flow subtree.
      if (latestCdpCallEvent) {
        FlowLogger.logCdpMessageEvent(
          latestCdpCallEvent.flowLoggerContext,
          latestCdpCallEvent.cdpCallEvent,
          {
            method,
            params,
            targetId,
          },
        );
      }

      const dispatch = () => {
        if (sessionId) {
          const session = this.sessions.get(sessionId);
          session?.dispatch(method, params);

          // Forward target lifecycle events to root listeners as well.
          // Some browsers emit these via a parent session rather than the root
          // connection; fan-out keeps target tracking consistent.
          if (method.startsWith("Target.")) {
            const handlers = this.eventHandlers.get(method);
            if (handlers) for (const h of handlers) h(params);
          }
          return;
        }

        const handlers = this.eventHandlers.get(method);
        if (handlers) for (const h of handlers) h(params);
      };

      if (latestCdpCallEvent) {
        FlowLogger.withContext(latestCdpCallEvent.flowLoggerContext, dispatch);
      } else {
        dispatch();
      }
    }
  }

  /**
   * Send a CDP command on a child session. Used by `CdpSession.send`.
   *
   * Matching `waitForSessionDispatch()` waiters are resolved just before the
   * frame is written. Failures to serialize or write the frame reject the
   * returned promise rather than throwing synchronously.
   */
  _sendViaSession<R = unknown>(
    sessionId: string,
    method: string,
    params?: object,
  ): Promise<R> {
    const id = this.nextId++;
    const payload = { id, method, params, sessionId };
    const stack = new Error().stack?.split("\n").slice(1, 4).join("\n");
    const flowLoggerContext = FlowLogger.resolveContext(this.flowLoggerContext);
    // Unlike response logging, an unmapped session is logged with a null target here.
    const targetId: string | null = this.sessionToTarget.get(sessionId) || null;
    const cdpCallEvent = flowLoggerContext
      ? FlowLogger.logCdpCallEvent(flowLoggerContext, {
          method,
          params,
          targetId,
        })
      : null;
    if (flowLoggerContext && cdpCallEvent) {
      this.latestCdpCallEvent.set(sessionId, {
        flowLoggerContext,
        cdpCallEvent,
      });
    }

    const p = new Promise<R>((resolve, reject) => {
      this.inflight.set(id, {
        resolve,
        reject,
        sessionId,
        method,
        params,
        stack,
        ts: Date.now(),
        flowLoggerContext,
        cdpCallEvent,
      });
    });
    // Prevent unhandledRejection if a session detaches before the caller awaits.
    void p.catch(() => {});
    // Only the first matching waiter is released per outgoing command.
    for (const waiter of Array.from(this.sessionDispatchWaiters)) {
      if (waiter.sessionId !== sessionId) continue;
      if (waiter.method !== method) continue;
      if (waiter.match && !waiter.match(params)) continue;
      waiter.resolve();
      break;
    }
    this.transmit(id, payload);
    return p;
  }

  /** Register a handler for `event` on a specific child session. */
  _onSessionEvent(
    sessionId: string,
    event: string,
    handler: EventHandler,
  ): void {
    const key = `${sessionId}:${event}`;
    const set = this.eventHandlers.get(key) ?? new Set<EventHandler>();
    set.add(handler);
    this.eventHandlers.set(key, set);
  }

  /** Remove a handler registered with `_onSessionEvent`. */
  _offSessionEvent(
    sessionId: string,
    event: string,
    handler: EventHandler,
  ): void {
    const key = `${sessionId}:${event}`;
    const set = this.eventHandlers.get(key);
    if (set) set.delete(handler);
  }

  /** Invoke every handler registered for `event` on the given child session. */
  _dispatchToSession(sessionId: string, event: string, params: unknown): void {
    const key = `${sessionId}:${event}`;
    const handlers = this.eventHandlers.get(key);
    if (handlers) for (const h of handlers) h(params);
  }
}

/**
 * Handle for one flattened child session. It holds no transport of its own:
 * every operation is delegated to the root connection, tagged with this
 * session's id.
 */
export class CdpSession implements CDPSessionLike {
  constructor(
    private readonly root: CdpConnection,
    public readonly id: string,
  ) {}

  /** Send a CDP command on this session through the root connection. */
  send<R = unknown>(method: string, params?: object): Promise<R> {
    const { root, id } = this;
    return root._sendViaSession<R>(id, method, params);
  }

  /** Subscribe `handler` to `event` as emitted on this session. */
  on<P = unknown>(event: string, handler: (params: P) => void): void {
    const listener = handler as EventHandler;
    this.root._onSessionEvent(this.id, event, listener);
  }

  /** Unsubscribe a handler previously passed to `on`. */
  off<P = unknown>(event: string, handler: (params: P) => void): void {
    const listener = handler as EventHandler;
    this.root._offSessionEvent(this.id, event, listener);
  }

  /** Ask the browser (via the root connection) to detach this session. */
  async close(): Promise<void> {
    const detachParams = { sessionId: this.id };
    await this.root.send<void>("Target.detachFromTarget", detachParams);
  }

  /** Deliver an incoming event to the handlers registered for this session. */
  dispatch(event: string, params: unknown): void {
    const { root, id } = this;
    root._dispatchToSession(id, event, params);
  }
}


================================================
FILE: packages/core/lib/v3/understudy/consoleMessage.ts
================================================
import type { Protocol } from "devtools-protocol";
import type { Page } from "./page.js";

/** Shorthand for the CDP description of a JavaScript value. */
type RemoteObject = Protocol.Runtime.RemoteObject;

/** Callback signature that receives a wrapped console message. */
export type ConsoleListener = (message: ConsoleMessage) => void;

/**
 * Render a CDP remote object as display text.
 *
 * When the object carries a `value` key, that value decides the output:
 * `undefined` becomes an empty string, strings pass through unchanged and
 * anything else is JSON-encoded (falling back to `String()` if encoding
 * throws). Otherwise the first non-empty of `unserializableValue`,
 * `description` and `type` is used.
 */
function formatRemoteObject(obj: RemoteObject | undefined): string {
  if (!obj) return "";

  if (!("value" in obj)) {
    return obj.unserializableValue || obj.description || (obj.type ?? "");
  }

  const { value } = obj;
  switch (typeof value) {
    case "undefined":
      return "";
    case "string":
      return value;
    default:
      try {
        return JSON.stringify(value);
      } catch {
        return String(value);
      }
  }
}

/**
 * Read-only view over a `Runtime.consoleAPICalled` event, optionally linked
 * to the page it is associated with.
 */
export class ConsoleMessage {
  constructor(
    private readonly event: Protocol.Runtime.ConsoleAPICalledEvent,
    private readonly pageRef?: Page,
  ) {}

  /** Console API type reported by the event (e.g. the `log`/`error` kind). */
  type(): Protocol.Runtime.ConsoleAPICalledEvent["type"] {
    const { type } = this.event;
    return type;
  }

  /** Space-joined text of all arguments; arguments that format to "" are skipped. */
  text(): string {
    const chunks: string[] = [];
    for (const arg of this.args()) {
      const chunk = formatRemoteObject(arg);
      if (chunk.length > 0) chunks.push(chunk);
    }
    return chunks.join(" ");
  }

  /** Shallow copy of the event's argument list (empty when the event has none). */
  args(): RemoteObject[] {
    const source = this.event.args;
    if (!source) return [];
    return Array.from(source);
  }

  /** Source position taken from the first call frame of the stack trace, if any. */
  location(): { url?: string; lineNumber?: number; columnNumber?: number } {
    const topFrame = this.event.stackTrace?.callFrames?.[0];
    const url = topFrame?.url;
    const lineNumber = topFrame?.lineNumber;
    const columnNumber = topFrame?.columnNumber;
    return { url, lineNumber, columnNumber };
  }

  /** Page supplied at construction time, if one was given. */
  page(): Page | undefined {
    const owner = this.pageRef;
    return owner;
  }

  /** Timestamp carried by the underlying event. */
  timestamp(): number | undefined {
    const { timestamp } = this.event;
    return timestamp;
  }

  /** The untouched CDP event. */
  raw(): Protocol.Runtime.ConsoleAPICalledEvent {
    const original = this.event;
    return original;
  }

  /** Same as `text()`, so the message can be interpolated directly. */
  toString(): string {
    const rendered = this.text();
    return rendered;
  }
}


================================================
FILE: packages/core/lib/v3/understudy/context.ts
================================================
// lib/v3/understudy/context.ts
import type { Protocol } from "devtools-protocol";
import { v3Logger } from "../logger.js";
import { CdpConnection, CDPSessionLike } from "./cdp.js";
import { Page } from "./page.js";
import { installV3PiercerIntoSession } from "./piercer.js";
import { v3ScriptContent } from "../dom/build/scriptV3Content.js";
import { executionContexts } from "./executionContextRegistry.js";
import type { StagehandAPIClient } from "../api.js";
import { LocalBrowserLaunchOptions } from "../types/public/index.js";
import { InitScriptSource } from "../types/private/index.js";
import { normalizeInitScriptSource } from "./initScripts.js";
import {
  TimeoutError,
  CookieSetError,
  PageNotFoundError,
  StagehandSetExtraHTTPHeadersError,
} from "../types/public/sdkErrors.js";
import { getEnvTimeoutMs, withTimeout } from "../timeoutConfig.js";
import {
  filterCookies,
  normalizeCookieParams,
  cookieMatchesFilter,
  toCdpCookieParam,
} from "./cookies.js";
import {
  Cookie,
  ClearCookieOptions,
  CookieParam,
} from "../types/public/context.js";

/** CDP target identifier. */
type TargetId = string;
/** CDP session identifier. */
type SessionId = string;

/** CDP target type; "page" and "iframe" are the ones this module singles out. */
type TargetType = "page" | "iframe" | string;

/**
 * Decide whether a target URL refers to a document with a real, pierceable
 * HTML DOM.
 *
 * This is an allowlist of content-bearing schemes, not a blocklist of browser
 * internals (chrome://, chrome-extension://, devtools://, brave://, edge://, …).
 * A missing or empty URL is treated as injectable.
 */
function hasInjectableDOM(url: string | undefined): boolean {
  if (!url) return true;

  // Exact matches: blank and srcdoc documents.
  if (url === "about:blank" || url === "about:srcdoc") return true;

  // Everything else is accepted purely by prefix.
  const allowedPrefixes = [
    "about:blank#",
    "http://",
    "https://",
    "data:",
    "blob:",
    "file://",
    "filesystem:",
  ];
  return allowedPrefixes.some((prefix) => url.startsWith(prefix));
}

/**
 * True for targets that should not be treated as web content: anything that
 * is neither a page nor an iframe, or whose URL has no injectable DOM.
 */
function isNonWebTarget(info: Protocol.Target.TargetInfo): boolean {
  const isFrameLike = info.type === "page" || info.type === "iframe";
  return !(isFrameLike && hasInjectableDOM(info.url));
}

/**
 * True when the target is of type "page" and does not carry the "iframe"
 * subtype (read through a cast; `subtype` is not on the declared type used here).
 */
function isTopLevelPage(info: Protocol.Target.TargetInfo): boolean {
  if (info.type !== "page") return false;
  const { subtype } = info as unknown as { subtype?: string };
  return subtype !== "iframe";
}

// How long to wait for the first top-level page when no override is configured.
const DEFAULT_FIRST_TOP_LEVEL_PAGE_TIMEOUT_MS = 5000;
// Longer wait used when the CI environment variable is set.
const CI_FIRST_TOP_LEVEL_PAGE_TIMEOUT_MS = 30000;
// Name of the environment variable that overrides both values above.
const FIRST_TOP_LEVEL_PAGE_TIMEOUT_ENV =
  "STAGEHAND_FIRST_TOP_LEVEL_PAGE_TIMEOUT_MS";
// Operation label passed to TimeoutError when the wait expires.
const WAIT_FOR_FIRST_TOP_LEVEL_PAGE_OPERATION =
  "waitForFirstTopLevelPage (no top-level Page)";

/**
 * Pick the timeout for the initial top-level page wait: the environment
 * override when present, otherwise the CI or the default value.
 */
function getFirstTopLevelPageTimeoutMs(): number {
  const override = getEnvTimeoutMs(FIRST_TOP_LEVEL_PAGE_TIMEOUT_ENV);
  if (override != null) return override;

  if (process.env.CI) return CI_FIRST_TOP_LEVEL_PAGE_TIMEOUT_MS;
  return DEFAULT_FIRST_TOP_LEVEL_PAGE_TIMEOUT_MS;
}

/**
 * V3Context
 *
 * Owns the root CDP connection and wires Target/Page events into Page.
 * Maintains one Page per top-level target, adopts OOPIF child sessions into the owner Page,
 * and tracks target→page and (root) frame→target mappings for lookups.
 *
 * IMPORTANT: FrameId → session ownership is managed inside Page (via its FrameRegistry).
 * Context never “guesses” owners; it simply forwards events (with the emitting session)
 * so Page can record the correct owner at event time.
 */
export class V3Context {
  // Private: instances are built through the static `create()` factory.
  private constructor(
    readonly conn: CdpConnection,
    private readonly env: "LOCAL" | "BROWSERBASE" = "LOCAL",
    private readonly apiClient: StagehandAPIClient | null = null,
    private readonly localBrowserLaunchOptions: LocalBrowserLaunchOptions | null = null,
  ) {}

  // Session ids (or "" for a session without id) that already have the piercer installed.
  private readonly _piercerInstalled = new Set<string>();
  // Timestamp for most recent popup/open signal
  private _lastPopupSignalAt = 0;
  // Sessions that already have the Target.* listeners wired, to avoid double registration.
  private readonly _targetSessionListeners = new Set<SessionId>();

  // Session ids that setExtraHTTPHeaders() pushes header updates to.
  // NOTE(review): presumably populated during per-session initialization — confirm.
  private readonly _sessionInit = new Set<SessionId>();
  // Page object per target id.
  private pagesByTarget = new Map<TargetId, Page>();
  // Main frame id -> target id, used to resolve a Page from a main frame id.
  private mainFrameToTarget = new Map<string, TargetId>();
  // NOTE(review): the next three maps are not used in the visible part of the file;
  // by name they track session/frame ownership and pending OOPIF adoption — confirm.
  private sessionOwnerPage = new Map<SessionId, Page>();
  private frameOwnerPage = new Map<string, Page>();
  private pendingOopifByMainFrame = new Map<string, SessionId>();
  // Creation timestamp per target; pages() and activePage() order by it.
  private createdAtByTarget = new Map<TargetId, number>();
  // Target type per target id; "page" marks a top-level page.
  private typeByTarget = new Map<TargetId, TargetType>();
  // Recency list of page targets; the last entry is the active page.
  private _pageOrder: TargetId[] = [];
  // URL recorded by newPage() for a target it created and is waiting to see attached.
  private pendingCreatedTargetUrl = new Map<TargetId, string>();
  // Normalized init script sources registered on the context (deduplicated).
  private readonly initScripts: string[] = [];
  // Last headers passed to setExtraHTTPHeaders(), or null if never set.
  private extraHttpHeaders: Record<string, string> | null = null;

  /**
   * Wire Target.* lifecycle events emitted on `session` into this context.
   * Sessions without an id, and sessions that are already wired, are ignored.
   */
  private installTargetSessionListeners(session: CDPSessionLike): void {
    const sid = session.id;
    if (!sid || this._targetSessionListeners.has(sid)) return;
    this._targetSessionListeners.add(sid);

    const onAttached = (evt: Protocol.Target.AttachedToTargetEvent): void => {
      void this.onAttachedToTarget(evt.targetInfo, evt.sessionId);
    };
    const onDetached = (
      evt: Protocol.Target.DetachedFromTargetEvent,
    ): void => {
      this.onDetachedFromTarget(evt.sessionId, evt.targetId ?? null);
    };
    const onDestroyed = (evt: Protocol.Target.TargetDestroyedEvent): void => {
      this.cleanupByTarget(evt.targetId);
    };

    session.on<Protocol.Target.AttachedToTargetEvent>(
      "Target.attachedToTarget",
      onAttached,
    );
    session.on<Protocol.Target.DetachedFromTargetEvent>(
      "Target.detachedFromTarget",
      onDetached,
    );
    session.on<Protocol.Target.TargetDestroyedEvent>(
      "Target.targetDestroyed",
      onDestroyed,
    );
  }

  /**
   * Create a Context for a given CDP websocket URL and bootstrap target wiring.
   *
   * @param wsUrl Browser DevTools WebSocket endpoint.
   * @param opts  Environment, API client, launch options and extra CDP handshake headers.
   * @returns A context that is bootstrapped and has a first top-level page.
   * @throws Any connect/bootstrap error, or the timeout error when the
   *         Browserbase connect budget (`BROWSERBASE_CDP_CONNECT_MAX_MS`) is exceeded.
   */
  static async create(
    wsUrl: string,
    opts?: {
      env?: "LOCAL" | "BROWSERBASE";
      apiClient?: StagehandAPIClient | null;
      localBrowserLaunchOptions?: LocalBrowserLaunchOptions | null;
      cdpHeaders?: Record<string, string>;
    },
  ): Promise<V3Context> {
    const connectTask = async (): Promise<V3Context> => {
      const conn = await CdpConnection.connect(wsUrl, {
        headers: opts?.cdpHeaders,
      });
      try {
        const ctx = new V3Context(
          conn,
          opts?.env ?? "LOCAL",
          opts?.apiClient ?? null,
          opts?.localBrowserLaunchOptions ?? null,
        );
        await ctx.bootstrap();
        await ctx.ensureFirstTopLevelPage(getFirstTopLevelPageTimeoutMs());
        return ctx;
      } catch (err) {
        // The caller never receives a handle to this connection, so release the
        // socket here (best effort) instead of leaking it.
        void conn.close().catch(() => {});
        throw err;
      }
    };

    // The connect budget only applies to Browserbase sessions.
    const cdpTimeoutMs =
      opts?.env === "BROWSERBASE"
        ? getEnvTimeoutMs("BROWSERBASE_CDP_CONNECT_MAX_MS")
        : undefined;

    if (cdpTimeoutMs) {
      let timedOut = false;
      const connectPromise = connectTask();
      const guarded = withTimeout(
        connectPromise,
        cdpTimeoutMs,
        "Browserbase CDP connect",
      ).catch((err) => {
        timedOut = true;
        throw err;
      });
      // If the connect finishes after the guard already failed, nobody owns
      // the resulting context: close it, ignoring any failure to do so.
      connectPromise
        .then((ctx) => {
          if (timedOut) void ctx.close().catch(() => {});
        })
        .catch(() => {});
      return await guarded;
    }

    return await connectTask();
  }

  /** True when at least one registered Page belongs to a target of type "page". */
  private hasTopLevelPage(): boolean {
    for (const targetId of this.pagesByTarget.keys()) {
      if (this.typeByTarget.get(targetId) === "page") return true;
    }
    return false;
  }

  /**
   * Guarantee that a top-level page exists: wait up to `timeoutMs` for one to
   * appear and, if the wait times out, open an about:blank page. Errors other
   * than the timeout are propagated unchanged.
   */
  private async ensureFirstTopLevelPage(timeoutMs: number): Promise<void> {
    if (this.hasTopLevelPage()) return;

    let waitTimedOut = false;
    try {
      await this.waitForFirstTopLevelPage(timeoutMs);
    } catch (err) {
      if (!(err instanceof TimeoutError)) {
        throw err;
      }
      waitTimedOut = true;
    }
    if (!waitTimedOut) return;

    v3Logger({
      category: "ctx",
      message:
        "No open browser pages found after connect; creating an initial about:blank page",
      level: 1,
    });
    await this.newPage("about:blank");
  }

  /**
   * Wait until at least one top-level Page has been created and registered.
   * We poll internal maps that bootstrap/onAttachedToTarget populate.
   *
   * The condition is checked before every sleep and once more when the
   * deadline is reached, so a page that shows up during the final sleep is
   * still noticed and a non-positive timeout still performs one check.
   *
   * @param timeoutMs Maximum time to wait, in milliseconds.
   * @throws TimeoutError when no top-level page is registered in time.
   */
  private async waitForFirstTopLevelPage(timeoutMs: number): Promise<void> {
    const pollIntervalMs = 25;
    const deadline = Date.now() + timeoutMs;
    for (;;) {
      if (this.hasTopLevelPage()) return;
      const remainingMs = deadline - Date.now();
      if (remainingMs <= 0) break;
      // Never sleep past the deadline.
      await new Promise((r) =>
        setTimeout(r, Math.min(pollIntervalMs, remainingMs)),
      );
    }
    throw new TimeoutError(WAIT_FOR_FIRST_TOP_LEVEL_PAGE_OPERATION, timeoutMs);
  }

  /**
   * Wait (best effort) until every id in `targetIds` has a registered Page.
   *
   * Never throws on timeout: targets still missing at the deadline are only
   * logged. Pending targets are re-checked once the deadline is reached, so a
   * target that attaches during the final sleep is not reported as missing.
   *
   * @param targetIds Targets expected to attach.
   * @param timeoutMs Maximum time to wait, in milliseconds (default 3000).
   */
  private async waitForInitialTopLevelTargets(
    targetIds: TargetId[],
    timeoutMs = 3000,
  ): Promise<void> {
    if (!targetIds.length) return;
    const pollIntervalMs = 25;
    const pending = new Set(targetIds);
    const deadline = Date.now() + timeoutMs;
    for (;;) {
      for (const tid of Array.from(pending)) {
        if (this.pagesByTarget.has(tid)) {
          pending.delete(tid);
        }
      }
      if (!pending.size) return;
      const remainingMs = deadline - Date.now();
      if (remainingMs <= 0) break;
      // Never sleep past the deadline.
      await new Promise((r) =>
        setTimeout(r, Math.min(pollIntervalMs, remainingMs)),
      );
    }
    v3Logger({
      category: "ctx",
      message: "Timed out waiting for existing top-level targets to attach",
      level: 2,
      auxiliary: {
        remainingTargets: {
          value: JSON.stringify(Array.from(pending)),
          type: "object",
        },
      },
    });
  }

  /**
   * Install the piercer into `session` unless it is already recorded as
   * installed. Only successful installs are remembered.
   *
   * @returns true when the piercer is (now) installed, otherwise the
   *          installer's negative result.
   */
  private async ensurePiercer(session: CDPSessionLike): Promise<boolean> {
    const key = session.id ?? "";
    const alreadyInstalled = this._piercerInstalled.has(key);
    if (alreadyInstalled) return true;

    const ok = await installV3PiercerIntoSession(session);
    if (!ok) return ok;

    this._piercerInstalled.add(key);
    return ok;
  }

  /** Move (or append) a page target to the end of the recency list, making it the active one. */
  private _pushActive(tid: TargetId): void {
    // Drop any earlier occurrence so the id appears exactly once, at the tail.
    this._removeFromOrder(tid);
    this._pageOrder.push(tid);
  }

  /** Take a page target out of the recency list, if present (used on close). */
  private _removeFromOrder(tid: TargetId): void {
    const position = this._pageOrder.indexOf(tid);
    if (position === -1) return;
    this._pageOrder.splice(position, 1);
  }

  /**
   * Return the current active Page: the most recent entry of the recency list
   * that still has a Page. Stale ids met on the way are pruned. If the list
   * yields nothing, fall back to the registered page with the newest creation
   * timestamp.
   */
  public activePage(): Page | undefined {
    // Walk the recency list from the tail, discarding ids without a Page.
    let idx = this._pageOrder.length - 1;
    while (idx >= 0) {
      const candidate = this.pagesByTarget.get(this._pageOrder[idx]!);
      if (candidate) return candidate;
      this._pageOrder.splice(idx, 1);
      idx -= 1;
    }

    // Fallback: newest page by creation time (missing timestamps count as 0).
    let latestTid: TargetId | undefined;
    let latestTs = -1;
    for (const tid of this.pagesByTarget.keys()) {
      const createdAt = this.createdAtByTarget.get(tid) ?? 0;
      if (createdAt > latestTs) {
        latestTs = createdAt;
        latestTid = tid;
      }
    }
    if (!latestTid) return undefined;
    return this.pagesByTarget.get(latestTid);
  }

  /**
   * Explicitly mark a known Page as the most-recent active page (and focus it).
   * A Page this context does not know is logged and otherwise ignored.
   */
  public setActivePage(page: Page): void {
    const reportedId = page.targetId();
    let targetId = reportedId;

    // The page's own id may not be the key it is registered under; search by identity.
    const registeredUnderReportedId =
      this.pagesByTarget.get(reportedId) === page;
    if (!registeredUnderReportedId) {
      const resolvedId = this.findTargetIdByPage(page);
      if (!resolvedId) {
        v3Logger({
          category: "ctx",
          message: "setActivePage called with unknown Page",
          level: 2,
          auxiliary: {
            targetId: { value: String(reportedId), type: "string" },
          },
        });
        return;
      }
      targetId = resolvedId;
    }

    this._pushActive(targetId);

    // Bring the tab to the foreground in headful Chrome (best effort).
    const activation = this.conn.send("Target.activateTarget", { targetId });
    void activation.catch(() => {});
  }

  /**
   * Register an init script on the context and on every current top-level
   * page. A script whose normalized source is already registered is ignored.
   *
   * @param script Script source in any supported form.
   * @param arg    Optional argument forwarded to the normalizer.
   */
  public async addInitScript<Arg>(
    script: InitScriptSource<Arg>,
    arg?: Arg,
  ): Promise<void> {
    const source = await normalizeInitScriptSource(script, arg);

    const alreadyRegistered = this.initScripts.indexOf(source) !== -1;
    if (alreadyRegistered) return;
    this.initScripts.push(source);

    const registrations = this.pages().map((openPage) =>
      openPage.registerInitScript(source),
    );
    await Promise.all(registrations);
  }

  /**
   * Store `headers` as the context-wide extra HTTP headers and apply them to
   * every tracked session that the connection still knows.
   *
   * All sessions are attempted; failures are collected and reported together.
   *
   * @throws StagehandSetExtraHTTPHeadersError listing each failing session.
   */
  public async setExtraHTTPHeaders(
    headers: Record<string, string>,
  ): Promise<void> {
    // Copy so later mutation of the caller's object cannot affect stored state.
    const nextHeaders = { ...headers };
    this.extraHttpHeaders = nextHeaders;

    const sessions: CDPSessionLike[] = [];
    this._sessionInit.forEach((sessionId) => {
      const live = this.conn.getSession(sessionId);
      if (live) sessions.push(live);
    });
    if (sessions.length === 0) return;

    const applyTo = async (session: CDPSessionLike): Promise<void> => {
      await session.send("Network.enable");
      await session.send("Network.setExtraHTTPHeaders", {
        headers: nextHeaders,
      });
    };
    const outcomes = await Promise.allSettled(
      sessions.map((session) => applyTo(session)),
    );

    const failures: string[] = [];
    outcomes.forEach((outcome, position) => {
      if (outcome.status !== "rejected") return;
      const reason = outcome.reason as Error;
      const sid = sessions[position]?.id ?? "unknown";
      const message = reason?.message ?? String(reason);
      failures.push(`session=${sid} error=${message}`);
    });

    if (failures.length > 0) {
      throw new StagehandSetExtraHTTPHeadersError(failures);
    }
  }

  /**
   * List the top-level `Page`s ordered by creation time, oldest first.
   * Targets whose recorded type is not "page" (e.g. OOPIFs) are left out.
   */
  pages(): Page[] {
    const topLevel: Array<{ page: Page; created: number }> = [];
    this.pagesByTarget.forEach((page, tid) => {
      if (this.typeByTarget.get(tid) !== "page") return;
      // Targets without a recorded timestamp sort as the oldest.
      const created = this.createdAtByTarget.get(tid) ?? 0;
      topLevel.push({ page, created });
    });
    topLevel.sort((left, right) => left.created - right.created);
    return topLevel.map((entry) => entry.page);
  }

  /**
   * Hand every context-level init script to `page`.
   *
   * With `seedOnly`, scripts go through `page.seedInitScript` synchronously;
   * otherwise each goes through `page.registerInitScript`, one at a time and
   * in registration order.
   */
  private async applyInitScriptsToPage(
    page: Page,
    opts?: { seedOnly?: boolean },
  ): Promise<void> {
    const seedOnly = Boolean(opts?.seedOnly);
    for (const script of this.initScripts) {
      if (seedOnly) {
        page.seedInitScript(script);
      } else {
        await page.registerInitScript(script);
      }
    }
  }

  /**
   * Look up the owning `Page` for a **top-level main frame id**.
   * Child (OOPIF) roots are intentionally absent from this mapping, so they
   * resolve to `undefined`.
   */
  resolvePageByMainFrameId(frameId: string): Page | undefined {
    const owningTarget = this.mainFrameToTarget.get(frameId);
    if (!owningTarget) return undefined;
    return this.pagesByTarget.get(owningTarget);
  }

  /**
   * Produce the protocol-shaped frame tree rooted at a top-level main frame.
   *
   * @param rootMainFrameId Main frame id of a top-level page.
   * @throws PageNotFoundError when no page is registered for that frame id.
   */
  async getFullFrameTreeByMainFrameId(
    rootMainFrameId: string,
  ): Promise<Protocol.Page.FrameTree> {
    const page = this.resolvePageByMainFrameId(rootMainFrameId);
    if (page) {
      return page.asProtocolFrameTree(rootMainFrameId);
    }
    throw new PageNotFoundError(`mainFrameId=${rootMainFrameId}`);
  }

  /**
   * Open a new top-level page (tab) and return its `Page` once the target
   * has been attached and registered in `pagesByTarget`.
   *
   * The target is always created at `about:blank`; when a different URL was
   * requested, navigation is kicked off (without being awaited) after attach.
   *
   * @param url Destination URL; defaults to `about:blank`.
   * @throws TimeoutError if the target is not registered within 5 seconds.
   */
  public async newPage(url = "about:blank"): Promise<Page> {
    const blankUrl = "about:blank";
    const attachTimeoutMs = 5000;
    const pollIntervalMs = 25;
    const requestedUrl = String(url ?? blankUrl);

    // Start at about:blank so init scripts can install before the first real
    // navigation.
    const created = await this.conn.send<{ targetId: string }>(
      "Target.createTarget",
      { url: blankUrl },
    );
    const targetId = created.targetId;
    this.pendingCreatedTargetUrl.set(targetId, blankUrl);

    // Bringing the tab to the front is best-effort; failures are ignored.
    await this.conn.send("Target.activateTarget", { targetId }).catch(() => {});

    // Poll until the attach handler has registered a Page for this target.
    const giveUpAt = Date.now() + attachTimeoutMs;
    while (Date.now() < giveUpAt) {
      const attached = this.pagesByTarget.get(targetId);
      if (!attached) {
        await new Promise((wake) => setTimeout(wake, pollIntervalMs));
        continue;
      }
      if (requestedUrl !== blankUrl) {
        // Record the requested URL in the page cache before navigation
        // events arrive, then navigate fire-and-forget so newPage() resolves
        // on attach rather than on load.
        attached.seedCurrentUrl(requestedUrl);
        void attached
          .sendCDP("Page.navigate", { url: requestedUrl })
          .catch(() => {});
      }
      return attached;
    }
    throw new TimeoutError(
      `newPage: target not attached (${targetId})`,
      attachTimeoutMs,
    );
  }

  /**
   * Close the CDP connection, then empty the target/frame/session lookup
   * maps. Best-effort cleanup.
   */
  async close(): Promise<void> {
    await this.conn.close();
    const registries = [
      this.pagesByTarget,
      this.mainFrameToTarget,
      this.sessionOwnerPage,
      this.frameOwnerPage,
      this.pendingOopifByMainFrame,
      this.createdAtByTarget,
      this.typeByTarget,
      this.pendingCreatedTargetUrl,
    ];
    for (const registry of registries) {
      registry.clear();
    }
  }

  /**
   * Wire up target lifecycle handling for the connection:
   * - subscribe to attach / detach / destroy / create target events;
   * - enable auto-attach once those listeners exist;
   * - explicitly attach to already-existing targets that are not attached;
   * - wait for the initial top-level targets.
   */
  private async bootstrap(): Promise<void> {
    // Auto-attach notifications are the normal way targets reach us.
    this.conn.on<Protocol.Target.AttachedToTargetEvent>(
      "Target.attachedToTarget",
      async ({ targetInfo, sessionId }) => {
        await this.onAttachedToTarget(targetInfo, sessionId);
      },
    );

    // A session went away: drop it from its owner page and the frame graph.
    this.conn.on<Protocol.Target.DetachedFromTargetEvent>(
      "Target.detachedFromTarget",
      ({ sessionId, targetId }) => {
        this.onDetachedFromTarget(sessionId, targetId ?? null);
      },
    );

    // Fallback cleanup keyed by target id when a target is destroyed.
    this.conn.on<Protocol.Target.TargetDestroyedEvent>(
      "Target.targetDestroyed",
      ({ targetId }) => {
        this.cleanupByTarget(targetId);
      },
    );

    // A page target that has an opener counts as a popup signal, which helps
    // active-page selection settle.
    this.conn.on<Protocol.Target.TargetCreatedEvent>(
      "Target.targetCreated",
      async ({ targetInfo }) => {
        if (targetInfo.type !== "page") return;
        if (targetInfo?.openerId || targetInfo?.openerFrameId) {
          this._notePopupSignal();
        }
      },
    );

    // Auto-attach is switched on only now, with listeners in place, so that
    // replayed targets are captured.
    await this.conn.enableAutoAttach();

    const knownTargets = await this.conn.getTargets();
    for (const target of knownTargets) {
      // Targets reported as attached were already handled by auto-attach.
      if (!target.attached) {
        try {
          await this.conn.attachToTarget(target.targetId);
        } catch {
          // ignore attach race
        }
      }
    }

    const initialTopLevelIds = knownTargets
      .filter((target) => isTopLevelPage(target))
      .map((target) => target.targetId);
    await this.waitForInitialTopLevelTargets(initialTopLevelIds);
  }

  /**
   * Handle a newly attached target (top-level or potential OOPIF):
   * - Enable Page domain and lifecycle events.
   * - If top-level → create Page, wire listeners, resume.
   * - Else → probe child root frame id via `Page.getFrameTree` and adopt immediately
   *   if the parent is known; otherwise stage until parent `frameAttached`.
   * - Resume the target only after listeners are wired.
   *
   * Non-web targets are only resumed and otherwise ignored. A session id is
   * initialized at most once (guarded by `_sessionInit`).
   *
   * @param info Target description delivered with the attach event.
   * @param sessionId Id of the CDP session created for this target.
   */
  private async onAttachedToTarget(
    info: Protocol.Target.TargetInfo,
    sessionId: SessionId,
  ): Promise<void> {
    // Skip non-web targets (workers, chrome extensions, background pages, etc.).
    // They still need to be resumed so we don't leave them paused by
    // waitForDebuggerOnStart, but injecting the piercer into these targets
    // can throw or corrupt their internal state (e.g. Chrome's PDF viewer).
    if (isNonWebTarget(info)) {
      const session = this.conn.getSession(sessionId);
      if (session) {
        await session.send("Runtime.runIfWaitingForDebugger").catch(() => {});
      }
      return;
    }

    const session = this.conn.getSession(sessionId);
    if (!session) return;

    // Init guard: each session id is set up at most once.
    if (this._sessionInit.has(sessionId)) return;
    this._sessionInit.add(sessionId);

    this.installTargetSessionListeners(session);

    // Register for Runtime events before enabling it so we don't miss initial contexts.
    executionContexts.attachSession(session);

    // Ensure we only resume once even if multiple code paths hit finally.
    let resumed = false;
    const resume = async (): Promise<void> => {
      if (resumed) return;
      resumed = true;
      // waitForDebuggerOnStart pauses new targets; resume once we've done
      // any "must happen before first document" work.
      await session.send("Runtime.runIfWaitingForDebugger").catch(() => {});
    };

    // Attach lifecycle (per target session):
    // 1) while paused, enable domains + child auto-attach and register init scripts;
    // 2) resume target execution;
    // 3) build/adopt Page ownership and frame bridges.
    // Some CDP backends defer *.enable() responses until after resume, so we
    // cannot await those responses before resuming. Instead we:
    // - wait for transport-level dispatch of required pre-resume commands;
    // - then dispatch resume;
    // - then await responses.
    //
    // queuePreResume sends one command and returns two promises that never
    // reject: `dispatched` settles from conn.waitForSessionDispatch, and
    // `response` settles from session.send; each resolves to true on
    // success and false on failure.
    const queuePreResume = (
      method: string,
      params?: object,
      match?: (sentParams?: object) => boolean,
    ) => {
      const dispatched = this.conn
        .waitForSessionDispatch(sessionId, method, match)
        .then(() => true)
        .catch(() => false);
      const response = session
        .send(method, params)
        .then(() => true)
        .catch(() => false);
      return { dispatched, response };
    };
    const initScriptOps: Array<{
      dispatched: Promise<boolean>;
      response: Promise<boolean>;
    }> = [];
    // Pre-resume ordering matters:
    // - enable domains;
    // - enable child auto-attach with waitForDebuggerOnStart;
    // - register init scripts.
    // Commands are sent in-order on the same session before resume.
    const corePreResumeOps = [
      queuePreResume("Page.enable"),
      queuePreResume("Runtime.enable"),
      queuePreResume("Target.setAutoAttach", {
        autoAttach: true,
        waitForDebuggerOnStart: true,
        flatten: true,
      }),
    ];
    const headerPreResumeOps: Array<{
      dispatched: Promise<boolean>;
      response: Promise<boolean>;
    }> = [];
    // Extra HTTP headers are only queued when the context has some configured;
    // a shallow copy is sent.
    if (this.extraHttpHeaders) {
      const headers = { ...this.extraHttpHeaders };
      headerPreResumeOps.push(queuePreResume("Network.enable"));
      headerPreResumeOps.push(
        queuePreResume("Network.setExtraHTTPHeaders", { headers }),
      );
    }
    // Send init scripts only after auto-attach has been queued.
    if (this.initScripts.length) {
      for (const source of this.initScripts) {
        initScriptOps.push(
          queuePreResume(
            "Page.addScriptToEvaluateOnNewDocument",
            {
              source,
              runImmediately: true,
            },
            // Several commands share this method name, so the dispatch wait
            // is matched on the exact script source.
            (sentParams) =>
              (sentParams as { source?: string } | undefined)?.source ===
              source,
          ),
        );
      }
    }
    // The piercer script is queued the same way, matched on its own source.
    const piercerPreloadOp = queuePreResume(
      "Page.addScriptToEvaluateOnNewDocument",
      {
        source: v3ScriptContent,
        runImmediately: true,
      },
      (sentParams) =>
        (sentParams as { source?: string } | undefined)?.source ===
        v3ScriptContent,
    );
    // True only if every pre-resume command reported a successful dispatch.
    const preResumeDispatched = (
      await Promise.all([
        ...corePreResumeOps.map((op) => op.dispatched),
        ...headerPreResumeOps.map((op) => op.dispatched),
        ...initScriptOps.map((op) => op.dispatched),
        piercerPreloadOp.dispatched,
      ])
    ).every(Boolean);
    // Dispatch resume only after pre-resume setup has actually been sent.
    const resumeOp = queuePreResume("Runtime.runIfWaitingForDebugger");
    const [resumedDispatched, resumedOk] = await Promise.all([
      resumeOp.dispatched,
      resumeOp.response,
    ]);
    // With resume sent, collect the responses of all pre-resume commands.
    const [
      coreResults,
      headerResults,
      initScriptResults,
      piercerPreRegistered,
    ] = await Promise.all([
      Promise.all(corePreResumeOps.map((op) => op.response)),
      Promise.all(headerPreResumeOps.map((op) => op.response)),
      Promise.all(initScriptOps.map((op) => op.response)),
      piercerPreloadOp.response,
    ]);
    // Header propagation is independent of init-script determinism but still
    // part of pre-resume attach setup; awaited above for ordering/lifecycle.
    void headerResults;
    if (!preResumeDispatched || !resumedDispatched || !resumedOk) {
      // Short-lived child targets can detach before resume is acknowledged.
      // Keep this noisy only for top-level pages where missing attach is fatal.
      if (isTopLevelPage(info)) {
        v3Logger({
          category: "ctx",
          message: "Failed target pre-resume setup ordering",
          level: 2,
          auxiliary: {
            targetId: { value: String(info.targetId), type: "string" },
            targetType: { value: String(info.type), type: "string" },
            preResumeDispatched: {
              value: String(preResumeDispatched),
              type: "string",
            },
            resumedDispatched: {
              value: String(resumedDispatched),
              type: "string",
            },
            resumedOk: { value: String(resumedOk), type: "string" },
          },
        });
      }
      // Setup is abandoned here: no Page is created or adopted for this session.
      return;
    }
    // The resume command was already sent and acknowledged above, so flag it;
    // this turns the `resume()` call in the `finally` below into a no-op.
    resumed = true;
    // Scripts count as installed only when every core command and every
    // init-script registration got a successful response.
    const scriptsInstalled =
      coreResults.every(Boolean) && initScriptResults.every(Boolean);

    try {
      // Best-effort lifecycle events; do not block top-level page registration
      // on this optional signal stream.
      void session
        .send("Page.setLifecycleEventsEnabled", { enabled: true })
        .catch(() => {});

      // Top-level handling
      if (isTopLevelPage(info)) {
        let page: Page | null = null;
        let createError: unknown;
        // Deterministic contract: never drop a newly attached top-level target
        // because an arbitrary local timeout fired. We wait for Page.create and
        // let it finish regardless of CDP call latency.
        try {
          page = await Page.create(
            this.conn,
            session,
            info.targetId,
            this.apiClient,
            this.localBrowserLaunchOptions,
            this.env === "BROWSERBASE",
          );
        } catch (error) {
          createError = error;
        }
        if (!page) {
          // Page creation failed: log the cause and leave the target unregistered.
          v3Logger({
            category: "ctx",
            message: "Failed to create top-level Page",
            level: 2,
            auxiliary: {
              targetId: { value: String(info.targetId), type: "string" },
              targetType: { value: String(info.type), type: "string" },
              targetUrl: { value: String(info.url ?? ""), type: "string" },
              error: {
                value: String(
                  createError instanceof Error
                    ? createError.message
                    : createError,
                ),
                type: "string",
              },
            },
          });
          return;
        }
        // Register the new page in every lookup table.
        this.wireSessionToOwnerPage(sessionId, page);
        this.pagesByTarget.set(info.targetId, page);
        this.mainFrameToTarget.set(page.mainFrameId(), info.targetId);
        this.sessionOwnerPage.set(sessionId, page);
        this.frameOwnerPage.set(page.mainFrameId(), page);
        this.typeByTarget.set(info.targetId, "page");
        // Keep an existing creation timestamp if one was already recorded.
        if (!this.createdAtByTarget.has(info.targetId)) {
          this.createdAtByTarget.set(info.targetId, Date.now());
        }
        // A URL recorded by newPage() for this target takes precedence over
        // the URL reported in the attach event.
        const pendingSeedUrl = this.pendingCreatedTargetUrl.get(info.targetId);
        this.pendingCreatedTargetUrl.delete(info.targetId);
        page.seedCurrentUrl(pendingSeedUrl ?? info.url ?? "");
        this._pushActive(info.targetId);
        this.installFrameEventBridges(sessionId, page);
        if (piercerPreRegistered) {
          this._piercerInstalled.add(sessionId);
        }
        // If we already installed scripts at the session level, only seed the
        // Page's registry to avoid double-installing DOMContentLoaded handlers.
        await this.applyInitScriptsToPage(page, {
          seedOnly: scriptsInstalled,
        });
        // Fall back to a late piercer install when pre-registration failed.
        if (!piercerPreRegistered) {
          void this.ensurePiercer(session).catch(() => {});
        }

        return;
      }

      // Non-top-level targets need the piercer before they can be adopted.
      const piercerReady = await this.ensurePiercer(session).catch(() => false);
      if (!piercerReady) return;

      // Child (iframe / OOPIF)
      try {
        const { frameTree } =
          await session.send<Protocol.Page.GetFrameTreeResponse>(
            "Page.getFrameTree",
          );
        const childMainId = frameTree.frame.id;

        // Try to find owner Page now (it may already have the node in its tree)
        let owner = this.frameOwnerPage.get(childMainId);
        if (!owner) {
          // No direct mapping: search every known page's frame tree for the id.
          for (const p of this.pagesByTarget.values()) {
            const tree = p.asProtocolFrameTree(p.mainFrameId());
            const has = (function find(n: Protocol.Page.FrameTree): boolean {
              if (n.frame.id === childMainId) return true;
              for (const c of n.childFrames ?? []) if (find(c)) return true;
              return false;
            })(tree);
            if (has) {
              owner = p;
              break;
            }
          }
        }

        if (owner) {
          owner.adoptOopifSession(session, childMainId);
          this.sessionOwnerPage.set(sessionId, owner);
          this.installFrameEventBridges(sessionId, owner);
          // Prime the execution-context registry so later lookups succeed even if
          // the frame navigates before we issue a command.
          void executionContexts
            .waitForMainWorld(session, childMainId)
            .catch(() => {});
        } else {
          // Owner not known yet: stage the session until a parent reports
          // this frame id through Page.frameAttached.
          this.pendingOopifByMainFrame.set(childMainId, sessionId);
        }
      } catch {
        // page.getFrameTree failed. Most likely was an ad iframe
        // that opened & closed before we could attach. ignore
      }
    } finally {
      await resume();
    }
  }

  /**
   * React to a session detaching from its target:
   * - release the session from its owning page, if it has one;
   * - when the target id maps to a registered top-level page, clean it up;
   * - forget any staged (pending) child entry that points at this session;
   * - drop the per-session bookkeeping entries.
   */
  private onDetachedFromTarget(
    sessionId: SessionId,
    targetId: string | null,
  ): void {
    const owningPage = this.sessionOwnerPage.get(sessionId);
    if (owningPage) {
      owningPage.detachOopifSession(sessionId);
      this.sessionOwnerPage.delete(sessionId);
    }

    const isRegisteredPage = targetId && this.pagesByTarget.has(targetId);
    if (isRegisteredPage) {
      this.cleanupByTarget(targetId);
    }

    // Collect first, delete afterwards, so the map is not mutated mid-scan.
    const stagedFrameIds = Array.from(this.pendingOopifByMainFrame.entries())
      .filter(([, stagedSessionId]) => stagedSessionId === sessionId)
      .map(([frameId]) => frameId);
    for (const frameId of stagedFrameIds) {
      this.pendingOopifByMainFrame.delete(frameId);
    }

    this._targetSessionListeners.delete(sessionId);
    this._sessionInit.delete(sessionId);
    this._piercerInstalled.delete(sessionId);
  }

  /**
   * Forget a top-level page identified by its target id: its root frame
   * mappings, every session it owns, staged child entries, and its per-target
   * bookkeeping. Does nothing when the target has no registered page.
   */
  private cleanupByTarget(targetId: TargetId): void {
    const doomed = this.pagesByTarget.get(targetId);
    if (!doomed) return;

    const rootFrameId = doomed.mainFrameId();
    this.mainFrameToTarget.delete(rootFrameId);
    this.frameOwnerPage.delete(rootFrameId);

    // Release every session owned by this page (iterating over a snapshot).
    Array.from(this.sessionOwnerPage.entries()).forEach(
      ([ownedSessionId, ownerPage]) => {
        if (ownerPage === doomed) {
          this.sessionOwnerPage.delete(ownedSessionId);
        }
      },
    );

    // Drop staged children whose frame has no owner or is owned by this page.
    Array.from(this.pendingOopifByMainFrame.keys()).forEach((stagedFrameId) => {
      const frameOwner = this.frameOwnerPage.get(stagedFrameId);
      if (!frameOwner || frameOwner === doomed) {
        this.pendingOopifByMainFrame.delete(stagedFrameId);
      }
    });

    this._removeFromOrder(targetId);
    this.pagesByTarget.delete(targetId);
    this.createdAtByTarget.delete(targetId);
    this.typeByTarget.delete(targetId);
    this.pendingCreatedTargetUrl.delete(targetId);
  }

  /**
   * Subscribe to a session's Page-domain frame events and forward them to the
   * owning `Page`, keeping this context's frame/target mappings in sync.
   * The emitting session is passed along with each forwarded event so the
   * Page can attribute ownership precisely. No-op if the session is unknown.
   */
  private installFrameEventBridges(sessionId: SessionId, owner: Page): void {
    const emitter = this.conn.getSession(sessionId);
    if (!emitter) return;

    emitter.on<Protocol.Page.FrameAttachedEvent>(
      "Page.frameAttached",
      (evt) => {
        const attachedId = evt.frameId;
        const parentId = evt.parentFrameId;

        owner.onFrameAttached(attachedId, parentId ?? null, emitter);

        // A child session staged under this frame id can be adopted now.
        const stagedSessionId = this.pendingOopifByMainFrame.get(attachedId);
        if (stagedSessionId) {
          const stagedSession = this.conn.getSession(stagedSessionId);
          if (stagedSession) {
            owner.adoptOopifSession(stagedSession, attachedId);
            this.sessionOwnerPage.set(stagedSession.id, owner);
            // Bridge the adopted child too so its Page events keep flowing.
            this.installFrameEventBridges(stagedSessionId, owner);
          }
          this.pendingOopifByMainFrame.delete(attachedId);
        }

        // Remember which Page owns the frame (reverse lookups / debugging).
        this.frameOwnerPage.set(attachedId, owner);

        if (parentId) return;

        // Root handoff: re-point mainFrameToTarget at the page's current root.
        const rootId = owner.mainFrameId();
        const ownerTargetId = this.findTargetIdByPage(owner);
        if (ownerTargetId) {
          this.mainFrameToTarget.set(rootId, ownerTargetId);
        }
        this.frameOwnerPage.set(rootId, owner);
      },
    );

    emitter.on<Protocol.Page.FrameDetachedEvent>(
      "Page.frameDetached",
      (evt) => {
        const { frameId, reason } = evt;
        owner.onFrameDetached(frameId, reason ?? "remove");
        // A "swap" detach keeps the frame id's ownership entry.
        if (reason !== "swap") {
          this.frameOwnerPage.delete(frameId);
        }
      },
    );

    emitter.on<Protocol.Page.FrameNavigatedEvent>(
      "Page.frameNavigated",
      (evt) => {
        owner.onFrameNavigated(evt.frame, emitter);
      },
    );

    emitter.on<Protocol.Page.NavigatedWithinDocumentEvent>(
      "Page.navigatedWithinDocument",
      (evt) => {
        owner.onNavigatedWithinDocument(evt.frameId, evt.url, emitter);
      },
    );

    // window.open is treated as a popup signal for active-page selection.
    emitter.on<Protocol.Page.WindowOpenEvent>("Page.windowOpen", () => {
      this._notePopupSignal();
    });
  }

  /**
   * Register that a session belongs to a Page (used by event routing).
   *
   * Stores the pair in `sessionOwnerPage`, replacing any previous owner
   * recorded for the same session id.
   *
   * @param sessionId Session to associate.
   * @param owner Page that owns the session.
   */
  private wireSessionToOwnerPage(sessionId: SessionId, owner: Page): void {
    this.sessionOwnerPage.set(sessionId, owner);
  }

  /**
   * Reverse lookup: find the target id under which a given `Page` instance is
   * registered. Returns `undefined` when the page is not registered.
   */
  private findTargetIdByPage(page: Page): TargetId | undefined {
    const match = Array.from(this.pagesByTarget.entries()).find(
      ([, candidate]) => candidate === page,
    );
    return match ? match[0] : undefined;
  }

  /**
   * Record "now" as the time of the most recent popup signal.
   * `awaitActivePage` compares against this timestamp to decide whether to
   * wait for a newly opened page.
   */
  private _notePopupSignal(): void {
    this._lastPopupSignalAt = Date.now();
  }

  /**
   * Resolve the page that should be treated as active.
   *
   * Without a recent popup signal the current active page is returned right
   * away. Otherwise this polls (every 25 ms, up to `timeoutMs`) for the
   * newest registered page whose creation time is not older than the last
   * popup signal, falling back to the previously active page on timeout.
   *
   * @param timeoutMs Maximum wait; defaults to 4000 ms on Browserbase and
   *   2000 ms elsewhere.
   * @throws PageNotFoundError when no page is available at all.
   */
  async awaitActivePage(timeoutMs?: number): Promise<Page> {
    const onBrowserbase = this.env === "BROWSERBASE";
    const budgetMs = timeoutMs ?? (onBrowserbase ? 4000 : 2000);
    // After a popup, Chrome (especially on Browserbase) may briefly hold the
    // new target paused at document start ("waiting for debugger").
    const popupWindowMs = onBrowserbase ? 1000 : 300;
    const startedAt = Date.now();
    const popupIsRecent = startedAt - this._lastPopupSignalAt <= popupWindowMs;

    const current = this.activePage();
    if (current && !popupIsRecent) return current;

    const deadline = startedAt + budgetMs;
    while (Date.now() < deadline) {
      // Find the page with the greatest creation timestamp (first one wins
      // on ties).
      let candidateId: TargetId | undefined;
      let candidateCreatedAt = -1;
      for (const targetId of this.pagesByTarget.keys()) {
        const createdAt = this.createdAtByTarget.get(targetId) ?? 0;
        if (createdAt > candidateCreatedAt) {
          candidateCreatedAt = createdAt;
          candidateId = targetId;
        }
      }
      if (candidateId) {
        const candidate = this.pagesByTarget.get(candidateId);
        const isFreshEnough = candidateCreatedAt >= this._lastPopupSignalAt;
        if (candidate && isFreshEnough) return candidate;
      }
      await new Promise((wake) => setTimeout(wake, 25));
    }
    if (current) return current;
    throw new PageNotFoundError("awaitActivePage: no page available");
  }

  /**
   * Read the browser's cookies, optionally restricted to given URL(s).
   *
   * With `urls` omitted or empty, every cookie returned by
   * `Storage.getCookies` is included. With one or more URLs, only cookies
   * whose domain/path/secure attributes match at least one URL are kept.
   *
   * @param urls A single URL or a list of URLs to filter by.
   */
  async cookies(urls?: string | string[]): Promise<Cookie[]> {
    let urlFilter: string[];
    if (!urls) {
      urlFilter = [];
    } else if (typeof urls === "string") {
      urlFilter = [urls];
    } else {
      urlFilter = urls;
    }

    const response = await this.conn.send<{
      cookies: Protocol.Network.Cookie[];
    }>("Storage.getCookies");

    const all = response.cookies.map((raw): Cookie => {
      const { name, value, domain, path, expires, httpOnly, secure } = raw;
      return {
        name,
        value,
        domain,
        path,
        expires,
        httpOnly,
        secure,
        // Cookies reported without a sameSite value are surfaced as "Lax".
        sameSite: (raw.sameSite as Cookie["sameSite"]) ?? "Lax",
      };
    });

    return filterCookies(all, urlFilter);
  }

  /**
   * Store one or more cookies in the browser context.
   *
   * Every cookie needs either a `url` (domain/path/secure are derived from
   * it) or an explicit `domain` + `path` pair; validation happens before
   * anything is sent. An empty list is a no-op.
   *
   * @throws CookieSetError when the browser rejects the batch; the CDP error
   *   text is included in the message.
   */
  async addCookies(cookies: CookieParam[]): Promise<void> {
    const prepared = normalizeCookieParams(cookies);
    if (prepared.length === 0) return;

    const payload = prepared.map(toCdpCookieParam);

    try {
      await this.conn.send("Storage.setCookies", { cookies: payload });
    } catch (err) {
      const cdpDetail = err instanceof Error ? err.message : String(err);
      const quotedNames = prepared
        .map((cookie) => `"${cookie.name}"`)
        .join(", ");
      const suffix = cdpDetail ? ` (CDP error: ${cdpDetail})` : "";
      throw new CookieSetError(
        `Failed to set cookies [${quotedNames}] — the browser rejected the batch. Check that the domain, path, and secure/sameSite values are valid.${suffix}`,
      );
    }
  }

  /**
   * Remove cookies from the browser context.
   *
   * - No filter (`name`, `domain`, `path` all undefined): everything is wiped
   *   with a single `Storage.clearCookies` call.
   * - With a filter: all cookies are read, the jar is cleared, and the
   *   cookies that do NOT match the filter are written back with
   *   `Storage.setCookies`, because the Storage domain on the browser
   *   endpoint has no targeted delete. Nothing is sent when no cookie
   *   matches the filter.
   *
   * @throws CookieSetError if re-adding the kept cookies fails; at that point
   *   the cookie jar has already been emptied.
   */
  async clearCookies(options?: ClearCookieOptions): Promise<void> {
    const filterGiven = [options?.name, options?.domain, options?.path].some(
      (criterion) => criterion !== undefined,
    );

    if (!options || !filterGiven) {
      // One atomic call: no race window and no per-cookie roundtrips.
      await this.conn.send("Storage.clearCookies");
      return;
    }

    const existing = await this.cookies();
    const survivors = existing.filter(
      (cookie) => !cookieMatchesFilter(cookie, options),
    );

    // Nothing matched the filter, so there is nothing to remove.
    if (survivors.length === existing.length) return;

    // Wipe the jar, then restore only the cookies that should remain.
    await this.conn.send("Storage.clearCookies");
    if (survivors.length === 0) return;

    try {
      await this.conn.send("Storage.setCookies", {
        cookies: survivors.map(toCdpCookieParam),
      });
    } catch (err) {
      const cdpDetail = err instanceof Error ? err.message : String(err);
      const quotedNames = survivors
        .map((cookie) => `"${cookie.name}"`)
        .join(", ");
      const suffix = cdpDetail ? `(CDP error: ${cdpDetail})` : "";
      throw new CookieSetError(
        `clearCookies: cookies were cleared but failed to re-add the ${survivors.length} non-matching cookie(s) [${quotedNames}]. The browser cookie jar is now empty. ${suffix}`,
      );
    }
  }
}


================================================
FILE: packages/core/lib/v3/understudy/cookies.ts
================================================
import {
  Cookie,
  CookieParam,
  ClearCookieOptions,
} from "../types/public/context.js";
import { CookieValidationError } from "../types/public/sdkErrors.js";

/**
 * Helpers for browser cookie management.
 *
 * Mirrors Playwright's cookie API surface, adapted for direct CDP usage
 * against a single default browser context.
 */

/**
 * Keep only the cookies that apply to at least one of the given URLs,
 * judged by domain, path and the secure flag.
 *
 * @param cookies Cookies to filter.
 * @param urls URLs to match against; an empty list returns `cookies` as-is.
 * @throws CookieValidationError if any entry in `urls` cannot be parsed.
 */
export function filterCookies(cookies: Cookie[], urls: string[]): Cookie[] {
  if (urls.length === 0) return cookies;

  // Parse every URL up front so an invalid one fails before any filtering.
  const targets: URL[] = [];
  for (const candidate of urls) {
    let parsedUrl: URL;
    try {
      parsedUrl = new URL(candidate);
    } catch {
      throw new CookieValidationError(
        `Invalid URL passed to cookies(): "${candidate}"`,
      );
    }
    targets.push(parsedUrl);
  }

  const appliesTo = (cookie: Cookie, url: URL): boolean => {
    // Compare dot-prefixed forms so "example.com" also covers subdomains
    // without matching "notexample.com".
    const dottedDomain = cookie.domain.startsWith(".")
      ? cookie.domain
      : "." + cookie.domain;
    if (!("." + url.hostname).endsWith(dottedDomain)) return false;

    // The cookie path must match on a "/" boundary: "/foo" covers "/foo" and
    // "/foo/bar" but not "/foobar".
    const requestPath = url.pathname;
    const cookiePath = cookie.path;
    if (!requestPath.startsWith(cookiePath)) return false;
    const stopsMidSegment =
      cookiePath.length < requestPath.length &&
      !cookiePath.endsWith("/") &&
      requestPath[cookiePath.length] !== "/";
    if (stopsMidSegment) return false;

    // Secure cookies need https, except on loopback hosts.
    if (!cookie.secure) return true;
    if (url.protocol === "https:") return true;
    return (
      url.hostname === "localhost" ||
      url.hostname === "127.0.0.1" ||
      url.hostname === "[::1]"
    );
  };

  return cookies.filter((cookie) =>
    targets.some((url) => appliesTo(cookie, url)),
  );
}

/**
 * Validate `CookieParam` values and bring them into the shape sent to CDP.
 *
 * - Each cookie must carry either `url`, or both `domain` and `path` — and
 *   not `url` together with `domain` or `path`.
 * - Negative `expires` values other than -1 are rejected.
 * - A `url` is replaced by the `domain`, `path` and `secure` derived from it.
 * - `sameSite: "None"` requires a truthy `secure` (browsers silently reject
 *   the combination otherwise, so it is reported early).
 *
 * Input objects are not mutated; shallow copies are returned.
 *
 * @throws CookieValidationError on the first cookie that fails validation.
 */
export function normalizeCookieParams(cookies: CookieParam[]): CookieParam[] {
  const normalized: CookieParam[] = [];

  for (const original of cookies) {
    const label = `Cookie "${original.name}"`;
    const { domain, path, expires } = original;

    if (!original.url) {
      if (!(domain && path)) {
        throw new CookieValidationError(
          `${label} must have a url or a domain/path pair`,
        );
      }
    } else {
      if (domain) {
        throw new CookieValidationError(
          `${label} should have either url or domain, not both`,
        );
      }
      if (path) {
        throw new CookieValidationError(
          `${label} should have either url or path, not both`,
        );
      }
    }

    const hasBadExpiry = expires !== undefined && expires < 0 && expires !== -1;
    if (hasBadExpiry) {
      throw new CookieValidationError(
        `${label} has an invalid expires value; use -1 for session cookies or a positive unix timestamp`,
      );
    }

    const copy = { ...original };
    const rawUrl = copy.url;
    if (rawUrl) {
      if (rawUrl === "about:blank") {
        throw new CookieValidationError(
          `Blank page cannot have cookie "${original.name}"`,
        );
      }
      if (rawUrl.startsWith("data:")) {
        throw new CookieValidationError(
          `Data URL page cannot have cookie "${original.name}"`,
        );
      }
      let parsedUrl: URL;
      try {
        parsedUrl = new URL(rawUrl);
      } catch {
        throw new CookieValidationError(
          `${label} has an invalid url: "${rawUrl}"`,
        );
      }
      // The cookie path is the URL path up to and including its last "/".
      const lastSlash = parsedUrl.pathname.lastIndexOf("/");
      copy.domain = parsedUrl.hostname;
      copy.path = parsedUrl.pathname.substring(0, lastSlash + 1);
      copy.secure = parsedUrl.protocol === "https:";
      delete copy.url;
    }

    // `!copy.secure` covers both an explicit false and an omitted flag, since
    // CDP treats an omitted `secure` as false.
    if (copy.sameSite === "None" && !copy.secure) {
      throw new CookieValidationError(
        `${label} has sameSite: "None" without secure: true. ` +
          `Browsers require secure: true when sameSite is "None".`,
      );
    }

    normalized.push(copy);
  }

  return normalized;
}

/**
 * Convert a `Cookie` or `CookieParam` into the object passed to CDP's
 * `Storage.setCookies`. An `expires` of -1 (session cookie) is emitted as
 * `undefined` so CDP treats the cookie as session-scoped; all other fields
 * are copied through unchanged.
 */
export function toCdpCookieParam(
  c: Cookie | CookieParam,
): Record<string, unknown> {
  const { name, value, domain, path, httpOnly, secure, sameSite } = c;
  const isSessionCookie = c.expires === -1;
  return {
    name,
    value,
    domain,
    path,
    expires: isSessionCookie ? undefined : c.expires,
    httpOnly,
    secure,
    sameSite,
  };
}

/**
 * Decide whether a cookie satisfies every criterion present in `options`.
 * A criterion left `undefined` matches anything; a string must equal the
 * cookie's field exactly; a `RegExp` is tested against the field.
 */
export function cookieMatchesFilter(
  cookie: Cookie,
  options: ClearCookieOptions,
): boolean {
  const fields = ["name", "domain", "path"] as const;
  return fields.every((field) => {
    const expected = options[field];
    if (expected === undefined) return true;
    if (!(expected instanceof RegExp)) return cookie[field] === expected;
    // Reset lastIndex so global/sticky regexes give the same answer each call.
    expected.lastIndex = 0;
    return expected.test(cookie[field]);
  });
}


================================================
FILE: packages/core/lib/v3/understudy/deepLocator.ts
================================================
import { Locator } from "./locator.js";
import type { Frame } from "./frame.js";
import type { Page } from "./page.js";
import { FrameLocator, frameLocatorFromFrame } from "./frameLocator.js";
import { StagehandInvalidArgumentError } from "../types/public/sdkErrors.js";
import { IFRAME_STEP_RE } from "./a11y/snapshot/focusSelectors.js";

/** How a step connects to the one before it: "child" for '/', "desc" for '//'. */
type Axis = "child" | "desc";
/**
 * One parsed XPath step. `raw` is the step text as written (predicates
 * included); `name` is `raw` lowercased with a trailing numeric `[n]` index
 * removed.
 */
type Step = { axis: Axis; raw: string; name: string };

/** A frame paired with the selector string to be used inside that frame. */
export type ResolvedLocatorTarget = {
  frame: Frame;
  selector: string;
};

/**
 * Parse an XPath into steps, preserving '/' vs '//' and the raw token
 * (with its predicates, e.g. `[n]`).
 *
 * A '/' only separates steps when it sits outside a `[...]` predicate, so a
 * slash inside a predicate string literal (e.g. `//a[@href='/docs/x']`) stays
 * part of its step instead of producing bogus extra steps. Quotes are only
 * interpreted inside predicates.
 *
 * @param path XPath expression; surrounding whitespace is ignored.
 * @returns The steps in order. Empty segments (e.g. a trailing '/') are
 *   skipped. A first step with no leading slash gets the "child" axis.
 */
function parseXPath(path: string): Step[] {
  const s = path.trim();
  let i = 0;
  const steps: Step[] = [];
  while (i < s.length) {
    let axis: Axis = "child";
    if (s.startsWith("//", i)) {
      axis = "desc";
      i += 2;
    } else if (s.charAt(i) === "/") {
      axis = "child";
      i += 1;
    }

    // Scan to the next step separator, tracking predicate nesting and string
    // literals so that slashes inside them are not treated as separators.
    const start = i;
    let depth = 0;
    let quote: string | null = null;
    for (; i < s.length; i++) {
      const ch = s.charAt(i);
      if (quote !== null) {
        if (ch === quote) quote = null;
        continue;
      }
      if (depth > 0 && (ch === '"' || ch === "'")) {
        quote = ch;
        continue;
      }
      if (ch === "[") {
        depth++;
      } else if (ch === "]") {
        if (depth > 0) depth--;
      } else if (ch === "/" && depth === 0) {
        break;
      }
    }

    const raw = s.slice(start, i).trim();
    if (!raw) continue;

    // The name drops only a trailing positional index such as "[2]".
    const name = raw.replace(/\[\d+\]\s*$/u, "").toLowerCase();
    steps.push({ axis, raw, name });
  }
  return steps;
}

/**
 * Serialize parsed steps back into an XPath string.
 *
 * Every step contributes its separator ('//' for "desc", '/' otherwise)
 * followed by its raw token, so predicates are emitted untouched. An empty
 * step list yields "/".
 */
function buildXPathFromSteps(steps: ReadonlyArray<Step>): string {
  const joined = steps
    .map((step) => (step.axis === "desc" ? "//" : "/") + step.raw)
    .join("");
  return joined === "" ? "/" : joined;
}

/**
 * Resolve a deep XPath (one that may cross iframe steps) starting at `root`
 * and wrap the outcome in a Locator bound to the frame that resolution
 * ended in.
 */
export async function deepLocatorThroughIframes(
  page: Page,
  root: Frame,
  xpathOrSelector: string,
): Promise<Locator> {
  const { frame, selector } = await resolveDeepXPathTarget(
    page,
    root,
    xpathOrSelector,
  );
  return new Locator(frame, selector);
}

/**
 * Single entry point for selector resolution. Handles, in this order:
 *  1. '>>' hop notation: every segment but the last names an iframe to
 *     enter, the last segment is the selector to run in the final frame;
 *  2. XPath (prefixed with "xpath=" or starting with '/'), delegated to the
 *     deep XPath resolver;
 *  3. any other selector, which is returned unchanged against `root`.
 */
export async function resolveLocatorTarget(
  page: Page,
  root: Frame,
  selectorRaw: string,
): Promise<ResolvedLocatorTarget> {
  const sel = selectorRaw.trim();
  const segments = sel
    .split(">>")
    .map((piece) => piece.trim())
    .filter((piece) => piece.length > 0);

  if (segments.length <= 1) {
    // No usable hop: the whole trimmed input is the selector.
    const looksLikeXPath = sel.startsWith("xpath=") || sel.startsWith("/");
    if (!looksLikeXPath) return { frame: root, selector: sel };
    return resolveDeepXPathTarget(page, root, sel);
  }

  const [firstHop, ...laterSegments] = segments;
  const finalSelector = laterSegments.pop()!;

  // Chain one FrameLocator per hop, starting from the supplied root frame.
  let chain = frameLocatorFromFrame(page, root, firstHop!);
  for (const hop of laterSegments) {
    chain = chain.frameLocator(hop);
  }
  const frame = await chain.resolveFrame();
  return { frame, selector: finalSelector };
}

/**
 * Resolve `selectorRaw` with resolveLocatorTarget and return a Locator
 * bound to the resulting frame and selector.
 */
export async function resolveLocatorWithHops(
  page: Page,
  root: Frame,
  selectorRaw: string,
): Promise<Locator> {
  const { frame, selector } = await resolveLocatorTarget(
    page,
    root,
    selectorRaw,
  );
  return new Locator(frame, selector);
}

/**
 * DeepLocatorDelegate: a Locator look-alike that stores only the page, root
 * frame, selector and nth index. Every action re-resolves the selector
 * (hop notation / deep XPath) and forwards to the resulting Locator.
 *
 * Returned by `page.deepLocator()` so calls can be chained without awaiting
 * the resolution step:
 *   page.deepLocator('iframe#ifrA >> #btn').click()
 */
export class DeepLocatorDelegate {
  constructor(
    private readonly page: Page,
    private readonly root: Frame,
    private readonly selector: string,
    private readonly nthIndex: number = 0,
  ) {}

  /** Resolve the selector now and narrow the result to the configured nth match. */
  private async real(): Promise<Locator> {
    const { page, root, selector, nthIndex } = this;
    const resolved = await resolveLocatorWithHops(page, root, selector);
    return resolved.nth(nthIndex);
  }

  // ---- Locator API: each method resolves, then forwards unchanged ----
  async click(options?: {
    button?: "left" | "right" | "middle";
    clickCount?: number;
  }) {
    const target = await this.real();
    return target.click(options);
  }
  async count() {
    const target = await this.real();
    return target.count();
  }
  async hover() {
    const target = await this.real();
    return target.hover();
  }
  async fill(value: string) {
    const target = await this.real();
    return target.fill(value);
  }
  async type(text: string, options?: { delay?: number }) {
    const target = await this.real();
    return target.type(text, options);
  }
  async selectOption(values: string | string[]) {
    const target = await this.real();
    return target.selectOption(values);
  }
  async scrollTo(percent: number | string) {
    const target = await this.real();
    return target.scrollTo(percent);
  }
  async isVisible() {
    const target = await this.real();
    return target.isVisible();
  }
  async isChecked() {
    const target = await this.real();
    return target.isChecked();
  }
  async inputValue() {
    const target = await this.real();
    return target.inputValue();
  }
  async textContent() {
    const target = await this.real();
    return target.textContent();
  }
  async innerHtml() {
    const target = await this.real();
    return target.innerHtml();
  }
  async innerText() {
    const target = await this.real();
    return target.innerText();
  }
  async centroid() {
    const target = await this.real();
    return target.centroid();
  }
  async backendNodeId() {
    const target = await this.real();
    return target.backendNodeId();
  }
  async highlight(options?: {
    durationMs?: number;
    borderColor?: { r: number; g: number; b: number; a?: number };
    contentColor?: { r: number; g: number; b: number; a?: number };
  }) {
    const target = await this.real();
    return target.highlight(options);
  }
  async sendClickEvent(options?: {
    bubbles?: boolean;
    cancelable?: boolean;
    composed?: boolean;
    detail?: number;
  }) {
    const target = await this.real();
    return target.sendClickEvent(options);
  }
  async setInputFiles(
    files:
      | string
      | string[]
      | {
          name: string;
          mimeType: string;
          buffer: ArrayBuffer | Uint8Array | Buffer | string;
        }
      | Array<{
          name: string;
          mimeType: string;
          buffer: ArrayBuffer | Uint8Array | Buffer | string;
        }>,
  ) {
    const target = await this.real();
    return target.setInputFiles(files);
  }

  /** Shorthand for `nth(0)`. */
  first() {
    return this.nth(0);
  }

  /**
   * Return a delegate targeting the match at `index` (fractions are floored).
   * The same instance is returned when the index does not change.
   *
   * @throws StagehandInvalidArgumentError when `index` is negative or not finite.
   */
  nth(index: number): DeepLocatorDelegate {
    const numeric = Number(index);
    const usable = Number.isFinite(numeric) && numeric >= 0;
    if (!usable) {
      throw new StagehandInvalidArgumentError(
        "deepLocator().nth() expects a non-negative index",
      );
    }

    const wanted = Math.floor(numeric);
    return wanted === this.nthIndex
      ? this
      : new DeepLocatorDelegate(this.page, this.root, this.selector, wanted);
  }
}

/**
 * Factory: build a DeepLocatorDelegate for `selector`, resolved relative to
 * `root` on `page`. The delegate starts at the default nth index.
 */
export function deepLocatorFromPage(
  page: Page,
  root: Frame,
  selector: string,
): DeepLocatorDelegate {
  const delegate = new DeepLocatorDelegate(page, root, selector);
  return delegate;
}

/**
 * Resolve an XPath that may descend through iframes.
 *
 * The path is normalised (optional "xpath=" prefix removed, leading '/'
 * ensured) and parsed into steps. Steps are accumulated until one matches
 * IFRAME_STEP_RE; the accumulated run then becomes the selector of the next
 * FrameLocator hop. Whatever remains after the last iframe step is the
 * selector to run inside the final frame.
 *
 * @returns The frame reached through the hops (or `root` when there are
 *   none) together with the remaining selector, prefixed with "xpath=".
 */
async function resolveDeepXPathTarget(
  page: Page,
  root: Frame,
  xpathOrSelector: string,
): Promise<ResolvedLocatorTarget> {
  const trimmed = xpathOrSelector.trim();
  const unprefixed = trimmed.startsWith("xpath=")
    ? trimmed.slice("xpath=".length).trim()
    : trimmed;
  const absolute = unprefixed.startsWith("/") ? unprefixed : "/" + unprefixed;

  let chain: FrameLocator | undefined;
  let pending: Step[] = [];

  for (const step of parseXPath(absolute)) {
    pending.push(step);
    if (!IFRAME_STEP_RE.test(step.name)) continue;

    // An iframe step closes the current run: turn it into a frame hop.
    const hopSelector = "xpath=" + buildXPathFromSteps(pending);
    chain = chain
      ? chain.frameLocator(hopSelector)
      : frameLocatorFromFrame(page, root, hopSelector);
    pending = [];
  }

  const selector = "xpath=" + buildXPathFromSteps(pending);
  const frame = chain ? await chain.resolveFrame() : root;
  return { frame, selector };
}


================================================
FILE: packages/core/lib/v3/understudy/executionContextRegistry.ts
================================================
import type { Protocol } from "devtools-protocol";
import type { CDPSessionLike } from "./cdp.js";

type FrameId = Protocol.Page.FrameId;
type ExecId = Protocol.Runtime.ExecutionContextId;

/**
 * Per-session bookkeeping of each frame's default ("main world") execution
 * context. Two maps are kept for every session: frame id -> context id and
 * the reverse, so a destroyed context can be traced back to its frame.
 * Sessions are WeakMap keys, so no explicit detach is performed here.
 */
export class ExecutionContextRegistry {
  private readonly byFrame = new WeakMap<
    CDPSessionLike,
    Map<FrameId, ExecId>
  >();
  private readonly byExec = new WeakMap<CDPSessionLike, Map<ExecId, FrameId>>();

  /** Wire listeners for this session. Call BEFORE Runtime.enable. */
  attachSession(session: CDPSessionLike): void {
    session.on(
      "Runtime.executionContextCreated",
      (evt: Protocol.Runtime.ExecutionContextCreatedEvent): void => {
        const { frameId, isDefault } = (evt.context.auxData ?? {}) as {
          frameId?: string;
          isDefault?: boolean;
        };
        // Only default contexts that name their frame are tracked.
        if (isDefault !== true || typeof frameId !== "string") return;
        this.register(session, frameId as FrameId, evt.context.id);
      },
    );

    session.on(
      "Runtime.executionContextDestroyed",
      (evt: Protocol.Runtime.ExecutionContextDestroyedEvent): void => {
        const ctxId = evt.executionContextId;
        const reverse = this.byExec.get(session);
        const forward = this.byFrame.get(session);
        if (!reverse || !forward) return;
        const owner = reverse.get(ctxId);
        if (!owner) return;
        reverse.delete(ctxId);
        // Leave the forward entry alone if the frame already has a newer context.
        if (forward.get(owner) === ctxId) forward.delete(owner);
      },
    );

    session.on("Runtime.executionContextsCleared", (): void => {
      this.byFrame.delete(session);
      this.byExec.delete(session);
    });
  }

  /** Currently recorded main-world context id for the frame, or null. */
  getMainWorld(session: CDPSessionLike, frameId: FrameId): ExecId | null {
    const contexts = this.byFrame.get(session);
    return contexts?.get(frameId) ?? null;
  }

  /**
   * Return the frame's main-world context id, waiting for it if necessary.
   *
   * Checks the registry, sends Runtime.enable (errors ignored) and checks
   * again, then listens for a matching executionContextCreated event.
   *
   * @param timeoutMs - How long to listen before giving up (default 800).
   * @throws Error "main world not ready for frame <id>" on timeout.
   */
  async waitForMainWorld(
    session: CDPSessionLike,
    frameId: FrameId,
    timeoutMs: number = 800,
  ): Promise<ExecId> {
    const known = this.getMainWorld(session, frameId);
    if (known) return known;

    await session.send("Runtime.enable").catch(() => {});
    const afterEnable = this.getMainWorld(session, frameId);
    if (afterEnable) return afterEnable;

    return await new Promise<ExecId>((resolve, reject) => {
      let settled = false;

      /** Flip to settled and unsubscribe; false if someone already did. */
      const settle = (): boolean => {
        if (settled) return false;
        settled = true;
        session.off("Runtime.executionContextCreated", onCreated);
        return true;
      };

      const onCreated = (
        evt: Protocol.Runtime.ExecutionContextCreatedEvent,
      ): void => {
        const aux = (evt.context.auxData ?? {}) as {
          frameId?: string;
          isDefault?: boolean;
        };
        if (aux.isDefault !== true || aux.frameId !== frameId) return;
        this.register(session, frameId, evt.context.id);
        if (!settle()) return;
        clearTimeout(timer);
        resolve(evt.context.id);
      };

      const timer = setTimeout(() => {
        if (settle()) {
          reject(new Error(`main world not ready for frame ${frameId}`));
        }
      }, timeoutMs);

      session.on("Runtime.executionContextCreated", onCreated);
    });
  }

  /** Record frameId <-> ctxId in both maps, creating the maps on first use. */
  private register(
    session: CDPSessionLike,
    frameId: FrameId,
    ctxId: ExecId,
  ): void {
    const forward = this.byFrame.get(session) ?? new Map<FrameId, ExecId>();
    const reverse = this.byExec.get(session) ?? new Map<ExecId, FrameId>();
    this.byFrame.set(session, forward);
    this.byExec.set(session, reverse);
    forward.set(frameId, ctxId);
    reverse.set(ctxId, frameId);
  }
}

/** Process-wide registry instance. */
export const executionContexts = new ExecutionContextRegistry();


================================================
FILE: packages/core/lib/v3/understudy/fileUploadUtils.ts
================================================
import { promises as fs, type Stats } from "fs";
import path from "path";
import { Buffer } from "buffer";
import { StagehandInvalidArgumentError } from "../types/public/sdkErrors.js";
import {
  SetInputFilesArgument,
  SetInputFilePayload,
} from "../types/public/locator.js";
import { NormalizedFilePayload } from "../types/private/locator.js";

/** MIME type used when none is supplied (always used for path entries). */
const DEFAULT_MIME_TYPE = "application/octet-stream";

/**
 * Turn the arguments accepted by setInputFiles into in-memory payloads.
 *
 * - String entries are file paths: relative ones are resolved against
 *   `opts.baseDir` (default: the current working directory), must point at a
 *   regular file, and are read fully into memory.
 * - Object entries carrying a `buffer` are converted with toBuffer; missing
 *   name / mimeType / lastModified fall back to "upload.bin", the default
 *   MIME type and the current time.
 * - null, undefined and an empty array produce an empty result.
 *
 * Entries are processed one after another, so the first invalid entry
 * determines the error.
 *
 * @throws StagehandInvalidArgumentError for a path that is not a regular
 *   file or an entry that is neither a string nor a payload object.
 */
export async function normalizeInputFiles(
  files: SetInputFilesArgument,
  opts: { baseDir?: string } = {},
): Promise<NormalizedFilePayload[]> {
  if (files === null || files === undefined) return [];

  const entries = Array.isArray(files)
    ? (files as Array<string | SetInputFilePayload>)
    : [files];
  if (entries.length === 0) return [];

  const baseDir = opts.baseDir ?? process.cwd();
  const result: NormalizedFilePayload[] = [];

  for (const entry of entries) {
    if (typeof entry !== "string") {
      if (!entry || typeof entry !== "object" || !("buffer" in entry)) {
        throw new StagehandInvalidArgumentError(
          "setInputFiles(): expected file path(s) or payload object(s)",
        );
      }
      const payload = entry as SetInputFilePayload;
      const buffer = toBuffer(payload.buffer);
      const { name, mimeType, lastModified } = payload;
      result.push({
        name: name || "upload.bin",
        mimeType: mimeType || DEFAULT_MIME_TYPE,
        buffer,
        lastModified:
          typeof lastModified === "number" ? lastModified : Date.now(),
      });
      continue;
    }

    // Path entry: resolve, validate, then load the file contents.
    const absolutePath = path.isAbsolute(entry)
      ? entry
      : path.resolve(baseDir, entry);
    const stat = await statFile(absolutePath);
    if (!stat.isFile()) {
      throw new StagehandInvalidArgumentError(
        `setInputFiles(): expected a file but received directory or special entry at ${absolutePath}`,
      );
    }
    const buffer = await fs.readFile(absolutePath);
    result.push({
      name: path.basename(absolutePath) || "upload.bin",
      mimeType: DEFAULT_MIME_TYPE,
      buffer,
      lastModified: stat.mtimeMs || Date.now(),
      absolutePath,
    });
  }

  return result;
}

/**
 * `fs.stat` for an upload path. A missing file (ENOENT) is reported as a
 * StagehandInvalidArgumentError naming the path; every other failure is
 * rethrown unchanged.
 */
async function statFile(absolutePath: string): Promise<Stats> {
  try {
    return await fs.stat(absolutePath);
  } catch (error) {
    const isMissing = (error as NodeJS.ErrnoException)?.code === "ENOENT";
    if (!isMissing) throw error;
    throw new StagehandInvalidArgumentError(
      `setInputFiles(): file not found at ${absolutePath}`,
    );
  }
}

/**
 * Coerce a supported payload into a Node Buffer.
 *
 * - string: encoded with Buffer.from's default encoding
 * - Buffer: returned as-is (same instance)
 * - Uint8Array / ArrayBuffer: passed through Buffer.from
 *
 * @throws StagehandInvalidArgumentError for any other value.
 */
export function toBuffer(
  data: ArrayBuffer | Uint8Array | Buffer | string,
): Buffer {
  if (typeof data === "string") return Buffer.from(data);
  // Buffer must be checked before Uint8Array: it is a Uint8Array subclass.
  if (Buffer.isBuffer(data)) return data;
  if (data instanceof Uint8Array) return Buffer.from(data);
  if (!(data instanceof ArrayBuffer)) {
    throw new StagehandInvalidArgumentError(
      "Unsupported file payload buffer type",
    );
  }
  return Buffer.from(new Uint8Array(data));
}


================================================
FILE: packages/core/lib/v3/understudy/frame.ts
================================================
// lib/v3/understudy/frame.ts
import { Protocol } from "devtools-protocol";
import type { CDPSessionLike } from "./cdp.js";
import { Locator } from "./locator.js";
import { StagehandEvalError } from "../types/public/sdkErrors.js";
import { executionContexts } from "./executionContextRegistry.js";

/**
 * Minimal shape implemented by Frame: the CDP session used for calls plus
 * the identifiers of the frame and of the page it is associated with.
 */
interface FrameManager {
  /** CDP session through which this frame's commands are sent. */
  session: CDPSessionLike;
  /** CDP frame identifier. */
  frameId: string;
  /** Identifier of the associated page. */
  pageId: string;
}

/**
 * Frame
 *
 * A thin, session-bound handle to a specific DOM frame (by frameId).
 * All CDP calls in this class go through `this.session`, which MUST be the
 * owning session for `this.frameId`. Page is responsible for constructing
 * Frames with the correct session.
 */
export class Frame implements FrameManager {
  /** Owning CDP session id (useful for logs); null for root connection (should not happen for targets) */
  public readonly sessionId: string | null;

  /**
   * @param session - CDP session used for every call made by this handle.
   * @param frameId - CDP id of the frame this handle represents.
   * @param pageId - Id of the page the frame is associated with.
   * @param remoteBrowser - Whether the browser runs on another machine
   *   (exposed through isBrowserRemote()).
   */
  constructor(
    public session: CDPSessionLike,
    public frameId: string,
    public pageId: string,
    private readonly remoteBrowser: boolean,
  ) {
    // Snapshot the session id once; a session without an id is recorded as null.
    this.sessionId = this.session.id ?? null;
  }

  /** True when the controlled browser runs on a different machine. */
  public isBrowserRemote(): boolean {
    return this.remoteBrowser;
  }

  /**
   * DOM.getNodeForLocation → DOM.describeNode
   *
   * Looks up the node at the given coordinates (user-agent shadow DOM
   * included, `ignorePointerEventsNone` left false) and returns its
   * description.
   *
   * @param x - X coordinate passed to DOM.getNodeForLocation.
   * @param y - Y coordinate passed to DOM.getNodeForLocation.
   */
  async getNodeAtLocation(x: number, y: number): Promise<Protocol.DOM.Node> {
    await this.session.send("DOM.enable");
    const { backendNodeId } = await this.session.send<{
      backendNodeId: Protocol.DOM.BackendNodeId;
    }>("DOM.getNodeForLocation", {
      x,
      y,
      includeUserAgentShadowDOM: true,
      ignorePointerEventsNone: false,
    });

    const { node } = await this.session.send<{
      node: Protocol.DOM.Node;
    }>("DOM.describeNode", { backendNodeId });

    return node;
  }

  /**
   * CSS selector → DOM.querySelector → DOM.getBoxModel
   *
   * Queries from the document root returned by DOM.getDocument on this
   * session and reports the matched node's box.
   *
   * @returns `x`/`y` taken from the first two values of the box model's
   *   `content` array, and the box model's `width`/`height`.
   */
  async getLocationForSelector(
    selector: string,
  ): Promise<{ x: number; y: number; width: number; height: number }> {
    await this.session.send("DOM.enable");

    const { root } = await this.session.send<{ root: Protocol.DOM.Node }>(
      "DOM.getDocument",
    );

    const { nodeId } = await this.session.send<{ nodeId: Protocol.DOM.NodeId }>(
      "DOM.querySelector",
      { nodeId: root.nodeId, selector },
    );

    const { model } = await this.session.send<{ model: Protocol.DOM.BoxModel }>(
      "DOM.getBoxModel",
      { nodeId },
    );

    const x = model.content[0];
    const y = model.content[1];
    const width = model.width;
    const height = model.height;
    return { x, y, width, height };
  }

  /**
   * Accessibility.getFullAXTree (+ child frames if requested)
   *
   * The tree is first requested scoped to this frame's id; when CDP rejects
   * that with a frame-scope error the request is retried without a frame id.
   *
   * @param withFrames - When true, the nodes of the frames returned by
   *   childFrames() are appended to the result. Each child is fetched with
   *   `withFrames = false`, so deeper descendants are not included.
   */
  async getAccessibilityTree(
    withFrames = false,
  ): Promise<Protocol.Accessibility.AXNode[]> {
    await this.session.send("Accessibility.enable");
    let nodes: Protocol.Accessibility.AXNode[];
    try {
      ({ nodes } = await this.session.send<{
        nodes: Protocol.Accessibility.AXNode[];
      }>("Accessibility.getFullAXTree", { frameId: this.frameId }));
    } catch (e) {
      // Classify by message text: only frame-scope failures are retried.
      const msg = String((e as Error)?.message ?? e ?? "");
      const isFrameScopeError =
        msg.includes("Frame with the given") ||
        msg.includes("does not belong to the target") ||
        msg.includes("is not found");
      if (!isFrameScopeError) throw e;
      // Retry unscoped: on OOPIF sessions, returns the child doc's AX tree.
      ({ nodes } = await this.session.send<{
        nodes: Protocol.Accessibility.AXNode[];
      }>("Accessibility.getFullAXTree"));
    }

    if (!withFrames) return nodes;

    // Children are fetched one at a time and appended to the same array.
    const children = await this.childFrames();
    for (const child of children) {
      const childNodes = await child.getAccessibilityTree(false);
      nodes.push(...childNodes);
    }
    return nodes;
  }

  /**
   * Evaluate a function or expression in this frame's main world.
   * - If a string is provided, treated as a JS expression.
   * - If a function is provided, it is stringified and invoked with the optional argument.
   *
   * The argument is embedded via JSON.stringify and the function's result is
   * round-tripped through JSON inside the page (falling back to the raw
   * value if that fails). The evaluation awaits promises and returns by value.
   *
   * @throws StagehandEvalError when CDP reports exception details.
   */
  async evaluate<R = unknown, Arg = unknown>(
    pageFunctionOrExpression: string | ((arg: Arg) => R | Promise<R>),
    arg?: Arg,
  ): Promise<R> {
    // Best effort: a failure to enable Runtime is ignored here.
    await this.session.send("Runtime.enable").catch(() => {});
    const contextId = await this.getMainWorldExecutionContextId();

    const isString = typeof pageFunctionOrExpression === "string";
    let expression: string;

    if (isString) {
      expression = String(pageFunctionOrExpression);
    } else {
      // Build a self-invoking wrapper that carries both the function source
      // and its serialized argument into the page.
      const fnSrc = pageFunctionOrExpression.toString();
      const argJson = JSON.stringify(arg);
      expression = `(() => {
        const __fn = ${fnSrc};
        const __arg = ${argJson};
        try {
          const __res = __fn(__arg);
          return Promise.resolve(__res).then(v => {
            try { return JSON.parse(JSON.stringify(v)); } catch { return v; }
          });
        } catch (e) { throw e; }
      })()`;
    }

    let res: Protocol.Runtime.EvaluateResponse;
    try {
      res = await this.session.send<Protocol.Runtime.EvaluateResponse>(
        "Runtime.evaluate",
        {
          expression,
          contextId,
          awaitPromise: true,
          returnByValue: true,
        },
      );
    } catch (error) {
      // Execution contexts can be recreated between context lookup and
      // Runtime.evaluate during popup/navigate churn. Retry once with a fresh id.
      const msg = error instanceof Error ? error.message : String(error);
      if (!msg.includes("Cannot find context with specified id")) throw error;
      const freshContextId = await this.getMainWorldExecutionContextId();
      res = await this.session.send<Protocol.Runtime.EvaluateResponse>(
        "Runtime.evaluate",
        {
          expression,
          contextId: freshContextId,
          awaitPromise: true,
          returnByValue: true,
        },
      );
    }
    if (res.exceptionDetails) {
      throw new StagehandEvalError(
        res.exceptionDetails.text ?? "Evaluation failed",
      );
    }
    return res.result.value as R;
  }

  /**
   * Page.captureScreenshot (frame-scoped session)
   *
   * @param options.fullPage - Forwarded as `captureBeyondViewport`.
   * @param options.clip - Region to capture; the scale is carried inside it.
   * @param options.type - Image format, "png" by default.
   * @param options.quality - JPEG only; rounded and clamped to 0..100.
   * @param options.scale - Clamped to 0.1..2.
   * @returns The image bytes decoded from the base64 response.
   */
  async screenshot(options?: {
    fullPage?: boolean;
    clip?: { x: number; y: number; width: number; height: number };
    type?: "png" | "jpeg";
    quality?: number;
    scale?: number;
  }): Promise<Buffer> {
    await this.session.send("Page.enable");
    const format = options?.type ?? "png";
    const params: Protocol.Page.CaptureScreenshotRequest & { scale?: number } =
      {
        format,
        fromSurface: true,
        captureBeyondViewport: options?.fullPage,
      };

    const clampScale = (value: number): number =>
      Math.min(2, Math.max(0.1, value));

    const normalizedScale =
      typeof options?.scale === "number"
        ? clampScale(options.scale)
        : undefined;

    if (options?.clip) {
      // With a clip, the scale travels on the clip itself (1 when unset).
      const clip = {
        x: options.clip.x,
        y: options.clip.y,
        width: options.clip.width,
        height: options.clip.height,
        scale: normalizedScale ?? 1,
      };
      params.clip = clip;
    } else if (normalizedScale !== undefined && normalizedScale !== 1) {
      // Without a clip, a top-level scale is only sent when it differs from 1.
      params.scale = normalizedScale;
    }

    if (format === "jpeg" && typeof options?.quality === "number") {
      const q = Math.round(options.quality);
      params.quality = Math.min(100, Math.max(0, q));
    }

    const { data } =
      await this.session.send<Protocol.Page.CaptureScreenshotResponse>(
        "Page.captureScreenshot",
        params,
      );
    return Buffer.from(data, "base64");
  }

  /**
   * Child frames via Page.getFrameTree
   *
   * Walks the whole tree returned for this session and collects the frames
   * whose `parentId` equals this frame's id. The returned handles reuse this
   * frame's session, page id and remote-browser flag.
   */
  async childFrames(): Promise<Frame[]> {
    const { frameTree } = await this.session.send<{
      frameTree: Protocol.Page.FrameTree;
    }>("Page.getFrameTree");
    const frames: Frame[] = [];

    const collect = (tree: Protocol.Page.FrameTree) => {
      if (tree.frame.parentId === this.frameId) {
        frames.push(
          new Frame(
            this.session,
            tree.frame.id,
            this.pageId,
            this.remoteBrowser,
          ),
        );
      }
      tree.childFrames?.forEach(collect);
    };

    collect(frameTree);
    return frames;
  }

  /**
   * Wait for a lifecycle state (load/domcontentloaded/networkidle)
   *
   * Resolves on the first Page.lifecycleEvent for this frame whose name
   * matches `state` case-insensitively, observed after the listener is
   * installed; rejects once the timeout elapses.
   *
   * @param state - Lifecycle state to wait for ("load" by default).
   * @param timeoutMs - Maximum wait in milliseconds (default 15000);
   *   negative values are treated as 0.
   */
  async waitForLoadState(
    state: "load" | "domcontentloaded" | "networkidle" = "load",
    timeoutMs: number = 15_000,
  ): Promise<void> {
    await this.session.send("Page.enable");
    const targetState = state.toLowerCase();
    const timeout = Math.max(0, timeoutMs);
    await new Promise<void>((resolve, reject) => {
      // `done` guarantees that exactly one of resolve/reject runs.
      let done = false;
      let timer: ReturnType<typeof setTimeout> | null = null;
      const finish = () => {
        if (done) return;
        done = true;
        this.session.off("Page.lifecycleEvent", handler);
        if (timer) {
          clearTimeout(timer);
          timer = null;
        }
        resolve();
      };
      const handler = (evt: Protocol.Page.LifecycleEventEvent) => {
        const sameFrame = evt.frameId === this.frameId;
        // need to normalize here because CDP lifecycle names look like 'DOMContentLoaded'
        // but we accept 'domcontentloaded'
        const lifecycleName = String(evt.name ?? "").toLowerCase();
        if (sameFrame && lifecycleName === targetState) {
          finish();
        }
      };
      this.session.on("Page.lifecycleEvent", handler);

      timer = setTimeout(() => {
        if (done) return;
        done = true;
        this.session.off("Page.lifecycleEvent", handler);
        reject(
          new Error(
            `waitForLoadState(${state}) timed out after ${timeout}ms for frame ${this.frameId}`,
          ),
        );
      }, timeout);
    });
  }

  /**
   * Create a Locator bound to this frame.
   *
   * @param selector - Selector handed to the Locator.
   * @param options - Forwarded unchanged to the Locator constructor.
   */
  locator(
    selector: string,
    options?: { deep?: boolean; depth?: number },
  ): Locator {
    return new Locator(this, selector, options);
  }

  /** Resolve the main-world execution context id for this frame (waits up to 1000 ms). */
  private async getMainWorldExecutionContextId(): Promise<number> {
    return executionContexts.waitForMainWorld(this.session, this.frameId, 1000);
  }
}


================================================
FILE: packages/core/lib/v3/understudy/frameLocator.ts
================================================
import type { Protocol } from "devtools-protocol";
import { Locator } from "./locator.js";
import type { Page } from "./page.js";
import { Frame } from "./frame.js";
import { executionContexts } from "./executionContextRegistry.js";
import {
  ContentFrameNotFoundError,
  StagehandInvalidArgumentError,
} from "../types/public/sdkErrors.js";

/**
 * FrameLocator: identifies an iframe element by selector and resolves it to
 * the child Frame it hosts, so locators can be scoped to that frame.
 * FrameLocators can be nested to walk through several iframes.
 */
export class FrameLocator {
  /**
   * @param page - Page owning the frames.
   * @param selector - Selector of the iframe element, evaluated in the parent frame.
   * @param parent - Enclosing FrameLocator, when this one is nested.
   * @param root - Frame to start from when there is no parent; the page's
   *   main frame is used if omitted.
   */
  constructor(
    private readonly page: Page,
    private readonly selector: string,
    private readonly parent?: FrameLocator,
    private readonly root?: Frame,
  ) {}

  /** Create a nested FrameLocator under this one. */
  frameLocator(selector: string): FrameLocator {
    return new FrameLocator(this.page, selector, this);
  }

  /**
   * Resolve to the concrete Frame for this FrameLocator chain.
   *
   * The iframe element is located in the parent frame, then each direct
   * child frame of the parent is asked for its owner element until one
   * matches. The matching child is given a short time to become ready
   * before its Frame is returned.
   *
   * @throws ContentFrameNotFoundError when no child frame is owned by the
   *   located element.
   */
  async resolveFrame(): Promise<Frame> {
    let parentFrame: Frame;
    if (this.parent) {
      parentFrame = await this.parent.resolveFrame();
    } else {
      parentFrame = this.root ?? this.page.mainFrame();
    }

    // Locate the iframe element inside the parent frame.
    const iframeElement = parentFrame.locator(this.selector);
    const session = parentFrame.session;
    const { objectId } = await iframeElement.resolveNode();

    try {
      await session.send("DOM.enable").catch(() => {});
      const { node } = await session.send<Protocol.DOM.DescribeNodeResponse>(
        "DOM.describeNode",
        { objectId },
      );
      const wantedBackendNodeId = node.backendNodeId;

      // Candidate frames: direct children of the parent per the Page's registry.
      const candidates = await listDirectChildFrameIdsFromRegistry(
        this.page,
        parentFrame.frameId,
        1000,
      );

      for (const childId of candidates) {
        try {
          const { backendNodeId } = await session.send<{
            backendNodeId: Protocol.DOM.BackendNodeId;
            nodeId?: Protocol.DOM.NodeId;
          }>("DOM.getFrameOwner", {
            frameId: childId as Protocol.Page.FrameId,
          });
          if (backendNodeId !== wantedBackendNodeId) continue;
          // Ensure child frame is ready (handles OOPIF adoption or same-process)
          await ensureChildFrameReady(this.page, parentFrame, childId, 1200);
          return this.page.frameForId(childId);
        } catch {
          // A failure on this candidate is not fatal; try the next one.
        }
      }
      throw new ContentFrameNotFoundError(this.selector);
    } finally {
      // Always release the remote handle obtained from resolveNode().
      await session.send("Runtime.releaseObject", { objectId }).catch(() => {});
    }
  }

  /** Return a Locator scoped to this frame. Methods delegate to the frame lazily. */
  locator(selector: string): LocatorDelegate {
    return new LocatorDelegate(this, selector);
  }
}

/**
 * Locator look-alike bound to a FrameLocator. Nothing is resolved up front:
 * every action first resolves the frame, builds a Locator for the selector
 * in it, and then forwards the call. A negative nth index (the default)
 * means "no nth() applied".
 */
class LocatorDelegate {
  constructor(
    private readonly fl: FrameLocator,
    private readonly sel: string,
    private readonly nthIndex: number = -1,
  ) {}

  /** Resolve the frame and return the Locator to act on. */
  private async real(): Promise<Locator> {
    const frame = await this.fl.resolveFrame();
    const base = frame.locator(this.sel);
    return this.nthIndex >= 0 ? base.nth(this.nthIndex) : base;
  }

  // ---- Locator API: each method resolves, then forwards unchanged ----
  async click(options?: {
    button?: "left" | "right" | "middle";
    clickCount?: number;
  }) {
    const target = await this.real();
    return target.click(options);
  }
  async hover() {
    const target = await this.real();
    return target.hover();
  }
  async fill(value: string) {
    const target = await this.real();
    return target.fill(value);
  }
  async type(text: string, options?: { delay?: number }) {
    const target = await this.real();
    return target.type(text, options);
  }
  async selectOption(values: string | string[]) {
    const target = await this.real();
    return target.selectOption(values);
  }
  async scrollTo(percent: number | string) {
    const target = await this.real();
    return target.scrollTo(percent);
  }
  async isVisible() {
    const target = await this.real();
    return target.isVisible();
  }
  async isChecked() {
    const target = await this.real();
    return target.isChecked();
  }
  async inputValue() {
    const target = await this.real();
    return target.inputValue();
  }
  async textContent() {
    const target = await this.real();
    return target.textContent();
  }
  async innerHtml() {
    const target = await this.real();
    return target.innerHtml();
  }
  async innerText() {
    const target = await this.real();
    return target.innerText();
  }
  async count() {
    const target = await this.real();
    return target.count();
  }

  /** Shorthand for `nth(0)`. */
  first(): LocatorDelegate {
    return this.nth(0);
  }

  /**
   * Return a delegate targeting the match at `index` (fractions are floored).
   * The same instance is returned when the index does not change.
   *
   * @throws StagehandInvalidArgumentError when `index` is negative or not finite.
   */
  nth(index: number): LocatorDelegate {
    const numeric = Number(index);
    const usable = Number.isFinite(numeric) && numeric >= 0;
    if (!usable) {
      throw new StagehandInvalidArgumentError(
        "locator().nth() expects a non-negative index",
      );
    }

    const wanted = Math.floor(numeric);
    return wanted === this.nthIndex
      ? this
      : new LocatorDelegate(this.fl, this.sel, wanted);
  }
}

/**
 * Factory: begin a FrameLocator chain at an arbitrary `root` frame. The
 * resulting FrameLocator has no parent and resolves `selector` inside `root`.
 */
export function frameLocatorFromFrame(
  page: Page,
  root: Frame,
  selector: string,
): FrameLocator {
  const noParent = undefined;
  return new FrameLocator(page, selector, noParent, root);
}

/**
 * Poll the Page's frame tree for the direct children of `parentFrameId`.
 *
 * Returns as soon as at least one child is listed. Otherwise the tree is
 * re-read every 50 ms until `timeoutMs` has elapsed, at which point the
 * (possibly empty) latest result is returned.
 *
 * A failure while reading the tree counts as "no children yet" for that
 * attempt. The deadline is checked on every iteration, including failed
 * ones, so a registry that keeps throwing cannot stall the caller forever.
 *
 * @param page - Page whose full frame tree is consulted.
 * @param parentFrameId - Id of the frame whose children are wanted.
 * @param timeoutMs - Maximum time to keep polling, in milliseconds.
 * @returns Ids of the direct child frames; empty when none appeared in time.
 */
async function listDirectChildFrameIdsFromRegistry(
  page: Page,
  parentFrameId: string,
  timeoutMs: number,
): Promise<string[]> {
  const deadline = Date.now() + timeoutMs;
  for (;;) {
    let ids: string[] = [];
    try {
      const tree = page.getFullFrameTree();
      const node = findFrameNode(tree, parentFrameId);
      ids = node?.childFrames?.map((c) => c.frame.id as string) ?? [];
    } catch {
      // Tree not readable right now; fall through with an empty result.
    }
    if (ids.length > 0 || Date.now() >= deadline) return ids;
    await new Promise((r) => setTimeout(r, 50));
  }
}

/**
 * Find the frame-tree node whose frame id equals `targetId`.
 *
 * The tree is searched depth-first, parents before children and children in
 * listed order, so the first match in that order is returned.
 *
 * @returns The matching subtree, or undefined when no frame has that id.
 */
function findFrameNode(
  tree: Protocol.Page.FrameTree,
  targetId: string,
): Protocol.Page.FrameTree | undefined {
  const pending: Protocol.Page.FrameTree[] = [tree];
  for (;;) {
    const current = pending.pop();
    if (current === undefined) return undefined;
    if (current.frame.id === targetId) return current;
    // Push children reversed so the first child is visited next.
    pending.push(...[...(current.childFrames ?? [])].reverse());
  }
}

/**
 * Ensure we can evaluate in the child frame with minimal delay.
 * - If the child is already owned by a session other than the parent's (adopted OOPIF),
 *   wait up to 600ms for its main world on that session and return.
 * - If the parent session already has a main world for the child, return immediately.
 * - Otherwise enable lifecycle/runtime events on the parent session and wait, polling
 *   every 50ms and reacting to lifecycle events, until the main world shows up on the
 *   parent session, the child is adopted by another session (then wait for its main
 *   world there), or the budget elapses.
 *
 * This is best effort: it never rejects because a main world failed to appear.
 *
 * @param page         Page used to look up which session owns `childFrameId`.
 * @param parentFrame  Frame whose session is the child's initial (parent) session.
 * @param childFrameId Id of the child frame to wait for.
 * @param budgetMs     Overall time budget in milliseconds (negative values count as 0).
 */
async function ensureChildFrameReady(
  page: Page,
  parentFrame: Frame,
  childFrameId: string,
  budgetMs: number,
): Promise<void> {
  const parentSession = parentFrame.session;
  const deadline = Date.now() + Math.max(0, budgetMs);

  // If already owned by a different session (OOPIF adopted), wait briefly there.
  const owner = page.getSessionForFrame(childFrameId);
  if (owner && owner !== parentSession) {
    try {
      await executionContexts.waitForMainWorld(owner, childFrameId, 600);
    } catch {
      // best effort
    }
    return;
  }

  const hasMainWorldOnParent = (): boolean => {
    try {
      return (
        executionContexts.getMainWorld(parentSession, childFrameId) !== null
      );
    } catch {
      return false;
    }
  };

  if (hasMainWorldOnParent()) return;

  await parentSession
    .send("Page.setLifecycleEventsEnabled", { enabled: true })
    .catch(() => {});
  await parentSession.send("Runtime.enable").catch(() => {});

  await new Promise<void>((resolve) => {
    let done = false;
    const finish = () => {
      if (done) return;
      done = true;
      parentSession.off("Page.lifecycleEvent", onLifecycle);
      resolve();
    };

    /**
     * If the child has moved to another session, wait for its main world there and
     * finish afterwards. Returns true when such a wait was started.
     */
    const waitOnAdoptedOwner = (): boolean => {
      try {
        const nowOwner = page.getSessionForFrame(childFrameId);
        if (nowOwner && nowOwner !== parentSession) {
          // Always grant at least 150ms, even when the budget is nearly spent.
          const left = Math.max(150, deadline - Date.now());
          // Finish on success AND on failure. Using then(finish, finish) rather than
          // finally(finish) keeps a timed-out wait from surfacing as an unhandled
          // promise rejection.
          void executionContexts
            .waitForMainWorld(nowOwner, childFrameId, left)
            .then(finish, finish);
          return true;
        }
      } catch {
        // ignore
      }
      return false;
    };

    const onLifecycle = (evt: Protocol.Page.LifecycleEventEvent) => {
      if (
        evt.frameId !== childFrameId ||
        (evt.name !== "DOMContentLoaded" &&
          evt.name !== "load" &&
          evt.name !== "networkIdle" &&
          evt.name !== "networkidle")
      ) {
        return;
      }
      if (hasMainWorldOnParent()) return finish();
      waitOnAdoptedOwner();
    };
    parentSession.on("Page.lifecycleEvent", onLifecycle);

    const tick = () => {
      if (done) return;
      if (hasMainWorldOnParent()) return finish();
      // Once an adopted-owner wait is running it is responsible for finishing.
      if (waitOnAdoptedOwner()) return;
      if (Date.now() >= deadline) return finish();
      setTimeout(tick, 50);
    };
    tick();
  });
}


================================================
FILE: packages/core/lib/v3/understudy/frameRegistry.ts
================================================
// lib/v3/understudy/frameRegistry.ts
import type { Protocol } from "devtools-protocol";

/**
 * FrameRegistry
 *
 * Purpose:
 * A single, authoritative source of truth for all of the following:
 *   1) Frame topology (parent/children, current main/root id, last-seen CDP `Frame`)
 *   2) Frame → Session ownership (which CDP session owns a given frameId)
 *   3) Optional iframe-owner metadata (backendNodeId of the <iframe> element in the parent doc)
 *
 *
 * Model:
 *  - This class is **CDP-agnostic**; it stores **sessionId strings** (not session objects).
 *  - Context bridges (wiring Target/Page events) must call the mutators below (onFrameAttached,
 *    onFrameNavigated, onNavigatedWithinDocument, onFrameDetached, adoptChildSession,
 *    seedFromFrameTree, setOwnerBackendNodeId).
 *  - Consumers ask read APIs (getOwnerSessionId, getParent, asProtocolFrameTree, listAllFrames, …)
 *    and never probe ownership at run time.
 */

/** Identifier of a frame; used as the key of the registry's frame map. */
type FrameId = string;
/** Identifier of a CDP session, kept as a plain string rather than a session object. */
type SessionId = string;

/** Per-frame record stored by the registry: topology links, last-seen metadata and ownership. */
type FrameInfo = {
  /** Parent frame id, or null for root */
  parentId: FrameId | null;
  /** Children frame ids (direct) */
  children: Set<FrameId>;
  /** Last-seen CDP Frame metadata for this id (may be a shell if never seen) */
  lastSeen?: Protocol.Page.Frame;

  /** Owning session id (CDP child session for OOPIF, top-level session for same-process) */
  ownerSessionId?: SessionId;

  /**
   * The backendNodeId of the <iframe> element **in the parent document** that hosts this frame.
   * Useful for building absolute XPath prefixes or DOM scoping in the parent session.
   */
  ownerBackendNodeId?: number;
};

/**
 * Build a placeholder CDP frame for `id`, used while no real Frame has been
 * received from events. Every field other than `id` carries a fixed default.
 */
function shellFrame(id: FrameId): Protocol.Page.Frame {
  const placeholder = {
    id,
    loaderId: "",
    url: "",
    domainAndRegistry: "",
    securityOrigin: "",
    mimeType: "text/html",
    secureContextType: "InsecureScheme",
    crossOriginIsolatedContextType: "NotIsolated",
    gatedAPIFeatures: [],
  };
  return placeholder as Protocol.Page.Frame;
}

/**
 * In-memory registry of frame topology and frame-to-session ownership.
 *
 * Invariants maintained by the mutators:
 *  - every id in a node's `children` set has that node as its `parentId`;
 *  - `framesBySession` is the exact inverse of each node's `ownerSessionId`;
 *  - after a rename, a node's `lastSeen.id` equals the key it is stored under.
 */
export class FrameRegistry {
  /** Owner target id (top-level target); informational only */
  private readonly ownerTargetId: string;

  /** Current main/root frame id (changes on root swaps) */
  private rootFrameId: FrameId;

  /** frameId -> FrameInfo */
  private frames = new Map<FrameId, FrameInfo>();

  /** sessionId -> Set<frameId> (inverse map for diagnostics/fast membership checks) */
  private framesBySession = new Map<SessionId, Set<FrameId>>();

  /**
   * @param ownerTargetId Id of the top-level target this registry belongs to.
   * @param mainFrameId   Initial root frame id; a shell node is created for it.
   */
  constructor(ownerTargetId: string, mainFrameId: FrameId) {
    this.ownerTargetId = ownerTargetId;
    this.rootFrameId = mainFrameId;
    this.ensureNode(mainFrameId);
  }

  // ---------------------- Mutators (called by Context/Page bridges) ----------------------

  /**
   * Record that a frame attached. If `parentId` is null and `frameId` differs from the current
   * root, this is a root swap and we rename the root id.
   *
   * IMPORTANT: The emitter's `sessionId` is the **owner** for the new/attached frame.
   */
  onFrameAttached(
    frameId: FrameId,
    parentId: FrameId | null,
    sessionId: SessionId,
  ): void {
    // Root swap (parentId === null for main frames).
    if (!parentId && frameId !== this.rootFrameId) {
      this.renameNodeId(this.rootFrameId, frameId);
      this.rootFrameId = frameId;
      // ownership moves to this session as well
      this.setOwnerSessionIdInternal(frameId, sessionId);
      return;
    }

    // Normal attach
    this.ensureNode(frameId);
    if (parentId) this.ensureNode(parentId);

    const info = this.frames.get(frameId)!;
    info.parentId = parentId ?? null;

    if (parentId) {
      this.frames.get(parentId)!.children.add(frameId);
    }

    // Ownership: the session that emitted frameAttached owns this frame.
    this.setOwnerSessionIdInternal(frameId, sessionId);
  }

  /**
   * Record a navigation with the full CDP `Frame`. Also updates ownership based on the emitting
   * session id. Handles root swap if the navigated frame is the new main (no parentId).
   */
  onFrameNavigated(frame: Protocol.Page.Frame, sessionId: SessionId): void {
    // Perform the root swap FIRST. renameNodeId() moves the old root's record under
    // the new id, so doing it after recording lastSeen/ownership would overwrite the
    // fresh data with the old root's stale frame and owner.
    const isParentless = !("parentId" in frame) || !frame.parentId;
    if (isParentless && frame.id !== this.rootFrameId) {
      // carry ordinal semantics by renaming the root id
      this.renameNodeId(this.rootFrameId, frame.id);
      this.rootFrameId = frame.id;
    }

    this.ensureNode(frame.id);
    const info = this.frames.get(frame.id)!;
    info.lastSeen = frame;

    // Ownership follows the session that reported the navigation
    this.setOwnerSessionIdInternal(frame.id, sessionId);
  }

  /**
   * Record a same-document navigation: only the URL of the last-seen frame changes
   * (a shell frame is used when nothing was seen yet). Ownership follows `sessionId`.
   */
  onNavigatedWithinDocument(
    frameId: FrameId,
    url: string,
    sessionId: SessionId,
  ): void {
    this.ensureNode(frameId);
    const info = this.frames.get(frameId)!;
    const lastSeen = info.lastSeen ?? shellFrame(frameId);
    info.lastSeen = { ...lastSeen, url };
    this.setOwnerSessionIdInternal(frameId, sessionId);
  }

  /**
   * Record that a frame detached. If `reason !== "swap"`, remove the subtree from the graph,
   * and clean the inverse maps. For "swap" we keep the node to preserve continuity.
   */
  onFrameDetached(
    frameId: FrameId,
    reason: "remove" | "swap" | string = "remove",
  ): void {
    if (reason === "swap") return;

    // Collect subtree starting from frameId.
    const toRemove: FrameId[] = [];
    const collect = (fid: FrameId) => {
      toRemove.push(fid);
      const kids = this.frames.get(fid)?.children ?? new Set<FrameId>();
      for (const k of kids) collect(k);
    };
    collect(frameId);

    // Remove nodes, fix parents and inverse maps
    for (const fid of toRemove) {
      const info = this.frames.get(fid);
      if (!info) continue;

      // unlink from parent
      if (info.parentId) {
        const p = this.frames.get(info.parentId);
        p?.children.delete(fid);
      }

      // unlink inverse session map
      this.unlinkFromSession(info.ownerSessionId, fid);

      this.frames.delete(fid);
    }

    // Guard root if we removed it; assign a placeholder root if needed
    if (!this.frames.has(this.rootFrameId)) {
      // Choose an arbitrary remaining node as root
      const iter = this.frames.keys().next();
      if (!iter.done) this.rootFrameId = iter.value;
    }
  }

  /**
   * An adopted OOPIF child session was created whose **main** frame id equals the parent
   * iframe's frameId. As a seed, only that main frame is marked as owned by `childSessionId`;
   * ownership of deeper frames is recorded when the child session reports them through the
   * other mutators.
   */
  adoptChildSession(
    childSessionId: SessionId,
    childMainFrameId: FrameId,
  ): void {
    this.setOwnerSessionIdInternal(childMainFrameId, childSessionId);
  }

  /**
   * Seed topology and ownership from an existing `Page.getFrameTree` snapshot, typically right after
   * a session is attached. This is a best-effort: we record frames and set the provided `sessionId`
   * as owner for the subtree **if** an owner isn't already set.
   *
   * The snapshot's own root keeps whatever parent link the registry already has for it:
   * a snapshot carries no information about frames above its root, so it must not
   * detach an already-linked frame from its parent.
   */
  seedFromFrameTree(
    sessionId: SessionId,
    frameTree: Protocol.Page.FrameTree,
  ): void {
    const walk = (tree: Protocol.Page.FrameTree, parent: FrameId | null) => {
      const id = tree.frame.id;
      this.ensureNode(id);
      const node = this.frames.get(id)!;
      // topology (only for frames whose parent is part of this snapshot)
      if (parent) {
        node.parentId = parent;
        this.frames.get(parent)!.children.add(id);
      }
      // last-seen frame
      node.lastSeen = tree.frame;
      // ownership (only if unknown)
      if (!node.ownerSessionId) {
        this.setOwnerSessionIdInternal(id, sessionId);
      }
      for (const c of tree.childFrames ?? []) walk(c, id);
    };
    walk(frameTree, null);
  }

  /**
   * Set the backendNodeId of the `<iframe>` element for a child frame **as seen from its parent**.
   * This is useful for building absolute XPath prefixes later (from the parent document).
   */
  setOwnerBackendNodeId(childFrameId: FrameId, backendNodeId: number): void {
    this.ensureNode(childFrameId);
    this.frames.get(childFrameId)!.ownerBackendNodeId = backendNodeId;
  }

  // ---------------------- Readers (consumed by Page/snapshot/locators) ----------------------

  /** Return the current main/root frame id. */
  mainFrameId(): FrameId {
    return this.rootFrameId;
  }

  /**
   * Return the owner session id for this frame. If unknown, returns `undefined`.
   */
  getOwnerSessionId(frameId: FrameId): SessionId | undefined {
    return this.frames.get(frameId)?.ownerSessionId;
  }

  /**
   * Return the owner backendNodeId (iframe element) if recorded.
   * This is in the **parent** document; pair it with `getParent`.
   */
  getOwnerBackendNodeId(frameId: FrameId): number | undefined {
    return this.frames.get(frameId)?.ownerBackendNodeId;
  }

  /**
   * Return the parent frame id, or null for root/unknown.
   */
  getParent(frameId: FrameId): FrameId | null {
    return this.frames.get(frameId)?.parentId ?? null;
  }

  /**
   * List frame ids in root-first DFS order (same shape as CDP's FrameTree traversal).
   */
  listAllFrames(): FrameId[] {
    const out: FrameId[] = [];
    const dfs = (fid: FrameId) => {
      out.push(fid);
      const kids = this.frames.get(fid)?.children ?? new Set<FrameId>();
      for (const k of kids) dfs(k);
    };
    if (this.frames.has(this.rootFrameId)) dfs(this.rootFrameId);
    return out;
  }

  /**
   * Serialize to `Protocol.Page.FrameTree` starting at the given root id (typically mainFrameId()).
   * Unknown ids serialize as a shell frame without children.
   */
  asProtocolFrameTree(rootId: FrameId): Protocol.Page.FrameTree {
    const build = (fid: FrameId): Protocol.Page.FrameTree => {
      const info = this.frames.get(fid);
      const frame = info?.lastSeen ?? shellFrame(fid);

      const kids = info?.children ?? new Set<FrameId>();
      const childFrames = kids.size
        ? [...kids].map((k) => build(k))
        : undefined;

      return childFrames ? { frame, childFrames } : { frame };
    };

    return build(rootId);
  }

  /**
   * For diagnostics: return the current owner sessions for a frame id (0..n),
   * usually 0 or 1, but helpful to see potential inconsistencies during wiring.
   */
  sessionsForFrame(frameId: FrameId): SessionId[] {
    const info = this.frames.get(frameId);
    return info?.ownerSessionId ? [info.ownerSessionId] : [];
  }

  /**
   * For diagnostics: return current frame set per session.
   */
  framesForSession(sessionId: SessionId): FrameId[] {
    return [...(this.framesBySession.get(sessionId) ?? new Set<FrameId>())];
  }

  // ---------------------- Internal helpers ----------------------

  /** Create a shell node for `fid` unless one already exists. */
  private ensureNode(fid: FrameId): void {
    if (this.frames.has(fid)) return;
    this.frames.set(fid, {
      parentId: null,
      children: new Set<FrameId>(),
      lastSeen: shellFrame(fid),
      ownerSessionId: undefined,
      ownerBackendNodeId: undefined,
    });
  }

  /** Remove `frameId` from `sessionId`'s inverse-map bag, dropping the bag once empty. */
  private unlinkFromSession(
    sessionId: SessionId | undefined,
    frameId: FrameId,
  ): void {
    if (!sessionId) return;
    const bag = this.framesBySession.get(sessionId);
    if (!bag) return;
    bag.delete(frameId);
    if (bag.size === 0) this.framesBySession.delete(sessionId);
  }

  /**
   * Move the record stored under `oldId` to `newId`, keeping topology links and the
   * inverse session map consistent. The moved record keeps the old node's metadata
   * (ownership, iframe owner, last-seen frame), with `lastSeen.id` re-keyed to `newId`.
   *
   * If a node already exists under `newId` it is absorbed: its children are adopted,
   * and its previous parent link and inverse-map entry are released.
   * Updating the root id, when the root moved, is the caller's job.
   */
  private renameNodeId(oldId: FrameId, newId: FrameId): void {
    if (oldId === newId) return;
    this.ensureNode(oldId);

    const info = this.frames.get(oldId)!;
    const displaced = this.frames.get(newId);

    if (displaced) {
      // Release the position and ownership the pre-existing node held...
      if (displaced.parentId && displaced.parentId !== oldId) {
        this.frames.get(displaced.parentId)?.children.delete(newId);
      }
      this.unlinkFromSession(displaced.ownerSessionId, newId);
      // ...and keep its descendants reachable from the merged node.
      for (const c of displaced.children) {
        if (c !== oldId) info.children.add(c);
      }
    }
    // A node must never list itself as a child.
    info.children.delete(newId);

    // Move info under new id
    const moved: FrameInfo = {
      ...info,
      parentId: info.parentId === newId ? null : info.parentId,
      lastSeen: info.lastSeen ? { ...info.lastSeen, id: newId } : undefined,
    };
    this.frames.delete(oldId);
    this.frames.set(newId, moved);

    // Fix parent's children set
    if (moved.parentId) {
      const p = this.frames.get(moved.parentId);
      if (p) {
        p.children.delete(oldId);
        p.children.add(newId);
      }
    }

    // Fix children's parent pointers
    for (const c of moved.children) {
      const ci = this.frames.get(c);
      if (ci) ci.parentId = newId;
    }

    // Fix inverse map (session -> frames)
    if (moved.ownerSessionId) {
      const bag =
        this.framesBySession.get(moved.ownerSessionId) ?? new Set<FrameId>();
      bag.delete(oldId);
      bag.add(newId);
      this.framesBySession.set(moved.ownerSessionId, bag);
    }
  }

  /** Set the owner of `frameId` to `sessionId`, updating the inverse map on both sides. */
  private setOwnerSessionIdInternal(
    frameId: FrameId,
    sessionId: SessionId,
  ): void {
    this.ensureNode(frameId);
    const info = this.frames.get(frameId)!;

    // If the owner is unchanged, do nothing
    if (info.ownerSessionId === sessionId) return;

    // Remove from previous owner bag
    this.unlinkFromSession(info.ownerSessionId, frameId);

    // Set new owner and update bag
    info.ownerSessionId = sessionId;
    const bag = this.framesBySession.get(sessionId) ?? new Set<FrameId>();
    bag.add(frameId);
    this.framesBySession.set(sessionId, bag);
  }
}


================================================
FILE: packages/core/lib/v3/understudy/initScripts.ts
================================================
import { promises as fs } from "fs";
import { InitScriptSource } from "../types/private/index.js";
import { StagehandInvalidArgumentError } from "../types/public/sdkErrors.js";

/** Label prefixed to error messages when `normalizeInitScriptSource` gets no explicit `caller`. */
const DEFAULT_CALLER = "context.addInitScript";

/**
 * Append a `//# sourceURL=` comment naming `filePath` to `source`.
 *
 * Every JavaScript line terminator (LF, CR, U+2028, U+2029) is stripped from the
 * path first: any of them would end the single-line comment early and turn the
 * rest of the path into executable script text.
 *
 * @param source   Script text to annotate.
 * @param filePath Path to report as the script's source URL.
 * @returns `source`, a newline, and the sourceURL comment.
 */
function appendSourceURL(source: string, filePath: string): string {
  const sanitized = filePath.replace(/[\r\n\u2028\u2029]/g, "");
  return `${source}\n//# sourceURL=${sanitized}`;
}

/**
 * Turn any supported init-script input into a single source string.
 *
 * - function: serialized as an immediately-invoked expression, called with the
 *   JSON form of `arg` (or the literal `undefined` when no arg is given);
 * - string: returned unchanged;
 * - object with a string `content`: that content is returned;
 * - object with a non-blank string `path`: the file is read as UTF-8 and a
 *   `sourceURL` comment is appended.
 *
 * @param script The script source in one of the shapes above.
 * @param arg    Argument for function scripts only.
 * @param caller Label used as the prefix of error messages.
 * @throws StagehandInvalidArgumentError when `arg` accompanies a non-function
 *         script, or when `script` matches none of the supported shapes.
 */
export async function normalizeInitScriptSource<Arg>(
  script: InitScriptSource<Arg>,
  arg?: Arg,
  caller: string = DEFAULT_CALLER,
): Promise<string> {
  const argProvided = !Object.is(arg, undefined);

  if (typeof script === "function") {
    const serializedArg = argProvided ? JSON.stringify(arg) : "undefined";
    return `(${script.toString()})(${serializedArg})`;
  }

  if (argProvided) {
    throw new StagehandInvalidArgumentError(
      `${caller}: 'arg' is only supported when passing a function.`,
    );
  }

  if (typeof script === "string") return script;

  const unsupportedShape = `${caller}: provide a string, function, or an object with path/content.`;

  if (typeof script !== "object" || !script) {
    throw new StagehandInvalidArgumentError(unsupportedShape);
  }

  // Inline content wins over a path when both are present.
  if (typeof script.content === "string") return script.content;

  const hasUsablePath =
    typeof script.path === "string" && Boolean(script.path.trim());
  if (!hasUsablePath) {
    throw new StagehandInvalidArgumentError(unsupportedShape);
  }

  const fileText = await fs.readFile(script.path, "utf8");
  return appendSourceURL(fileText, script.path);
}


================================================
FILE: packages/core/lib/v3/understudy/lifecycleWatcher.ts
================================================
import type { Protocol } from "devtools-protocol";
import type { LoadState } from "../types/public/page.js";
import type { CDPSessionLike } from "./cdp.js";
import type { NetworkManager } from "./networkManager.js";
import type { Page } from "./page.js";
import { TimeoutError } from "../types/public/sdkErrors.js";
import {
  DEFAULT_IDLE_WAIT,
  IGNORED_RESOURCE_TYPES,
  type NetworkRequestInfo,
  WaitForIdleHandle,
} from "../types/private/network.js";

/**
 * Coordinates page lifecycle waits (load/domcontentloaded/networkidle) while
 * following main-frame swaps and navigation aborts. Each navigation spawns a
 * one-off watcher that listens for relevant CDP events and resolves or rejects
 * depending on the requested `waitUntil` state.
 */

/**
 * Small utility that mirrors Playwright's lifecycle watcher semantics. Bridges
 * main-frame lifecycle events with the NetworkManager's idle signal so callers
 * can await `load`, `domcontentloaded`, or `networkidle` with a single promise.
 *
 * Usage: construct (listeners are installed immediately), optionally call
 * {@link setExpectedLoaderId}, then await {@link wait}. `wait()` always disposes
 * the watcher when it settles.
 */
export class LifecycleWatcher {
  private readonly page: Page;
  private readonly mainSession: CDPSessionLike;
  private readonly networkManager: NetworkManager;
  private readonly waitUntil: LoadState;
  private readonly timeoutMs: number;
  private readonly startTime: number;
  private readonly navigationCommandId: number;
  /** Loader id used to filter requests when waiting for network idle. */
  private currentLoaderId: string | undefined;
  /** Timestamp handed to the network manager as the start of the idle window. */
  private idleStartTime: number;

  private cleanupCallbacks: Array<() => void> = [];
  private idleHandle: WaitForIdleHandle | null = null;

  private abortReject: ((error: Error) => void) | null = null;
  /** Never resolves; rejects with the abort error once {@link triggerAbort} fires. */
  private abortPromise: Promise<never>;
  private abortError: Error | null = null;
  private disposed = false;

  /** Loader id the main frame is expected to report for this navigation. */
  private expectedLoaderId: string | undefined;
  private initialLoaderId: string | undefined;
  /** Set when a follow-up main-frame navigation interrupted a network-idle wait. */
  private pendingFollowupNavigation = false;

  /**
   * Create a watcher; callers should subsequently invoke {@link wait}.
   */
  constructor(params: {
    page: Page;
    mainSession: CDPSessionLike;
    networkManager: NetworkManager;
    waitUntil: LoadState;
    timeoutMs: number;
    navigationCommandId: number;
  }) {
    this.page = params.page;
    this.mainSession = params.mainSession;
    this.networkManager = params.networkManager;
    this.waitUntil = params.waitUntil;
    this.timeoutMs = params.timeoutMs;
    this.startTime = Date.now();
    this.navigationCommandId = params.navigationCommandId;
    this.idleStartTime = this.startTime;

    this.abortPromise = new Promise<never>((_, reject) => {
      this.abortReject = reject;
    });
    // Listeners are live from construction, so an abort can fire before wait() has
    // started racing against abortPromise. Attach a no-op handler so that early
    // rejection is not reported as unhandled; awaitWithAbort() still observes it
    // through Promise.race.
    void this.abortPromise.catch(() => {});

    this.installSessionListeners();
  }

  /** Hint the watcher with the loader id returned by Page.navigate. */
  public setExpectedLoaderId(loaderId: string | undefined): void {
    if (!loaderId) return;
    this.expectedLoaderId = loaderId;
    this.initialLoaderId = loaderId;
    this.currentLoaderId = loaderId;
    this.idleStartTime = Date.now();
  }

  /** Wait for the requested lifecycle state or throw on timeout/abort. */
  public async wait(): Promise<void> {
    const deadline = Date.now() + this.timeoutMs;

    try {
      if (this.waitUntil === "domcontentloaded") {
        await this.awaitWithAbort(
          this.page.waitForMainLoadState(
            "domcontentloaded",
            this.timeRemaining(deadline),
          ),
        );
        return;
      }

      while (true) {
        await this.awaitWithAbort(
          this.page.waitForMainLoadState("load", this.timeRemaining(deadline)),
        );

        if (this.waitUntil !== "networkidle") break;

        try {
          await this.awaitWithAbort(this.waitForNetworkIdle(deadline));
          break;
        } catch (error) {
          // A follow-up navigation disposed the idle wait: start over with `load`.
          if (this.shouldRestartAfterFollowup(error)) {
            continue;
          }
          throw error;
        }
      }
    } finally {
      this.dispose();
    }

    if (this.abortError) throw this.abortError;
  }

  /** Cancel any outstanding network-idle waits and remove event listeners. */
  public dispose(): void {
    if (this.disposed) return;
    this.disposed = true;

    if (this.idleHandle) {
      // Swallow the rejection that disposing the handle may produce.
      void this.idleHandle.promise.catch(() => {});
      this.idleHandle.dispose();
      this.idleHandle = null;
    }

    for (const fn of this.cleanupCallbacks) {
      try {
        fn();
      } catch {
        // ignore listener cleanup errors
      }
    }
    this.cleanupCallbacks = [];
    this.abortReject = null;
  }

  /** Subscribe to main-frame events to detect abort conditions. */
  private installSessionListeners(): void {
    const onFrameNavigated = (evt: Protocol.Page.FrameNavigatedEvent) => {
      if (!evt?.frame?.id) return;

      const mainFrameId = this.page.mainFrameId();
      if (evt.frame.id !== mainFrameId) return;

      const loaderId = evt.frame.loaderId;
      if (!loaderId) return;

      if (!this.initialLoaderId) {
        this.initialLoaderId = loaderId;
        this.currentLoaderId = loaderId;
        this.idleStartTime = Date.now();
      }

      if (!this.expectedLoaderId) {
        this.expectedLoaderId = loaderId;
        this.currentLoaderId = loaderId;
        this.idleStartTime = Date.now();
        return;
      }

      if (loaderId !== this.expectedLoaderId) {
        // A different loader took over the main frame. If another navigation command
        // has been issued since ours, this wait is obsolete; otherwise follow the
        // new loader.
        if (!this.page.isCurrentNavigationCommand(this.navigationCommandId)) {
          this.triggerAbort(
            new Error("Navigation was superseded by a new request"),
          );
          return;
        }

        this.adoptNewMainLoader(loaderId);
      }
    };

    const onFrameDetached = (evt: Protocol.Page.FrameDetachedEvent) => {
      if (!evt?.frameId) return;
      const mainFrameId = this.page.mainFrameId();
      if (evt.frameId !== mainFrameId) return;
      if (evt.reason === "swap") return;
      this.triggerAbort(new Error("Main frame was detached"));
    };

    this.mainSession.on("Page.frameNavigated", onFrameNavigated);
    this.cleanupCallbacks.push(() => {
      this.mainSession.off("Page.frameNavigated", onFrameNavigated);
    });

    this.mainSession.on("Page.frameDetached", onFrameDetached);
    this.cleanupCallbacks.push(() => {
      this.mainSession.off("Page.frameDetached", onFrameDetached);
    });
  }

  /**
   * Compute remaining time until the shared deadline elapses.
   * @throws TimeoutError when the deadline has already passed.
   */
  private timeRemaining(deadline: number): number {
    const remaining = deadline - Date.now();
    if (remaining <= 0) {
      throw new TimeoutError("Lifecycle wait", this.timeoutMs);
    }
    return remaining;
  }

  /** Await an operation but abort early if navigation replacement fires. */
  private async awaitWithAbort<T>(operation: Promise<T>): Promise<T> {
    try {
      return await Promise.race([operation, this.abortPromise]);
    } catch (error) {
      // Prefer the abort error over whatever the operation failed with.
      if (this.abortError) throw this.abortError;
      throw error;
    }
  }

  /** Mark the watcher as aborted and reject any pending waiters. */
  private triggerAbort(error: Error): void {
    if (this.abortError) return;
    this.abortError = error;
    if (this.abortReject) {
      this.abortReject(error);
      this.abortReject = null;
    }
  }

  /**
   * Start a network-idle wait bounded by the shared deadline and remember its
   * handle so a follow-up navigation or dispose() can cancel it.
   */
  private waitForNetworkIdle(deadline: number): Promise<void> {
    this.pendingFollowupNavigation = false;
    const remaining = this.timeRemaining(deadline);
    const idleWindow = Math.min(DEFAULT_IDLE_WAIT, remaining);
    this.idleHandle = this.networkManager.waitForIdle({
      startTime: this.idleStartTime,
      timeoutMs: remaining,
      totalBudgetMs: this.timeoutMs,
      idleTimeMs: idleWindow,
      filter: this.buildIdleFilter(),
    });

    return this.idleHandle.promise.catch((error) => {
      if (this.abortError) throw this.abortError;
      throw error;
    });
  }

  /**
   * Decide whether a failed idle wait should restart the load/idle cycle: true only
   * when a follow-up navigation is pending and the failure is the "waitForIdle
   * disposed" error. Clears the pending flag when it returns true.
   */
  private shouldRestartAfterFollowup(error: unknown): boolean {
    if (!this.pendingFollowupNavigation) return false;
    if (!(error instanceof Error)) return false;
    if (error.message !== "waitForIdle disposed") return false;
    this.pendingFollowupNavigation = false;
    return true;
  }

  /**
   * Track a new main-frame loader. For `networkidle` waits, also flag the follow-up
   * navigation and dispose the in-flight idle wait so wait() can restart.
   */
  private adoptNewMainLoader(loaderId: string): void {
    this.expectedLoaderId = loaderId;
    this.currentLoaderId = loaderId;
    this.idleStartTime = Date.now();
    if (this.waitUntil !== "networkidle") return;

    this.pendingFollowupNavigation = true;

    if (this.idleHandle) {
      const handle = this.idleHandle;
      this.idleHandle = null;
      void handle.promise.catch(() => {});
      handle.dispose();
    }
  }

  /**
   * Build the request filter for the idle wait, using the loader id and main frame
   * id captured at call time. Ignored resource types never count. A request with a
   * loader id counts only when it matches the captured loader (if one is known). A
   * request without a loader id but with a frame id counts only for the main frame.
   * Anything else counts.
   */
  private buildIdleFilter(): (info: NetworkRequestInfo) => boolean {
    const loaderId = this.currentLoaderId;
    const mainFrameId = this.page.mainFrameId();

    return (info: NetworkRequestInfo) => {
      if (IGNORED_RESOURCE_TYPES.has(info.resourceType)) return false;

      if (loaderId && info.loaderId) {
        return info.loaderId === loaderId;
      }

      if (!info.loaderId && info.frameId) {
        return info.frameId === mainFrameId;
      }

      return true;
    };
  }
}


================================================
FILE: packages/core/lib/v3/understudy/locator.ts
================================================
// lib/v3/understudy/locator.ts
import { Protocol } from "devtools-protocol";
import * as fs from "fs";
import * as os from "os";
import * as path from "path";
import {
  locatorScriptBootstrap,
  locatorScriptGlobalRefs,
  locatorScriptSources,
} from "../dom/build/locatorScripts.generated.js";
import type { Frame } from "./frame.js";
import {
  FrameSelectorResolver,
  type SelectorQuery,
} from "./selectorResolver.js";
import {
  StagehandElementNotFoundError,
  StagehandInvalidArgumentError,
  StagehandLocatorError,
  ElementNotVisibleError,
} from "../types/public/sdkErrors.js";
import { normalizeInputFiles } from "./fileUploadUtils.js";
import { SetInputFilesArgument, MouseButton } from "../types/public/locator.js";
import { NormalizedFilePayload } from "../types/private/locator.js";

/** Size limit in bytes (50 * 1024 * 1024) for remote uploads. */
const MAX_REMOTE_UPLOAD_BYTES = 50 * 1024 * 1024; // 50MB guard copied from Playwright

/**
 * Locator
 *
 * Purpose:
 * A small, CDP-based element interaction helper scoped to a specific `Frame`.
 * It resolves a CSS/XPath selector inside the frame’s **isolated world**, and then
 * performs low-level actions (click, type, select) using DOM/Runtime/Input
 * protocol domains with minimal abstraction.
 *
 * Key change:
 * - Prefer **objectId**-based CDP calls (scroll, geometry) to avoid brittle
 *   frontend nodeId mappings. nodeId is resolved on a best-effort basis and
 *   returned for compatibility, but actions do not depend on it.
 *
 * Notes:
 * - Resolution is lazy: every action resolves the selector again.
 * - Uses `Page.createIsolatedWorld` so evaluation is isolated from page scripts.
 * - Releases remote objects (`Runtime.releaseObject`) where appropriate.
 */
export class Locator {
  private readonly selectorResolver: FrameSelectorResolver;

  private readonly selectorQuery: SelectorQuery;

  // -1 means "no explicit nth()"; default locator resolves to first match for actions.
  private readonly nthIndex: number;

  /**
   * Build a locator for `selector` scoped to `frame`.
   *
   * @param frame - Frame whose CDP session is used by every action.
   * @param selector - Raw selector string; parsed once into a SelectorQuery.
   * @param options - Optional lookup settings; stored as given and passed on by nth().
   * @param nthIndex - Zero-based match index. Non-finite or negative values are
   *   stored as -1, the sentinel for "no explicit nth()".
   */
  constructor(
    private readonly frame: Frame,
    private readonly selector: string,
    private readonly options?: { deep?: boolean; depth?: number },
    nthIndex: number = -1,
  ) {
    this.selectorResolver = new FrameSelectorResolver(this.frame);
    this.selectorQuery = FrameSelectorResolver.parseSelector(selector);
    // Round fractional indices down, then collapse every negative to the -1 sentinel.
    const floored = Number.isFinite(nthIndex) ? Math.floor(nthIndex) : -1;
    this.nthIndex = Math.max(-1, floored);
  }

  /**
   * Return the Frame this locator is scoped to.
   *
   * Typed accessor so callers do not have to reach into the private `frame` field.
   */
  public getFrame(): Frame {
    return this.frame;
  }

  /**
   * Attach files to an <input type="file"> element.
   *
   * Follows the basics of Playwright's Locator.setInputFiles:
   * - Accepts file path(s) or payload object(s) { name, mimeType, buffer }.
   * - An empty list clears the current selection.
   * - Local browsers receive file paths via CDP `DOM.setFileInputFiles`;
   *   buffer-only payloads are first written to temp files.
   * - Remote browsers receive the bytes through in-page payload injection.
   *
   * @param files - Path(s) and/or payload(s) to assign to the input.
   * @throws StagehandInvalidArgumentError when the target cannot be verified
   *   as a file input (including when the verification call itself fails).
   */
  public async setInputFiles(files: SetInputFilesArgument): Promise<void> {
    const cdp = this.frame.session;
    const { objectId } = await this.resolveNode();

    // Temp files written below; all of them are removed in `finally`.
    const scratchPaths: string[] = [];

    try {
      // Step 1: confirm the resolved element really is a file input.
      try {
        const check =
          await cdp.send<Protocol.Runtime.CallFunctionOnResponse>(
            "Runtime.callFunctionOn",
            {
              objectId,
              functionDeclaration: locatorScriptSources.ensureFileInputElement,
              returnByValue: true,
            },
          );
        if (!check.result.value) {
          throw new StagehandInvalidArgumentError(
            'Target is not an <input type="file"> element',
          );
        }
      } catch (err) {
        // Every failure in the verification step surfaces as an invalid-argument error.
        const reason =
          err instanceof Error
            ? err.message
            : "Unable to verify file input element";
        throw new StagehandInvalidArgumentError(reason);
      }

      const payloads = await normalizeInputFiles(files);

      // Step 2: nothing to attach means "clear the input".
      if (payloads.length === 0) {
        await cdp.send<never>("DOM.setFileInputFiles", {
          objectId,
          files: [],
        });
        return;
      }

      // Step 3: a remote browser cannot read our filesystem; ship the bytes instead.
      if (this.frame.isBrowserRemote()) {
        await this.assignFilesViaPayloadInjection(objectId, payloads);
        return;
      }

      // Step 4: local browser. Reuse on-disk paths; spill buffers to temp files.
      const localPaths: string[] = [];
      for (const item of payloads) {
        let target = item.absolutePath;
        if (!target) {
          const extension = path.extname(item.name);
          const fileName = `stagehand-upload-${Date.now()}-${Math.random().toString(36).slice(2)}${extension}`;
          target = path.join(os.tmpdir(), fileName);
          await fs.promises.writeFile(target, item.buffer);
          scratchPaths.push(target);
        }
        localPaths.push(target);
      }

      await cdp.send<never>("DOM.setFileInputFiles", {
        objectId,
        files: localPaths,
      });
    } finally {
      // Best-effort cleanup: drop the element handle, then delete temp files.
      // NOTE(review): temp files are removed as soon as DOM.setFileInputFiles
      // returns; confirm Chrome does not need to read them later (e.g. on submit).
      await cdp
        .send<never>("Runtime.releaseObject", { objectId })
        .catch(() => {});
      for (const scratch of scratchPaths) {
        await fs.promises.unlink(scratch).catch(() => {});
      }
    }
  }

  /**
   * Remote-browser path for setInputFiles: create File objects inside the page.
   *
   * A browser that cannot see the local filesystem (Browserbase, remote CDP, etc.)
   * cannot open paths passed to DOM.setFileInputFiles. Each payload is therefore
   * base64-encoded and handed to an in-page helper that attaches it to the input.
   *
   * @param objectId - Remote handle of the file input element.
   * @param files - Normalized payloads whose buffers are sent to the page.
   * @throws StagehandInvalidArgumentError if any file exceeds
   *   MAX_REMOTE_UPLOAD_BYTES or the in-page helper returns a falsy result.
   */
  private async assignFilesViaPayloadInjection(
    objectId: Protocol.Runtime.RemoteObjectId,
    files: NormalizedFilePayload[],
  ): Promise<void> {
    // Reject the first oversized file before encoding anything.
    const oversized = files.find(
      (candidate) => candidate.buffer.length > MAX_REMOTE_UPLOAD_BYTES,
    );
    if (oversized) {
      throw new StagehandInvalidArgumentError(
        `setInputFiles(): file "${oversized.name}" is larger than the 50MB limit for remote uploads`,
      );
    }

    // Buffers cannot be passed by value over CDP, so send base64 text.
    const wirePayloads = files.map(
      ({ name, mimeType, lastModified, buffer }) => ({
        name,
        mimeType,
        lastModified,
        base64: buffer.toString("base64"),
      }),
    );

    const response =
      await this.frame.session.send<Protocol.Runtime.CallFunctionOnResponse>(
        "Runtime.callFunctionOn",
        {
          objectId,
          functionDeclaration:
            locatorScriptSources.assignFilePayloadsToInputElement,
          arguments: [{ value: wirePayloads }],
          returnByValue: true,
        },
      );

    if (!response.result?.value) {
      throw new StagehandInvalidArgumentError(
        "Unable to assign file payloads to remote input element",
      );
    }
  }

  /**
   * Look up the DOM backendNodeId of the element this locator targets.
   * Handy for identity comparisons that do not require keeping a handle alive.
   *
   * @returns The backendNodeId reported by `DOM.describeNode`.
   */
  async backendNodeId(): Promise<Protocol.DOM.BackendNodeId> {
    const cdp = this.frame.session;
    const { objectId: handleId } = await this.resolveNode();
    try {
      // Enabling the DOM domain is best-effort; a failure here is ignored.
      await cdp.send("DOM.enable").catch(() => {});
      const described = await cdp.send<{ node: Protocol.DOM.Node }>(
        "DOM.describeNode",
        { objectId: handleId },
      );
      return described.node.backendNodeId as Protocol.DOM.BackendNodeId;
    } finally {
      // Always drop the temporary handle; release errors are swallowed.
      await cdp
        .send<never>("Runtime.releaseObject", { objectId: handleId })
        .catch(() => {});
    }
  }

  /**
   * Count the nodes matched by this locator's selector.
   *
   * Enables the Runtime and DOM domains first, then delegates to the shared
   * selector resolver.
   *
   * @returns Number of matches reported by the resolver.
   */
  public async count(): Promise<number> {
    const { session } = this.frame;
    await session.send("Runtime.enable");
    await session.send("DOM.enable");
    const total = await this.selectorResolver.count(this.selectorQuery);
    return total;
  }

  /**
   * Compute the center of the element's content box, rounded to integers.
   * The element is scrolled into view first on a best-effort basis.
   *
   * @returns Rounded `{ x, y }` derived from the `DOM.getBoxModel` content quad.
   * @throws ElementNotVisibleError when no box model is returned.
   */
  public async centroid(): Promise<{ x: number; y: number }> {
    const cdp = this.frame.session;
    const { objectId } = await this.resolveNode();
    try {
      // Scrolling may fail (e.g. detached node); geometry lookup decides the outcome.
      await cdp
        .send("DOM.scrollIntoViewIfNeeded", { objectId })
        .catch(() => {});
      const { model } = await cdp.send<Protocol.DOM.GetBoxModelResponse>(
        "DOM.getBoxModel",
        { objectId },
      );
      if (!model) throw new ElementNotVisibleError(this.selector);
      const center = this.centerFromBoxContent(model.content);
      return { x: Math.round(center.cx), y: Math.round(center.cy) };
    } finally {
      await cdp
        .send<never>("Runtime.releaseObject", { objectId })
        .catch(() => {});
    }
  }

  /**
   * Highlight the element's bounding box using the CDP Overlay domain.
   * - Scrolls element into view best-effort.
   * - Draws the overlay, re-draws it periodically for `durationMs`, then hides it.
   * - When `durationMs` is 0 the overlay is drawn once and this method does not
   *   hide it.
   *
   * @param options.durationMs - How long to keep the highlight alive (default 800;
   *   negative values are clamped to 0).
   * @param options.borderColor - RGBA border color (default opaque-ish red).
   * @param options.contentColor - RGBA fill color (default translucent amber).
   */
  public async highlight(options?: {
    durationMs?: number;
    borderColor?: { r: number; g: number; b: number; a?: number };
    contentColor?: { r: number; g: number; b: number; a?: number };
  }): Promise<void> {
    const session = this.frame.session;
    const { objectId } = await this.resolveNode();
    // Clamp negative durations to zero.
    const duration = Math.max(0, options?.durationMs ?? 800);

    const borderColor = options?.borderColor ?? { r: 255, g: 0, b: 0, a: 0.9 };
    const contentColor =
      options?.contentColor ?? ({ r: 255, g: 200, b: 0, a: 0.2 } as const);

    try {
      // Enabling Overlay and scrolling are both best-effort; failures are ignored.
      await session.send("Overlay.enable").catch(() => {});
      await session
        .send("DOM.scrollIntoViewIfNeeded", { objectId })
        .catch(() => {});

      // Prefer backendNodeId to keep highlight stable even if objectId is released.
      await session.send("DOM.enable").catch(() => {});
      let backendNodeId: Protocol.DOM.BackendNodeId | undefined;
      try {
        const { node } = await session.send<{ node: Protocol.DOM.Node }>(
          "DOM.describeNode",
          { objectId },
        );
        backendNodeId = node.backendNodeId as Protocol.DOM.BackendNodeId;
      } catch {
        // describeNode failed: fall back to addressing the node by objectId.
        backendNodeId = undefined;
      }

      const highlightConfig: Protocol.Overlay.HighlightConfig = {
        showInfo: false,
        showStyles: false,
        showRulers: false,
        showExtensionLines: false,
        borderColor,
        contentColor,
      } as Protocol.Overlay.HighlightConfig;

      // Single draw call; addresses the node by backendNodeId when available.
      const highlightOnce = async () => {
        await session.send<never>("Overlay.highlightNode", {
          ...(backendNodeId ? { backendNodeId } : { objectId }),
          highlightConfig,
        });
      };

      // Initial draw
      await highlightOnce();

      // Keep alive until duration elapses to resist overlay clears on mouse move/repaints
      if (duration > 0) {
        const start = Date.now();
        // Redraw interval: duration / 50, clamped to the range [100, 300] ms.
        const tick = Math.min(300, Math.max(100, Math.floor(duration / 50)));
        while (Date.now() - start < duration) {
          await new Promise((r) => setTimeout(r, tick));
          try {
            await highlightOnce();
          } catch {
            // ignore transient errors
          }
        }
        await session.send<never>("Overlay.hideHighlight").catch(() => {});
      }
    } finally {
      // Releasing objectId should not affect highlight when using backendNodeId.
      await session
        .send<never>("Runtime.releaseObject", { objectId })
        .catch(() => {});
    }
  }

  /**
   * Park the mouse cursor over the element's center without pressing a button.
   * Scrolls into view (best-effort), reads the box model, then sends one
   * `mouseMoved` event at the computed center.
   *
   * @throws ElementNotVisibleError when no box model is returned.
   */
  async hover(): Promise<void> {
    const cdp = this.frame.session;
    const { objectId } = await this.resolveNode();
    try {
      await cdp
        .send("DOM.scrollIntoViewIfNeeded", { objectId })
        .catch(() => {});

      const { model } = await cdp.send<Protocol.DOM.GetBoxModelResponse>(
        "DOM.getBoxModel",
        { objectId },
      );
      if (!model) throw new ElementNotVisibleError(this.selector);
      const center = this.centerFromBoxContent(model.content);

      const move = {
        type: "mouseMoved",
        x: center.cx,
        y: center.cy,
        button: "none",
      } as Protocol.Input.DispatchMouseEventRequest;
      await cdp.send<never>("Input.dispatchMouseEvent", move);
    } finally {
      await cdp
        .send<never>("Runtime.releaseObject", { objectId })
        .catch(() => {});
    }
  }

  /**
   * Click the element at the center of its content box.
   *
   * Sequence:
   *  1) Resolve the selector to an objectId.
   *  2) `DOM.scrollIntoViewIfNeeded` (errors propagate here, unlike hover()).
   *  3) `DOM.getBoxModel` → center point.
   *  4) One `mouseMoved`, then `clickCount` pressed/released pairs whose
   *     `clickCount` field counts up from 1.
   *
   * @param options.button - Mouse button to press (default "left").
   * @param options.clickCount - Number of press/release pairs (default 1).
   * @throws ElementNotVisibleError when no box model is returned.
   */
  async click(options?: {
    button?: MouseButton;
    clickCount?: number;
  }): Promise<void> {
    const cdp = this.frame.session;
    const { objectId } = await this.resolveNode();

    const pressedButton = options?.button ?? "left";
    const presses = options?.clickCount ?? 1;

    try {
      // objectId-based calls avoid depending on frontend nodeId mappings.
      await cdp.send("DOM.scrollIntoViewIfNeeded", { objectId });

      const { model } = await cdp.send<Protocol.DOM.GetBoxModelResponse>(
        "DOM.getBoxModel",
        { objectId },
      );
      if (!model) throw new ElementNotVisibleError(this.selector);
      const { cx, cy } = this.centerFromBoxContent(model.content);

      // Build the full event list first, then fire every request back-to-back
      // so inter-click delay is not inflated by per-request round trips.
      const events: Protocol.Input.DispatchMouseEventRequest[] = [
        {
          type: "mouseMoved",
          x: cx,
          y: cy,
          button: "none",
        } as Protocol.Input.DispatchMouseEventRequest,
      ];
      for (let n = 1; n <= presses; n++) {
        for (const type of ["mousePressed", "mouseReleased"] as const) {
          events.push({
            type,
            x: cx,
            y: cy,
            button: pressedButton,
            clickCount: n,
          } as Protocol.Input.DispatchMouseEventRequest);
        }
      }

      await Promise.all(
        events.map((event) =>
          cdp.send<never>("Input.dispatchMouseEvent", event),
        ),
      );
    } finally {
      // Drop the element handle.
      try {
        await cdp.send<never>("Runtime.releaseObject", { objectId });
      } catch {
        // The click may have navigated or destroyed the context (e.g. a link
        // opening a new tab), in which case releaseObject fails with -32000.
        // Cleanup is best-effort, so the error is ignored.
      }
    }
  }

  /**
   * Dispatch a DOM 'click' MouseEvent directly on the element.
   * - No real pointer input is synthesized; an in-page helper fires the event.
   * - Useful for elements that rely on click handlers without needing hit-testing.
   *
   * @param options - MouseEvent init flags. `bubbles`, `cancelable` and
   *   `composed` default to true; `detail` defaults to 1.
   */
  async sendClickEvent(options?: {
    bubbles?: boolean;
    cancelable?: boolean;
    composed?: boolean;
    detail?: number;
  }): Promise<void> {
    const cdp = this.frame.session;
    const { objectId } = await this.resolveNode();

    // Fill in defaults for any flag the caller left out.
    const eventInit = {
      bubbles: options?.bubbles ?? true,
      cancelable: options?.cancelable ?? true,
      composed: options?.composed ?? true,
      detail: options?.detail ?? 1,
    };

    try {
      // Scrolling is best-effort; the event is dispatched regardless.
      await cdp
        .send("DOM.scrollIntoViewIfNeeded", { objectId })
        .catch(() => {});
      await cdp.send<Protocol.Runtime.CallFunctionOnResponse>(
        "Runtime.callFunctionOn",
        {
          objectId,
          functionDeclaration: locatorScriptSources.dispatchDomClick,
          arguments: [{ value: eventInit }],
          returnByValue: true,
        },
      );
    } finally {
      await cdp
        .send<never>("Runtime.releaseObject", { objectId })
        .catch(() => {});
    }
  }

  /**
   * Scroll the element vertically to a percentage position (0–100).
   *
   * The work is done by the in-page `scrollElementToPercent` helper, which is
   * described as scrolling the window for <html>/<body> and the element itself
   * otherwise.
   *
   * @param percent - Target position; passed through to the helper unchanged,
   *   whether given as a number or a string.
   */
  async scrollTo(percent: number | string): Promise<void> {
    const cdp = this.frame.session;
    const { objectId } = await this.resolveNode();

    const request = {
      objectId,
      functionDeclaration: locatorScriptSources.scrollElementToPercent,
      arguments: [{ value: percent as unknown as number }],
      returnByValue: true,
    };

    try {
      await cdp.send<Protocol.Runtime.CallFunctionOnResponse>(
        "Runtime.callFunctionOn",
        request,
      );
    } finally {
      await cdp
        .send<never>("Runtime.releaseObject", { objectId })
        .catch(() => {});
    }
  }

  /**
   * Fill an input/textarea/contenteditable element.
   * Mirrors Playwright semantics: the DOM helper either applies the native
   * value setter (for special input types) or asks us to type text via the CDP
   * Input domain after focusing/selecting.
   *
   * The helper's result carries a `status` that selects the path taken here:
   * - "done": nothing more to do.
   * - "needsinput": text is entered through the CDP Input domain.
   * - "error": rejected with the helper's `reason`.
   * - missing status: falls back to `type(value)`.
   *
   * @param value - Text to place in the element; an empty string clears it.
   * @throws StagehandLocatorError when the helper call reports exceptionDetails.
   * @throws StagehandInvalidArgumentError when the helper returns status "error".
   */
  async fill(value: string): Promise<void> {
    const session = this.frame.session;
    // Use the bundled locator globals; the raw fill snippet depends on helper symbols.
    const fillDeclaration = `function(value) { ${locatorScriptBootstrap}; return ${locatorScriptGlobalRefs.fillElementValue}.call(this, value); }`;
    const { objectId } = await this.resolveNode();

    // Tracks whether the `finally` block still owns the handle for `objectId`.
    let releaseNeeded = true;

    try {
      const res = await session.send<Protocol.Runtime.CallFunctionOnResponse>(
        "Runtime.callFunctionOn",
        {
          objectId,
          functionDeclaration: fillDeclaration,
          arguments: [{ value }],
          returnByValue: true,
        },
      );
      if (res.exceptionDetails) {
        // prefer exception.description over text (eg "Uncaught")
        const message =
          res.exceptionDetails.exception?.description ??
          res.exceptionDetails.text ??
          "Unknown exception during locator().fill()";
        throw new StagehandLocatorError("Filling", this.selector, message);
      }

      const result = res.result.value as
        | { status?: string; reason?: string; value?: string }
        | null
        | undefined;
      // Non-object or null results are treated as "no status".
      const status =
        typeof result === "object" && result ? result.status : undefined;

      if (status === "done") {
        return;
      }

      if (status === "needsinput") {
        // Release the current handle before synthesizing keyboard input to avoid leaking it.
        await session
          .send<never>("Runtime.releaseObject", { objectId })
          .catch(() => {});
        releaseNeeded = false;

        // The helper may hand back the text to type; otherwise use the caller's value.
        const valueToType =
          typeof result?.value === "string" ? result.value : value;

        let prepared = false;
        try {
          // Re-resolve to get a fresh handle for the preparation helper.
          const { objectId: prepObjectId } = await this.resolveNode();
          try {
            const prepRes =
              await session.send<Protocol.Runtime.CallFunctionOnResponse>(
                "Runtime.callFunctionOn",
                {
                  objectId: prepObjectId,
                  functionDeclaration:
                    locatorScriptSources.prepareElementForTyping,
                  returnByValue: true,
                },
              );
            prepared = Boolean(prepRes.result.value);
          } finally {
            await session
              .send<never>("Runtime.releaseObject", { objectId: prepObjectId })
              .catch(() => {});
          }
        } catch {
          // Ignore preparation failures; we'll fall back to typing best-effort.
        }

        // Preparation did not succeed: let type() focus the element and insert the text.
        if (!prepared && valueToType.length > 0) {
          await this.type(valueToType);
          return;
        }

        if (valueToType.length === 0) {
          // Simulate deleting the currently selected text to clear the field.
          await session.send<never>("Input.dispatchKeyEvent", {
            type: "keyDown",
            key: "Backspace",
            code: "Backspace",
            windowsVirtualKeyCode: 8,
            nativeVirtualKeyCode: 8,
          } as Protocol.Input.DispatchKeyEventRequest);
          await session.send<never>("Input.dispatchKeyEvent", {
            type: "keyUp",
            key: "Backspace",
            code: "Backspace",
            windowsVirtualKeyCode: 8,
            nativeVirtualKeyCode: 8,
          } as Protocol.Input.DispatchKeyEventRequest);
        } else {
          // Element was prepared: insert the text in one shot.
          await session.send<never>("Input.insertText", { text: valueToType });
        }

        return;
      }

      if (status === "error") {
        const reason =
          typeof result?.reason === "string" && result.reason.length > 0
            ? result.reason
            : "Failed to fill element";
        throw new StagehandInvalidArgumentError(
          `Failed to fill element (${reason})`,
        );
      }

      // Backward compatibility: if no status is returned (older bundle), fall back to setter logic.
      if (!status) {
        await this.type(value);
      }
    } finally {
      // Skip the release when the "needsinput" branch already dropped the handle.
      if (releaseNeeded) {
        await session
          .send<never>("Runtime.releaseObject", { objectId })
          .catch(() => {});
      }
    }
  }

  /**
   * Type text into the element (focuses first).
   * - Focus via element.focus() in page JS (no DOM.focus(nodeId)).
   * - If no delay, uses `Input.insertText` for efficiency.
   * - With delay, synthesizes `keyDown`/`keyUp` per character and waits
   *   `delay` milliseconds after each one.
   *
   * @param text - Text to enter.
   * @param options.delay - Per-character pause in milliseconds; falsy values
   *   (undefined, 0) select the single `Input.insertText` path.
   */
  async type(text: string, options?: { delay?: number }): Promise<void> {
    const session = this.frame.session;
    const { objectId } = await this.resolveNode();

    try {
      // Focus using JS (avoids DOM.focus(nodeId))
      await session.send<Protocol.Runtime.CallFunctionOnResponse>(
        "Runtime.callFunctionOn",
        {
          objectId,
          functionDeclaration: locatorScriptSources.focusElement,
          returnByValue: true,
        },
      );

      const delay = options?.delay;
      if (!delay) {
        await session.send<never>("Input.insertText", { text });
        return;
      }

      for (const ch of text) {
        await session.send<never>("Input.dispatchKeyEvent", {
          type: "keyDown",
          text: ch,
          key: ch,
        } as Protocol.Input.DispatchKeyEventRequest);

        await session.send<never>("Input.dispatchKeyEvent", {
          type: "keyUp",
          text: ch,
          key: ch,
        } as Protocol.Input.DispatchKeyEventRequest);

        await new Promise((r) => setTimeout(r, delay));
      }
    } finally {
      // Best-effort cleanup: a failed release (e.g. the context was destroyed)
      // must not reject a successful call or replace the original error.
      await session
        .send<never>("Runtime.releaseObject", { objectId })
        .catch(() => {});
    }
  }

  /**
   * Select one or more options on a `<select>` element.
   *
   * @param values - A single value or a list of values; a single value is
   *   wrapped into a one-element list before being sent to the page helper.
   * @returns The array returned by the in-page `selectElementOptions` helper
   *   (described as the values actually selected), or `[]` when it returns
   *   null/undefined.
   */
  async selectOption(values: string | string[]): Promise<string[]> {
    const session = this.frame.session;
    const desired = Array.isArray(values) ? values : [values];
    const { objectId } = await this.resolveNode();

    try {
      const res = await session.send<Protocol.Runtime.CallFunctionOnResponse>(
        "Runtime.callFunctionOn",
        {
          objectId,
          functionDeclaration: locatorScriptSources.selectElementOptions,
          arguments: [{ value: desired }],
          returnByValue: true,
        },
      );

      return (res.result.value as string[]) ?? [];
    } finally {
      // Best-effort cleanup: a failed release must not reject a successful
      // call or replace the original error.
      await session
        .send<never>("Runtime.releaseObject", { objectId })
        .catch(() => {});
    }
  }

  /**
   * Return true if the element is attached and visible (rough heuristic).
   *
   * @returns The truthiness of the in-page `isElementVisible` helper's result.
   */
  async isVisible(): Promise<boolean> {
    const session = this.frame.session;
    const { objectId } = await this.resolveNode();
    try {
      const res = await session.send<Protocol.Runtime.CallFunctionOnResponse>(
        "Runtime.callFunctionOn",
        {
          objectId,
          functionDeclaration: locatorScriptSources.isElementVisible,
          returnByValue: true,
        },
      );
      return Boolean(res.result.value);
    } finally {
      // Best-effort cleanup: a failed release must not reject a successful
      // call or replace the original error.
      await session
        .send<never>("Runtime.releaseObject", { objectId })
        .catch(() => {});
    }
  }

  /**
   * Return true if the element is an input[type=checkbox|radio] and is checked.
   * Also considers aria-checked for ARIA widgets.
   *
   * @returns The truthiness of the in-page `isElementChecked` helper's result.
   */
  async isChecked(): Promise<boolean> {
    const session = this.frame.session;
    const { objectId } = await this.resolveNode();
    try {
      const res = await session.send<Protocol.Runtime.CallFunctionOnResponse>(
        "Runtime.callFunctionOn",
        {
          objectId,
          functionDeclaration: locatorScriptSources.isElementChecked,
          returnByValue: true,
        },
      );
      return Boolean(res.result.value);
    } finally {
      // Best-effort cleanup: a failed release must not reject a successful
      // call or replace the original error.
      await session
        .send<never>("Runtime.releaseObject", { objectId })
        .catch(() => {});
    }
  }

  /**
   * Return the element's input value (for input/textarea/select/contenteditable).
   *
   * @returns The in-page `readElementInputValue` helper's result coerced to a
   *   string; null/undefined become "".
   */
  async inputValue(): Promise<string> {
    const session = this.frame.session;
    const { objectId } = await this.resolveNode();
    try {
      const res = await session.send<Protocol.Runtime.CallFunctionOnResponse>(
        "Runtime.callFunctionOn",
        {
          objectId,
          functionDeclaration: locatorScriptSources.readElementInputValue,
          returnByValue: true,
        },
      );
      return String(res.result.value ?? "");
    } finally {
      // Best-effort cleanup: a failed release must not reject a successful
      // call or replace the original error.
      await session
        .send<never>("Runtime.releaseObject", { objectId })
        .catch(() => {});
    }
  }

  /**
   * Return the element's textContent (raw, not innerText).
   *
   * @returns The in-page `readElementTextContent` helper's result coerced to a
   *   string; null/undefined become "".
   */
  async textContent(): Promise<string> {
    const session = this.frame.session;
    const { objectId } = await this.resolveNode();
    try {
      const res = await session.send<Protocol.Runtime.CallFunctionOnResponse>(
        "Runtime.callFunctionOn",
        {
          objectId,
          functionDeclaration: locatorScriptSources.readElementTextContent,
          returnByValue: true,
        },
      );
      return String(res.result.value ?? "");
    } finally {
      // Best-effort cleanup: a failed release must not reject a successful
      // call or replace the original error.
      await session
        .send<never>("Runtime.releaseObject", { objectId })
        .catch(() => {});
    }
  }

  /**
   * Return the element's innerHTML string.
   *
   * @returns The in-page `readElementInnerHTML` helper's result coerced to a
   *   string; null/undefined become "".
   */
  async innerHtml(): Promise<string> {
    const session = this.frame.session;
    const { objectId } = await this.resolveNode();
    try {
      const res = await session.send<Protocol.Runtime.CallFunctionOnResponse>(
        "Runtime.callFunctionOn",
        {
          objectId,
          functionDeclaration: locatorScriptSources.readElementInnerHTML,
          returnByValue: true,
        },
      );
      return String(res.result.value ?? "");
    } finally {
      // Best-effort cleanup: a failed release must not reject a successful
      // call or replace the original error.
      await session
        .send<never>("Runtime.releaseObject", { objectId })
        .catch(() => {});
    }
  }

  /**
   * Return the element's innerText (layout-aware, visible text).
   *
   * @returns The in-page `readElementInnerText` helper's result coerced to a
   *   string; null/undefined become "".
   */
  async innerText(): Promise<string> {
    const session = this.frame.session;
    const { objectId } = await this.resolveNode();
    try {
      const res = await session.send<Protocol.Runtime.CallFunctionOnResponse>(
        "Runtime.callFunctionOn",
        {
          objectId,
          functionDeclaration: locatorScriptSources.readElementInnerText,
          returnByValue: true,
        },
      );
      return String(res.result.value ?? "");
    } finally {
      // Best-effort cleanup: a failed release must not reject a successful
      // call or replace the original error.
      await session
        .send<never>("Runtime.releaseObject", { objectId })
        .catch(() => {});
    }
  }

  /**
   * Return a locator narrowed to the first match.
   * Shorthand for `nth(0)`.
   */
  first(): Locator {
    return this.nth(0);
  }

  /**
   * Return a locator narrowed to the match at a zero-based index.
   *
   * @param index - Desired position; fractional values are rounded down.
   * @returns This same instance when it is already narrowed to that index,
   *   otherwise a new Locator with the same frame, selector and options.
   * @throws StagehandInvalidArgumentError when `index` is negative or not finite.
   */
  nth(index: number): Locator {
    const numeric = Number(index);
    const isValid = Number.isFinite(numeric) && numeric >= 0;
    if (!isValid) {
      throw new StagehandInvalidArgumentError(
        "locator().nth() expects a non-negative index",
      );
    }

    const target = Math.floor(numeric);
    // Reuse this instance when the narrowing would not change anything.
    return target === this.nthIndex
      ? this
      : new Locator(this.frame, this.selector, this.options, target);
  }

  // ---------- helpers ----------

  /**
   * Resolve this locator's selector to a single `{ objectId, nodeId }` pair.
   *
   * Enables the Runtime and DOM domains, then asks the shared selector resolver
   * for the match at the locator's index (index 0 when nth() was never applied).
   * The caller is responsible for the returned handle.
   *
   * @throws StagehandElementNotFoundError when the resolver finds no match.
   */
  public async resolveNode(): Promise<{
    nodeId: Protocol.DOM.NodeId | null;
    objectId: Protocol.Runtime.RemoteObjectId;
  }> {
    const { session } = this.frame;

    await session.send("Runtime.enable");
    await session.send("DOM.enable");

    // The -1 sentinel ("no explicit nth()") targets the first match.
    const targetIndex = this.nthIndex >= 0 ? this.nthIndex : 0;
    const match = await this.selectorResolver.resolveAtIndex(
      this.selectorQuery,
      targetIndex,
    );
    if (match) {
      return match;
    }

    throw new StagehandElementNotFoundError([this.selector]);
  }

  /**
   * Resolve every node this locator refers to.
   *
   * Without nth() narrowing, all matches are returned. With narrowing, the
   * result is a one-element array holding the match at that index.
   *
   * @throws StagehandElementNotFoundError when nothing matches.
   */
  public async resolveNodesForMask(): Promise<
    Array<{
      nodeId: Protocol.DOM.NodeId | null;
      objectId: Protocol.Runtime.RemoteObjectId;
    }>
  > {
    const { session } = this.frame;

    await session.send("Runtime.enable");
    await session.send("DOM.enable");

    // Un-narrowed locator: collect every match.
    if (this.nthIndex < 0) {
      const matches = await this.selectorResolver.resolveAll(
        this.selectorQuery,
      );
      if (matches.length === 0) {
        throw new StagehandElementNotFoundError([this.selector]);
      }
      return matches;
    }

    // Narrowed locator: only the requested index.
    const single = await this.selectorResolver.resolveAtIndex(
      this.selectorQuery,
      this.nthIndex,
    );
    if (!single) {
      throw new StagehandElementNotFoundError([this.selector]);
    }
    return [single];
  }

  /**
   * Average the four corners of a BoxModel content quad into a center point.
   *
   * @param content - Flat quad `[x1,y1, x2,y2, x3,y3, x4,y4]`.
   * @returns `{ cx, cy }`, the mean of the x and y coordinates respectively.
   * @throws StagehandInvalidArgumentError when fewer than 8 numbers are given.
   */
  private centerFromBoxContent(content: number[]): { cx: number; cy: number } {
    if (!content || content.length < 8) {
      throw new StagehandInvalidArgumentError("Invalid box model content quad");
    }
    const [x1, y1, x2, y2, x3, y3, x4, y4] = content;
    return {
      cx: (x1 + x2 + x3 + x4) / 4,
      cy: (y1 + y2 + y3 + y4) / 4,
    };
  }
}


================================================
FILE: packages/core/lib/v3/understudy/locatorInvocation.ts
================================================
import {
  locatorScriptBootstrap,
  locatorScriptGlobalRefs,
  type LocatorScriptName,
} from "../dom/build/locatorScripts.generated.js";

/**
 * Build a self-invoking expression that runs the locator bundle bootstrap and
 * then calls one helper through its global reference.
 *
 * Intended for Runtime.evaluate payloads: the helper is referenced by name
 * rather than inlined, and the bootstrap makes sure it exists in whichever
 * execution context evaluates the expression.
 *
 * @param name - Helper to call; used as the key into `locatorScriptGlobalRefs`.
 * @param args - Argument expressions, already serialized as source text; they
 *   are joined with ", " and inserted verbatim.
 * @returns The expression source as a string.
 */
export function buildLocatorInvocation(
  name: LocatorScriptName,
  args: string[],
): string {
  const helperRef = locatorScriptGlobalRefs[name];
  const argList = args.join(", ");
  return `(() => { ${locatorScriptBootstrap}; return ${helperRef}(${argList}); })()`;
}


================================================
FILE: packages/core/lib/v3/understudy/navigationResponseTracker.ts
================================================
/**
 * NavigationResponseTracker
 * -------------------------
 *
 * Tracks DevTools Protocol network events for a single navigation command so
 * Stagehand can surface a Playwright-like response object from `Page.goto` and
 * related APIs. The tracker listens for `Network.responseReceived` events that
 * correspond to the targeted document navigation, handles loader-id churn that
 * arises from redirects or preloading, and enriches the resulting
 * `Response` with extra header information. It also observes
 * `Network.loadingFinished` / `Network.loadingFailed` to fulfil the
 * `response.finished()` contract exposed to consumers.
 */

import type { Protocol } from "devtools-protocol";
import type { CDPSessionLike } from "./cdp.js";
import type { Page } from "./page.js";
import { Response } from "./response.js";

/**
 * Observes CDP network events on one session and settles a promise with the
 * main-frame document response that belongs to a single navigation command.
 */
export class NavigationResponseTracker {
  private readonly page: Page;
  private readonly session: CDPSessionLike;
  private readonly navigationCommandId: number;

  private expectedLoaderId: string | undefined;
  private selectedRequestId: string | null = null;
  private selectedResponse: Response | null = null;
  private acceptNextWithoutLoader = false;

  private responseResolved = false;
  private resolveResponse!: (value: Response | null) => void;
  private responsePromise: Promise<Response | null>;

  /** Document responses seen before their loader id was announced. */
  private readonly pendingResponsesByLoader = new Map<
    string,
    Protocol.Network.ResponseReceivedEvent
  >();
  /** Extra-info events that arrived before their request was selected. */
  private readonly pendingExtraInfo = new Map<
    string,
    Protocol.Network.ResponseReceivedExtraInfoEvent
  >();

  /** Every handler registered on the session, kept for `dispose()`. */
  private readonly listeners: Array<{
    event: string;
    handler: (event: unknown) => void;
  }> = [];

  /**
   * Bind the tracker to one navigation command and start listening right
   * away; construct it before the navigation request is dispatched so no
   * early event is missed.
   */
  constructor(params: {
    page: Page;
    session: CDPSessionLike;
    navigationCommandId: number;
  }) {
    const { page, session, navigationCommandId } = params;
    this.page = page;
    this.session = session;
    this.navigationCommandId = navigationCommandId;

    this.responsePromise = new Promise<Response | null>((settle) => {
      // Wrap the resolver so that only the first outcome wins.
      this.resolveResponse = (value) => {
        if (!this.responseResolved) {
          this.responseResolved = true;
          settle(value);
        }
      };
    });

    this.installListeners();
  }

  /** Detach every CDP handler and drop all buffered events. */
  public dispose(): void {
    this.listeners.forEach(({ event, handler }) => {
      this.session.off(event, handler as never);
    });
    this.listeners.length = 0;
    this.pendingResponsesByLoader.clear();
    this.pendingExtraInfo.clear();
  }

  /**
   * Record the loader id reported by `Page.navigate`. If a document response
   * for that loader was buffered earlier it is selected immediately. Empty or
   * missing ids are ignored.
   */
  public setExpectedLoaderId(loaderId: string | undefined): void {
    if (!loaderId) return;
    this.expectedLoaderId = loaderId;

    const buffered = this.pendingResponsesByLoader.get(loaderId);
    if (!buffered) return;
    this.pendingResponsesByLoader.delete(loaderId);
    this.selectResponse(buffered);
  }

  /**
   * For navigations that provide no loader id up front (reload / history
   * traversal): accept the next qualifying document response regardless of
   * its loader id.
   */
  public expectNavigationWithoutKnownLoader(): void {
    this.acceptNextWithoutLoader = true;
  }

  /**
   * Resolve with the matched response. When nothing has been matched yet, a
   * microtask is queued that settles the promise with `null`.
   */
  public async navigationCompleted(): Promise<Response | null> {
    if (this.responseResolved) return this.responsePromise;
    queueMicrotask(() => {
      if (!this.responseResolved) this.resolveResponse(null);
    });
    return this.responsePromise;
  }

  /** Expose the raw response promise (mainly for tests). */
  public async response(): Promise<Response | null> {
    return this.responsePromise;
  }

  /** Wire up the four Network.* events this tracker cares about. */
  private installListeners(): void {
    const bindings: Array<[string, (event: unknown) => void]> = [
      [
        "Network.responseReceived",
        (event) => {
          this.onResponseReceived(
            event as Protocol.Network.ResponseReceivedEvent,
          );
        },
      ],
      [
        "Network.responseReceivedExtraInfo",
        (event) => {
          this.onResponseReceivedExtraInfo(
            event as Protocol.Network.ResponseReceivedExtraInfoEvent,
          );
        },
      ],
      [
        "Network.loadingFinished",
        (event) => {
          this.onLoadingFinished(
            event as Protocol.Network.LoadingFinishedEvent,
          );
        },
      ],
      [
        "Network.loadingFailed",
        (event) => {
          this.onLoadingFailed(event as Protocol.Network.LoadingFailedEvent);
        },
      ],
    ];
    for (const [name, handler] of bindings) {
      this.addListener(name, handler);
    }
  }

  /** Subscribe on the session and remember the pair for later removal. */
  private addListener(event: string, handler: (event: unknown) => void): void {
    this.session.on(event, handler as never);
    this.listeners.push({ event, handler });
  }

  /**
   * Filter `Network.responseReceived` down to main-frame document responses of
   * the current navigation command, then either select the response or buffer
   * it under its loader id until the expected loader id is known.
   */
  private onResponseReceived(
    event: Protocol.Network.ResponseReceivedEvent,
  ): void {
    if (!this.page.isCurrentNavigationCommand(this.navigationCommandId)) return;
    if (!event?.response) return;
    if (
      event.type !== "Document" ||
      event.frameId !== this.page.mainFrameId()
    ) {
      return;
    }

    // One-shot override: take whatever qualifying response comes first.
    if (this.acceptNextWithoutLoader) {
      this.acceptNextWithoutLoader = false;
      this.selectResponse(event);
      return;
    }

    // A response carrying a loader id is buffered unless that id is exactly
    // the expected one; responses without a loader id are selected directly.
    const loaderId = event.loaderId ?? "";
    const shouldBuffer =
      Boolean(loaderId) && loaderId !== this.expectedLoaderId;
    if (shouldBuffer) {
      this.pendingResponsesByLoader.set(loaderId, event);
      return;
    }

    this.selectResponse(event);
  }

  /**
   * Apply extra header info to the selected response, or park it by request
   * id until a response for that request is selected.
   */
  private onResponseReceivedExtraInfo(
    event: Protocol.Network.ResponseReceivedExtraInfoEvent,
  ): void {
    if (!event?.requestId) return;

    const matchesSelected =
      Boolean(this.selectedRequestId) &&
      event.requestId === this.selectedRequestId;
    if (!matchesSelected) {
      this.pendingExtraInfo.set(event.requestId, event);
      return;
    }
    this.selectedResponse?.applyExtraInfo(event);
  }

  /** Mark the selected response as finished without error. */
  private onLoadingFinished(
    event: Protocol.Network.LoadingFinishedEvent,
  ): void {
    if (!event?.requestId) return;
    if (event.requestId === this.selectedRequestId) {
      this.selectedResponse?.markFinished(null);
    }
  }

  /**
   * Mark the selected response as finished with an error built from the
   * event's error text (or a generic fallback message).
   */
  private onLoadingFailed(event: Protocol.Network.LoadingFailedEvent): void {
    if (!event?.requestId) return;
    // Failures of other requests must not affect the tracked document.
    if (event.requestId !== this.selectedRequestId) return;
    const failure = new Error(event.errorText || "Navigation request failed");
    this.selectedResponse?.markFinished(failure);
  }

  /**
   * Promote an event to "the" navigation response: build the `Response`
   * wrapper, attach any parked extra info and settle the response promise.
   * `data:` and `about:` documents settle the promise with `null` instead.
   */
  private selectResponse(event: Protocol.Network.ResponseReceivedEvent): void {
    if (event.loaderId) {
      this.pendingResponsesByLoader.delete(event.loaderId);
    }

    // First selection wins; later candidates are ignored.
    if (this.responseResolved || this.selectedResponse) return;

    const payload = event.response;
    const protocol = payload?.protocol?.toLowerCase() ?? "";
    const url = payload?.url ?? "";
    const hasNoNetworkResponse = ["data", "about"].some(
      (scheme) => protocol === scheme || url.startsWith(`${scheme}:`),
    );

    if (hasNoNetworkResponse) {
      this.pendingExtraInfo.delete(event.requestId);
      this.selectedRequestId = null;
      this.selectedResponse = null;
      this.resolveResponse(null);
      return;
    }

    const response = new Response({
      page: this.page,
      session: this.session,
      requestId: event.requestId,
      frameId: event.frameId,
      loaderId: event.loaderId,
      response: event.response,
      fromServiceWorker: Boolean(event.response?.fromServiceWorker),
    });

    this.selectedRequestId = event.requestId;
    this.selectedResponse = response;

    const parkedExtraInfo = this.pendingExtraInfo.get(event.requestId);
    if (parkedExtraInfo) {
      response.applyExtraInfo(parkedExtraInfo);
      this.pendingExtraInfo.delete(event.requestId);
    }

    this.resolveResponse(response);
  }
}


================================================
FILE: packages/core/lib/v3/understudy/networkManager.ts
================================================
import type { Protocol } from "devtools-protocol";
import type { CDPSessionLike } from "./cdp.js";
import {
  DEFAULT_IDLE_WAIT,
  IGNORED_RESOURCE_TYPES,
  NetworkObserver,
  NetworkRequestInfo,
  WaitForIdleHandle,
  WaitForIdleOptions,
} from "../types/private/network.js";

/**
 * Cross-session network tracker.
 *
 * Centralises network bookkeeping for a Page: every CDP session (top-level and OOPIF)
 * funnels `Network.*` events through here so higher-level waiters can reason about
 * in-flight requests across the entire frame tree. The manager exposes a simple
 * observer interface plus a "wait until idle" helper that resolves once no filtered
 * requests remain for a quiet window.
 */

/**
 * Aggregates network information for all CDP sessions owned by a Page.
 *
 * Each tracked session contributes `Network.*` / `Page.frameStoppedLoading`
 * events. The manager keeps a table of in-flight requests keyed by
 * `<sessionKey>:<requestId>`, remembers the latest document request per frame,
 * and fans request start / finish / failure notifications out to observers.
 */
export class NetworkManager {
  /** Tracked sessions by session key, each with a listener-removal callback. */
  private readonly sessions = new Map<
    string,
    {
      session: CDPSessionLike;
      detach: () => void;
    }
  >();

  private readonly observers = new Set<NetworkObserver>();

  /** In-flight requests by request key. */
  private readonly requests = new Map<string, NetworkRequestInfo>();

  /** frameId -> request key of the most recent document request in that frame. */
  private readonly documentRequestsByFrame = new Map<string, string>();

  /**
   * Begin tracking network traffic for a CDP session (top-level or OOPIF).
   * Safe to call multiple times; duplicate registrations are ignored.
   */
  public trackSession(session: CDPSessionLike): void {
    const sid = this.sessionKey(session);
    if (this.sessions.has(sid)) return;

    const onRequest = (evt: Protocol.Network.RequestWillBeSentEvent) => {
      if (!evt || !evt.requestId) return;

      const info: NetworkRequestInfo = {
        sessionId: sid,
        requestId: evt.requestId,
        requestKey: this.requestKey(sid, evt.requestId),
        frameId: evt.frameId ?? undefined,
        loaderId: evt.loaderId ?? undefined,
        url: evt.request?.url,
        timestamp: Date.now(),
        resourceType: evt.type,
        documentRequest: evt.type === "Document",
      };

      this.requests.set(info.requestKey, info);
      if (info.documentRequest && info.frameId) {
        this.documentRequestsByFrame.set(info.frameId, info.requestKey);
      }

      this.emitStart(info);
    };

    /**
     * Shared completion path for finished and failed requests: remove the
     * request from the in-flight table and notify observers through `emit`.
     * Requests never seen via `requestWillBeSent` still produce a
     * notification, built from a minimal synthetic record.
     */
    const settle = (
      reqId: string,
      emit: (info: NetworkRequestInfo) => void,
    ) => {
      const key = this.requestKey(sid, reqId);
      const stored = this.requests.get(key);
      // Only forget the frame's document request when it is THIS request.
      // Dropping the mapping for any request of the frame would let a
      // finished sub-resource erase the pointer to a still-pending document
      // request, so `Page.frameStoppedLoading` could no longer complete it.
      if (
        stored?.frameId &&
        this.documentRequestsByFrame.get(stored.frameId) === key
      ) {
        this.documentRequestsByFrame.delete(stored.frameId);
      }
      const info: NetworkRequestInfo = stored ?? {
        sessionId: sid,
        requestId: reqId,
        requestKey: key,
        timestamp: Date.now(),
        documentRequest: false,
      };
      this.requests.delete(key);
      emit(info);
    };

    const finish = (reqId: string) => {
      settle(reqId, (info) => this.emitFinish(info));
    };

    const fail = (reqId: string) => {
      settle(reqId, (info) => this.emitFailure(info));
    };

    const onFinished = (evt: { requestId: string }) => {
      if (!evt?.requestId) return;
      finish(evt.requestId);
    };

    const onFailed = (evt: Protocol.Network.LoadingFailedEvent) => {
      if (!evt?.requestId) return;
      fail(evt.requestId);
    };

    // A response whose URL starts with `data:` is treated as finished as soon
    // as the response arrives.
    const onResponse = (evt: Protocol.Network.ResponseReceivedEvent) => {
      if (!evt?.requestId) return;
      const url = evt.response?.url ?? "";
      if (url.startsWith("data:")) finish(evt.requestId);
    };

    // When a frame stops loading, complete its document request if that
    // request is still recorded as in flight.
    const onFrameStopped = (evt: Protocol.Page.FrameStoppedLoadingEvent) => {
      if (!evt?.frameId) return;
      const key = this.documentRequestsByFrame.get(evt.frameId);
      if (!key) return;
      const stored = this.requests.get(key);
      if (!stored) {
        this.documentRequestsByFrame.delete(evt.frameId);
        return;
      }
      this.requests.delete(key);
      this.documentRequestsByFrame.delete(evt.frameId);
      this.emitFinish({ ...stored, timestamp: Date.now() });
    };

    session.on("Network.requestWillBeSent", onRequest);
    session.on("Network.loadingFinished", onFinished);
    session.on("Network.loadingFailed", onFailed);
    session.on("Network.requestServedFromCache", onFinished);
    session.on("Network.responseReceived", onResponse);
    session.on("Page.frameStoppedLoading", onFrameStopped);

    // Best effort: enable the domains, ignoring rejections.
    void session.send("Network.enable").catch(() => {});
    void session.send("Page.enable").catch(() => {});

    this.sessions.set(sid, {
      session,
      detach: () => {
        session.off("Network.requestWillBeSent", onRequest);
        session.off("Network.loadingFinished", onFinished);
        session.off("Network.loadingFailed", onFailed);
        session.off("Network.requestServedFromCache", onFinished);
        session.off("Network.responseReceived", onResponse);
        session.off("Page.frameStoppedLoading", onFrameStopped);
      },
    });
  }

  /**
   * Stop tracking a session and discard any inflight bookkeeping owned by it.
   * An undefined id refers to the synthetic "__main__" session key. Observers
   * are not notified about the discarded requests.
   */
  public untrackSession(rawSessionId: string | undefined): void {
    const sid = rawSessionId ?? "__main__";
    const entry = this.sessions.get(sid);
    if (!entry) return;
    entry.detach();
    this.sessions.delete(sid);

    const ownedPrefix = `${sid}:`;

    for (const key of [...this.requests.keys()]) {
      if (key.startsWith(ownedPrefix)) this.requests.delete(key);
    }

    for (const [frameId, key] of [...this.documentRequestsByFrame.entries()]) {
      if (key.startsWith(ownedPrefix)) {
        this.documentRequestsByFrame.delete(frameId);
      }
    }
  }

  /**
   * Register a passive observer for request lifecycle notifications.
   * Returns a disposer that removes the observer.
   */
  public addObserver(observer: NetworkObserver): () => void {
    this.observers.add(observer);
    return () => {
      this.observers.delete(observer);
    };
  }

  /**
   * Resolve once no (filtered) requests are in flight for the given quiet window.
   * The waiter automatically unregisters itself on completion or timeout.
   *
   * Only requests that START after the waiter is created (and whose timestamp
   * is not older than `options.startTime`) are counted. The returned promise
   * rejects on timeout and when `dispose()` is called before it settles.
   */
  public waitForIdle(options: WaitForIdleOptions): WaitForIdleHandle {
    const startTime = options.startTime ?? Date.now();
    const idleTimeMs = options.idleTimeMs ?? DEFAULT_IDLE_WAIT;
    const timeoutMs = options.timeoutMs;
    const remainingBudgetMs = Number.isFinite(timeoutMs)
      ? timeoutMs
      : undefined;
    // Budget quoted in the timeout message: the caller's total budget when
    // given, otherwise this waiter's own timeout.
    const originalBudgetMs = Number.isFinite(options.totalBudgetMs ?? NaN)
      ? (options.totalBudgetMs as number)
      : remainingBudgetMs;

    const filter =
      options.filter ??
      ((info: NetworkRequestInfo) => {
        return !IGNORED_RESOURCE_TYPES.has(info.resourceType);
      });

    const tracked = new Set<string>();
    let idleTimer: ReturnType<typeof setTimeout> | null = null;
    let timeoutTimer: ReturnType<typeof setTimeout> | null = null;
    let settled = false;

    let resolveFn: (() => void) | null = null;
    let rejectFn: ((error: Error) => void) | null = null;

    // Single exit point: stops timers, unregisters the observer and settles
    // the promise exactly once.
    const cleanup = (error?: Error) => {
      if (settled) return;
      settled = true;
      if (idleTimer) clearTimeout(idleTimer);
      if (timeoutTimer) clearTimeout(timeoutTimer);
      removeObserver();
      tracked.clear();
      if (error) {
        rejectFn?.(error);
      } else {
        resolveFn?.();
      }
    };

    // Start the quiet-window timer when nothing is tracked; cancel it when
    // something is.
    const maybeIdle = () => {
      if (settled) return;
      if (tracked.size === 0) {
        if (!idleTimer) {
          idleTimer = setTimeout(() => {
            cleanup();
          }, idleTimeMs);
        }
      } else if (idleTimer) {
        clearTimeout(idleTimer);
        idleTimer = null;
      }
    };

    const observer: NetworkObserver = {
      onRequestStarted: (info) => {
        if (settled) return;
        if (info.timestamp < startTime) return;
        if (!filter(info)) return;
        tracked.add(info.requestKey);
        if (idleTimer) {
          clearTimeout(idleTimer);
          idleTimer = null;
        }
      },
      onRequestFinished: (info) => {
        if (settled) return;
        if (!tracked.delete(info.requestKey)) return;
        maybeIdle();
      },
      onRequestFailed: (info) => {
        if (settled) return;
        if (!tracked.delete(info.requestKey)) return;
        maybeIdle();
      },
    };

    const removeObserver = this.addObserver(observer);

    const promise = new Promise<void>((resolve, reject) => {
      resolveFn = resolve;
      rejectFn = reject;
    });

    // Trigger initial idle check so that we still respect the quiet window
    maybeIdle();

    if (Number.isFinite(timeoutMs)) {
      timeoutTimer = setTimeout(
        () => {
          const elapsed = Date.now() - startTime;
          const message =
            originalBudgetMs !== undefined
              ? `networkidle timed out after ${originalBudgetMs}ms`
              : `networkidle timed out after ${elapsed}ms`;
          cleanup(new Error(message));
        },
        Math.max(0, timeoutMs),
      );
    }

    return {
      promise,
      dispose: () => cleanup(new Error("waitForIdle disposed")),
    };
  }

  /**
   * Tear down all session listeners and clear observers/bookkeeping.
   */
  public dispose(): void {
    for (const { detach } of this.sessions.values()) {
      detach();
    }
    this.sessions.clear();
    this.observers.clear();
    this.requests.clear();
    this.documentRequestsByFrame.clear();
  }

  /** Fan-out helper when a tracked request starts. */
  private emitStart(info: NetworkRequestInfo): void {
    for (const obs of this.observers) {
      obs.onRequestStarted(info);
    }
  }

  /** Fan-out helper when a tracked request completes successfully. */
  private emitFinish(info: NetworkRequestInfo): void {
    for (const obs of this.observers) {
      obs.onRequestFinished(info);
    }
  }

  /** Fan-out helper when a tracked request fails mid-flight. */
  private emitFailure(info: NetworkRequestInfo): void {
    for (const obs of this.observers) {
      obs.onRequestFailed(info);
    }
  }

  /** Compute a stable key for a session (falls back to synthetic root id). */
  private sessionKey(session: CDPSessionLike): string {
    return session.id ?? "__main__";
  }

  /** Compose the unique key for tracking a request under a session. */
  private requestKey(sessionId: string, requestId: string): string {
    return `${sessionId}:${requestId}`;
  }
}


================================================
FILE: packages/core/lib/v3/understudy/page.ts
================================================
import { Protocol } from "devtools-protocol";
import { promises as fs } from "fs";
import { v3Logger } from "../logger.js";
import { FlowLogger } from "../flowlogger/FlowLogger.js";
import type { CDPSessionLike } from "./cdp.js";
import { CdpConnection } from "./cdp.js";
import { Frame } from "./frame.js";
import { FrameLocator } from "./frameLocator.js";
import { deepLocatorFromPage, resolveLocatorTarget } from "./deepLocator.js";
import {
  captureHybridSnapshot,
  resolveXpathForLocation,
} from "./a11y/snapshot/index.js";
import { FrameRegistry } from "./frameRegistry.js";
import { executionContexts } from "./executionContextRegistry.js";
import {
  LoadState,
  SnapshotResult,
  PageSnapshotOptions,
} from "../types/public/page.js";
import { NetworkManager } from "./networkManager.js";
import { LifecycleWatcher } from "./lifecycleWatcher.js";
import { NavigationResponseTracker } from "./navigationResponseTracker.js";
import { Response, isSerializableResponse } from "./response.js";
import { ConsoleMessage, ConsoleListener } from "./consoleMessage.js";
import type { StagehandAPIClient } from "../api.js";
import {
  LocalBrowserLaunchOptions,
  StagehandSetExtraHTTPHeadersError,
  StagehandSnapshotError,
} from "../types/public/index.js";
import type { Locator } from "./locator.js";
import {
  StagehandInvalidArgumentError,
  StagehandEvalError,
} from "../types/public/sdkErrors.js";
import { normalizeInitScriptSource } from "./initScripts.js";
import { buildLocatorInvocation } from "./locatorInvocation.js";
import type {
  ScreenshotAnimationsOption,
  ScreenshotCaretOption,
  ScreenshotOptions,
  ScreenshotScaleOption,
} from "../types/public/screenshotTypes.js";
import {
  applyMaskOverlays,
  applyStyleToFrames,
  collectFramesForScreenshot,
  computeScreenshotScale,
  disableAnimations,
  hideCaret,
  normalizeScreenshotClip,
  runScreenshotCleanups,
  setTransparentBackground,
  type ScreenshotCleanup,
} from "./screenshotUtils.js";
import { InitScriptSource } from "../types/private/index.js";
import { withTimeout } from "../timeoutConfig.js";

/**
 * Page
 *
 * One instance per **top-level target**. It owns:
 *  - the top-level CDP session (for the page target)
 *  - all adopted OOPIF child sessions (Target.attachToTarget with flatten: true)
 *  - a **FrameRegistry** that is the single source of truth for BOTH:
 *      • frame topology (parent/children, root swaps, last-seen CDP Frame)
 *      • frame → session ownership (which session owns which frameId)
 *
 * Page exposes convenient APIs (goto/reload/url/screenshot/locator),
 * and simple bridges that Context uses to feed Page/Target events in.
 */

// Lookup from each public `LoadState` literal to a lifecycle-name string.
// NOTE(review): the values look like CDP `Page.lifecycleEvent` names — confirm
// against the code that consumes this table (not visible in this chunk).
const LIFECYCLE_NAME: Record<LoadState, string> = {
  load: "load",
  domcontentloaded: "DOMContentLoaded",
  networkidle: "networkIdle",
};

export class Page {
  /** Every CDP child session this page owns (top-level + adopted OOPIF sessions). */
  private readonly sessions = new Map<string, CDPSessionLike>(); // sessionId -> session

  /** Unified truth for frame topology + ownership. */
  private readonly registry: FrameRegistry;

  /** A convenience wrapper bound to the current main frame id (top-level session). */
  private mainFrameWrapper: Frame;

  /** Compact ordinal per frameId (used by snapshot encoding). */
  private frameOrdinals = new Map<string, number>();
  private nextOrdinal = 0;

  /** cache Frames per frameId so everyone uses the same one */
  private readonly frameCache = new Map<string, Frame>();
  private readonly browserIsRemote: boolean;

  /** Stable id for Frames created by this Page (use top-level TargetId). */
  private readonly pageId: string;
  /** Cached current URL for synchronous page.url() */
  private _currentUrl: string = "about:blank";

  private navigationCommandSeq = 0;
  private latestNavigationCommandId = 0;

  private readonly networkManager: NetworkManager;
  /** Optional API client for routing page operations to the API */
  private readonly apiClient: StagehandAPIClient | null = null;
  private readonly consoleListeners = new Set<ConsoleListener>();
  private readonly consoleHandlers = new Map<
    string,
    (evt: Protocol.Runtime.ConsoleAPICalledEvent) => void
  >();
  /** Document-start scripts installed across every session this page owns. */
  private readonly initScripts: string[] = [];
  private extraHTTPHeaders: Record<string, string>;

  /**
   * Private: instances are built through the static `create` factory.
   * Registers the top-level session, seeds the frame registry with the main
   * frame id, builds the main-frame wrapper and starts network tracking on
   * the top-level session.
   */
  private constructor(
    private readonly conn: CdpConnection,
    private readonly mainSession: CDPSessionLike,
    private readonly _targetId: string,
    mainFrameId: string,
    apiClient?: StagehandAPIClient | null,
    browserIsRemote = false,
  ) {
    this.pageId = _targetId;
    this.apiClient = apiClient ?? null;
    this.browserIsRemote = browserIsRemote;

    // The top-level session is only registered when it carries an id.
    const topLevelSessionId = mainSession.id;
    if (topLevelSessionId) {
      this.sessions.set(topLevelSessionId, mainSession);
    }

    // Registry starts out knowing just the root/main frame.
    this.registry = new FrameRegistry(_targetId, mainFrameId);

    // The main-frame wrapper always talks through the top-level session.
    const rootFrame = new Frame(
      this.mainSession,
      mainFrameId,
      this.pageId,
      this.browserIsRemote,
    );
    this.mainFrameWrapper = rootFrame;

    const network = new NetworkManager();
    this.networkManager = network;
    network.trackSession(this.mainSession);
  }

  // Install one script on one CDP session via
  // `Page.addScriptToEvaluateOnNewDocument`; rejects if the command fails.
  private async installInitScriptOnSession(
    session: CDPSessionLike,
    source: string,
  ): Promise<void> {
    const params = { source };
    await session.send("Page.addScriptToEvaluateOnNewDocument", params);
  }

  // Install every registered init script on the given session, one at a time
  // and in registration order.
  private async applyInitScriptsToSession(
    session: CDPSessionLike,
  ): Promise<void> {
    for (let index = 0; index < this.initScripts.length; index += 1) {
      await this.installInitScriptOnSession(session, this.initScripts[index]);
    }
  }

  // Record a new init script and install it on the main session plus every
  // other session this page owns. Already-registered sources are a no-op.
  public async registerInitScript(source: string): Promise<void> {
    const alreadyRegistered = this.initScripts.includes(source);
    if (alreadyRegistered) return;
    this.initScripts.push(source);

    // Main session first; it is skipped below should it also be in the map.
    const pending: Array<Promise<void>> = [
      this.installInitScriptOnSession(this.mainSession, source),
    ];
    this.sessions.forEach((session) => {
      if (session !== this.mainSession) {
        pending.push(this.installInitScriptOnSession(session, source));
      }
    });
    await Promise.all(pending);
  }

  // Remember an init script without sending anything to the current sessions.
  // Duplicate sources are ignored.
  public seedInitScript(source: string): void {
    if (!this.initScripts.includes(source)) {
      this.initScripts.push(source);
    }
  }

  // --- Optional visual cursor overlay management ---
  private cursorEnabled = false;
  /**
   * Install the cursor-overlay script on the main session: once as a
   * document-start script for future documents and once evaluated in the
   * current document. Rejections from either command are ignored.
   *
   * The injected script exposes `window.__v3Cursor` (`move`/`show`/`hide`) and
   * creates a fixed-position SVG arrow element. `move()` calls made before
   * the element exists are remembered and replayed once it is installed.
   */
  private async ensureCursorScript(): Promise<void> {
    const overlaySource = `(() => {
      const ID = '__v3_cursor_overlay__';
      const state = { el: null, last: null };
      // Expose API early so move() calls before install are buffered
      try {
        if (!window.__v3Cursor || !window.__v3Cursor.__installed) {
          const api = {
            __installed: false,
            move(x, y) {
              if (state.el) {
                state.el.style.left = Math.max(0, x) + 'px';
                state.el.style.top = Math.max(0, y) + 'px';
              } else {
                state.last = [x, y];
              }
            },
            show() { if (state.el) state.el.style.display = 'block'; },
            hide() { if (state.el) state.el.style.display = 'none'; },
          };
          window.__v3Cursor = api;
        }
      } catch {}

      function install() {
        try {
          if (state.el) return; // already installed
          let el = document.getElementById(ID);
          if (!el) {
            const root = document.documentElement || document.body || document.head;
            if (!root) { setTimeout(install, 50); return; }
            el = document.createElement('div');
            el.id = ID;
            el.style.position = 'fixed';
            el.style.left = '0px';
            el.style.top = '0px';
            el.style.width = '16px';
            el.style.height = '24px';
            el.style.zIndex = '2147483647';
            el.style.pointerEvents = 'none';
            el.style.userSelect = 'none';
            el.style.mixBlendMode = 'normal';
            el.style.contain = 'layout style paint';
            el.style.willChange = 'transform,left,top';
            el.innerHTML = '<svg xmlns="http://www.w3.org/2000/svg" width="16" height="24" viewBox="0 0 16 24"><path d="M1 0 L1 22 L6 14 L15 14 Z" fill="black" stroke="white" stroke-width="0.7"/></svg>';
            root.appendChild(el);
          }
          state.el = el;
          try { window.__v3Cursor.__installed = true; } catch {}
          if (state.last) {
            window.__v3Cursor.move(state.last[0], state.last[1]);
            state.last = null;
          }
        } catch {}
      }

      if (document.readyState === 'complete' || document.readyState === 'interactive') {
        install();
      } else {
        document.addEventListener('DOMContentLoaded', install, { once: true });
        setTimeout(install, 100);
      }
    })();`;

    const ignoreFailure = (): void => {};

    // Future documents: run the script at document start.
    await this.mainSession
      .send("Page.addScriptToEvaluateOnNewDocument", { source: overlaySource })
      .catch(ignoreFailure);

    // Current document: evaluate right away.
    await this.mainSession
      .send("Runtime.evaluate", {
        expression: overlaySource,
        includeCommandLineAPI: false,
      })
      .catch(ignoreFailure);
  }

  /**
   * Turn on the visual cursor overlay. The overlay script is installed on the
   * first call; later calls return immediately once the flag is set.
   */
  public async enableCursorOverlay(): Promise<void> {
    if (!this.cursorEnabled) {
      await this.ensureCursorScript();
      this.cursorEnabled = true;
    }
  }

  /**
   * Move the overlay cursor to the given coordinates (rounded to integers) by
   * evaluating a `window.__v3Cursor.move(...)` call on the main session.
   * Does nothing while the overlay is disabled; evaluation errors are ignored.
   */
  private async updateCursor(x: number, y: number): Promise<void> {
    if (!this.cursorEnabled) return;
    try {
      const moveExpression = `typeof window.__v3Cursor!=="undefined"&&window.__v3Cursor.move(${Math.round(x)}, ${Math.round(y)})`;
      await this.mainSession.send("Runtime.evaluate", {
        expression: moveExpression,
      });
    } catch {
      // Cursor updates are cosmetic; failures are deliberately swallowed.
    }
  }

  /**
   * Public entry point for adding an init script. The input (plus optional
   * argument) is first normalized to a source string by
   * `normalizeInitScriptSource`, then registered via `registerInitScript`.
   */
  public async addInitScript<Arg>(
    script: InitScriptSource<Arg>,
    arg?: Arg,
  ): Promise<void> {
    const callerLabel = "page.addInitScript";
    const normalizedSource = await normalizeInitScriptSource(
      script,
      arg,
      callerLabel,
    );
    await this.registerInitScript(normalizedSource);
  }

  /**
   * Factory: build a Page for a top-level target and seed its registry from
   * the frame tree returned by `Page.getFrameTree`.
   *
   * Also seeds the cached URL from the root frame and, when launch options
   * carry a viewport, applies it (device scale factor defaults to 1).
   * Failures in that seeding step are ignored.
   */
  static async create(
    conn: CdpConnection,
    session: CDPSessionLike,
    targetId: string,
    apiClient?: StagehandAPIClient | null,
    localBrowserLaunchOptions?: LocalBrowserLaunchOptions | null,
    browserIsRemote = false,
  ): Promise<Page> {
    // Context already enabled Page + lifecycle events before resuming the
    // target. These repeats are fire-and-forget: page registration must not
    // wait on their acknowledgements, which some remote CDP backends deliver
    // long after the target is otherwise ready.
    const ignoreFailure = (): void => {};
    void session.send("Page.enable").catch(ignoreFailure);
    void session
      .send("Page.setLifecycleEventsEnabled", { enabled: true })
      .catch(ignoreFailure);

    const treeReply = await session.send<{
      frameTree: Protocol.Page.FrameTree;
    }>("Page.getFrameTree");
    const frameTree = treeReply.frameTree;

    const page = new Page(
      conn,
      session,
      targetId,
      frameTree.frame.id,
      apiClient,
      browserIsRemote,
    );

    // Seed the cached URL and the optional viewport.
    try {
      page._currentUrl = String(frameTree?.frame?.url ?? page._currentUrl);
      const viewport = localBrowserLaunchOptions?.viewport;
      if (viewport) {
        const deviceScaleFactor =
          localBrowserLaunchOptions?.deviceScaleFactor ?? 1;
        await page.setViewportSize(viewport.width, viewport.height, {
          deviceScaleFactor,
        });
      }
    } catch {
      // ignore
    }

    // Topology + ownership for the frames known at creation time.
    const ownerSessionId = session.id ?? "root";
    page.registry.seedFromFrameTree(ownerSessionId, frameTree);

    return page;
  }

  // ---------------- Event-driven updates from Context ----------------

  /**
   * Handle a `frameAttached` event from a parent or child session: make sure
   * the frame has an ordinal, record topology and ownership (the emitting
   * session, or "root" when it has no id) in the registry, and drop any
   * cached `Frame` for that id.
   */
  public onFrameAttached(
    frameId: string,
    parentId: string | null,
    session: CDPSessionLike,
  ): void {
    this.ensureOrdinal(frameId);

    const ownerSessionId = session.id ?? "root";
    this.registry.onFrameAttached(frameId, parentId, ownerSessionId);

    // The cache is keyed by frameId; evict so the next lookup is rebuilt
    // against the latest owner.
    this.frameCache.delete(frameId);
  }

  /**
   * Handle a `frameDetached` event: forward the frame id and reason
   * (defaults to "remove") to the registry and evict the cached `Frame`.
   */
  public onFrameDetached(
    frameId: string,
    reason: "remove" | "swap" | string = "remove",
  ): void {
    const { registry, frameCache } = this;
    registry.onFrameDetached(frameId, reason);
    frameCache.delete(frameId);
  }

  /**
   * Parent/child session emitted a `frameNavigated`.
   * Topology + ownership update. Handles root swaps.
   */
  public onFrameNavigated(
    frame: Protocol.Page.Frame,
    session: CDPSessionLike,
  ): void {
    // Sample the root id on both sides of the registry update to detect a root swap.
    const rootBefore = this.mainFrameId();
    this.registry.onFrameNavigated(frame, session.id ?? "root");
    const rootAfter = this.mainFrameId();

    if (rootAfter !== rootBefore) {
      // The new root inherits the previous root's ordinal (0 when none was recorded),
      // and the main-frame wrapper is rebuilt around the new root id.
      const inheritedOrdinal = this.frameOrdinals.get(rootBefore) ?? 0;
      this.frameOrdinals.set(rootAfter, inheritedOrdinal);
      this.mainFrameWrapper = new Frame(
        this.mainSession,
        rootAfter,
        this.pageId,
        this.browserIsRemote,
      );
    }

    // Only navigations of the current main frame refresh the cached URL.
    const isMainFrameNavigation = frame.id === this.mainFrameId();
    if (isMainFrameNavigation) {
      try {
        // Use the reported URL when present; otherwise keep the previous value.
        const reportedUrl = (frame as { url?: string })?.url;
        this._currentUrl = String(reportedUrl ?? this._currentUrl);
      } catch {
        // ignore
      }
    }

    // The owning session may have changed, so drop the cached Frame for this id.
    this.frameCache.delete(frame.id);
  }

  /**
   * Handle a same-document navigation reported for `frameId`.
   * Blank URLs are ignored; otherwise the registry is updated and, when the
   * frame is the current main frame, the cached page URL is replaced.
   */
  public onNavigatedWithinDocument(
    frameId: string,
    url: string,
    session: CDPSessionLike,
  ): void {
    const trimmedUrl = String(url ?? "").trim();
    if (trimmedUrl.length === 0) {
      return;
    }

    const ownerSessionId = session.id ?? "root";
    this.registry.onNavigatedWithinDocument(
      frameId,
      trimmedUrl,
      ownerSessionId,
    );

    const isMainFrame = frameId === this.mainFrameId();
    if (isMainFrame) this._currentUrl = trimmedUrl;
  }

  /**
   * An OOPIF child session whose **main** frame id equals the parent iframe’s frameId
   * has been attached; adopt the session into this Page and seed ownership for its subtree.
   */
  public adoptOopifSession(
    childSession: CDPSessionLike,
    childMainFrameId: string,
  ): void {
    // Index the session by id (when it has one) so ownership lookups can resolve it.
    const adoptedId = childSession.id;
    if (adoptedId) this.sessions.set(adoptedId, childSession);

    this.networkManager.trackSession(childSession);

    // Replay page-level configuration onto the new session; failures are ignored.
    const pendingHeaders = this.extraHTTPHeaders;
    if (pendingHeaders) {
      void this.applyExtraHTTPHeadersToSession(
        childSession,
        pendingHeaders,
      ).catch(() => {});
    }
    void this.applyInitScriptsToSession(childSession).catch(() => {});

    const hasConsoleListeners = this.consoleListeners.size > 0;
    if (hasConsoleListeners) {
      this.installConsoleTap(childSession);
    }

    // Stamp ownership of the child's main frame now; the session's own page
    // events will follow.
    this.registry.adoptChildSession(
      childSession.id ?? "child",
      childMainFrameId,
    );
    this.frameCache.delete(childMainFrameId);

    // Forward the child session's frame events into this page's handlers so
    // the registry stays in sync.
    childSession.on<Protocol.Page.FrameNavigatedEvent>(
      "Page.frameNavigated",
      (event) => {
        this.onFrameNavigated(event.frame, childSession);
      },
    );
    childSession.on<Protocol.Page.FrameAttachedEvent>(
      "Page.frameAttached",
      (event) => {
        const parentFrameId = event.parentFrameId ?? null;
        this.onFrameAttached(event.frameId, parentFrameId, childSession);
      },
    );
    childSession.on<Protocol.Page.FrameDetachedEvent>(
      "Page.frameDetached",
      (event) => {
        this.onFrameDetached(event.frameId, event.reason ?? "remove");
      },
    );

    // Fire-and-forget: seed ownership of the child's subtree from a one-time
    // frame tree snapshot.
    const seedChildSubtree = async (): Promise<void> => {
      try {
        await childSession.send("Page.enable").catch(() => {});
        const snapshot =
          await childSession.send<Protocol.Page.GetFrameTreeResponse>(
            "Page.getFrameTree",
          );
        const reportedTree = snapshot.frameTree;

        // Normalize: force the reported root id to the main frame id we already know.
        const seedTree =
          reportedTree.frame.id === childMainFrameId
            ? reportedTree
            : {
                ...reportedTree,
                frame: { ...reportedTree.frame, id: childMainFrameId },
              };

        this.registry.seedFromFrameTree(childSession.id ?? "child", seedTree);
      } catch {
        // If the snapshot races, live events will still converge the registry.
      }
    };
    void seedChildSubtree();
  }

  /** Detach an adopted child session and prune its subtree */
  public detachOopifSession(sessionId: string): void {
    // Detach every frame the registry attributes to this session and evict
    // the matching cached Frame wrappers.
    for (const ownedFrameId of this.registry.framesForSession(sessionId)) {
      this.registry.onFrameDetached(ownedFrameId, "remove");
      this.frameCache.delete(ownedFrameId);
    }

    // The console tap is removed while the session is still in `sessions`,
    // because teardown resolves the session by key.
    this.teardownConsoleTap(sessionId);

    this.sessions.delete(sessionId);
    this.networkManager.untrackSession(sessionId);
  }

  // ---------------- Ownership helpers / lookups ----------------

  /** Return the owning CDP session for a frameId (falls back to main session) */
  public getSessionForFrame(frameId: string): CDPSessionLike {
    const ownerId = this.registry.getOwnerSessionId(frameId);
    // No recorded owner, or an owner id with no tracked session → main session.
    const ownerSession = ownerId ? this.sessions.get(ownerId) : undefined;
    return ownerSession ?? this.mainSession;
  }

  /** Always returns a Frame bound to the owning session */
  public frameForId(frameId: string): Frame {
    const cached = this.frameCache.get(frameId);
    if (cached) {
      return cached;
    }

    // Cache miss: build a Frame on the owning session and remember it.
    const created = new Frame(
      this.getSessionForFrame(frameId),
      frameId,
      this.pageId,
      this.browserIsRemote,
    );
    this.frameCache.set(frameId, created);
    return created;
  }

  /** Expose a session by id (used by snapshot to resolve session id -> session) */
  public getSessionById(id: string): CDPSessionLike | undefined {
    // Plain map lookup; undefined when no session is stored under this id.
    const { sessions } = this;
    return sessions.get(id);
  }

  /** Hand a session to the network manager for tracking. */
  public registerSessionForNetwork(session: CDPSessionLike): void {
    const { networkManager } = this;
    networkManager.trackSession(session);
  }

  /** Ask the network manager to stop tracking the session with this id. */
  public unregisterSessionForNetwork(sessionId: string | undefined): void {
    const { networkManager } = this;
    networkManager.untrackSession(sessionId);
  }

  /**
   * Register a console listener. Only the "console" event is supported.
   * Console taps are installed when the listener set goes from empty to non-empty.
   *
   * @throws {StagehandInvalidArgumentError} when `event` is not "console".
   * @returns this page, for chaining.
   */
  public on(event: "console", listener: ConsoleListener): Page {
    if (event !== "console") {
      throw new StagehandInvalidArgumentError(`Unsupported event: ${event}`);
    }

    // Must be sampled before adding: re-adding an existing listener does not count.
    const wasEmpty = this.consoleListeners.size === 0;
    this.consoleListeners.add(listener);
    if (wasEmpty) this.ensureConsoleTaps();

    return this;
  }

  /**
   * Register a console listener that unregisters itself before handling its
   * first message. Only the "console" event is supported.
   *
   * @throws {StagehandInvalidArgumentError} when `event` is not "console".
   * @returns this page, for chaining.
   */
  public once(event: "console", listener: ConsoleListener): Page {
    if (event !== "console") {
      throw new StagehandInvalidArgumentError(`Unsupported event: ${event}`);
    }

    // Unsubscribe first so the listener is removed even if it throws.
    const oneShot: ConsoleListener = (message) => {
      this.off("console", oneShot);
      listener(message);
    };
    return this.on("console", oneShot);
  }

  /**
   * Remove a console listener. Only the "console" event is supported.
   * When no listeners remain, every installed console tap is removed.
   *
   * @throws {StagehandInvalidArgumentError} when `event` is not "console".
   * @returns this page, for chaining.
   */
  public off(event: "console", listener: ConsoleListener): Page {
    if (event !== "console") {
      throw new StagehandInvalidArgumentError(`Unsupported event: ${event}`);
    }

    this.consoleListeners.delete(listener);

    const nobodyListening = this.consoleListeners.size === 0;
    if (nobodyListening) this.removeAllConsoleTaps();

    return this;
  }

  // ---------------- MAIN APIs ----------------

  /** Return the target id stored on this page. */
  public targetId(): string {
    const { _targetId: id } = this;
    return id;
  }

  /**
   * Send a CDP command through the main session.
   * Allows external consumers to execute arbitrary Chrome DevTools Protocol commands.
   *
   * @param method - The CDP method name (e.g., "Page.enable", "Runtime.evaluate")
   * @param params - Optional parameters for the CDP command
   * @returns Promise resolving to the typed CDP response
   *
   * @example
   * // Enable the Runtime domain
   * await page.sendCDP("Runtime.enable");
   *
   * @example
   * // Evaluate JavaScript with typed response
   * const result = await page.sendCDP<Protocol.Runtime.EvaluateResponse>(
   *   "Runtime.evaluate",
   *   { expression: "1 + 1" }
   * );
   */
  public sendCDP<T = unknown>(method: string, params?: object): Promise<T> {
    // Always routed through the page's main session.
    const { mainSession } = this;
    return mainSession.send<T>(method, params);
  }

  /** Seed the cached URL before navigation events converge. */
  public seedCurrentUrl(url: string | undefined | null): void {
    if (!url) {
      return;
    }

    try {
      // Whitespace-only seeds are dropped; anything else replaces the cached URL.
      const trimmed = String(url).trim();
      if (trimmed) {
        this._currentUrl = trimmed;
      }
    } catch {
      // ignore invalid url seeds
    }
  }

  /** Return the main frame id as currently reported by the frame registry. */
  public mainFrameId(): string {
    const { registry } = this;
    return registry.mainFrameId();
  }

  /** Return the Frame wrapper currently held for the main frame. */
  public mainFrame(): Frame {
    const { mainFrameWrapper: wrapper } = this;
    return wrapper;
  }

  /**
   * Close this top-level page (tab). Best-effort via Target.closeTarget.
   */
  @FlowLogger.wrapWithLogging({ eventType: "PageClose" })
  public async close(): Promise<void> {
    // Ask the browser to close the target; a failure here is tolerated because
    // the poll below decides when to stop waiting.
    try {
      await this.conn.send("Target.closeTarget", { targetId: this._targetId });
    } catch {
      // ignore
    }

    // Poll the target list for up to 2s (every 25ms) until this target is gone.
    const deadline = Date.now() + 2000;
    while (Date.now() < deadline) {
      try {
        const targets = await this.conn.getTargets();
        const stillPresent = targets.some((t) => t.targetId === this._targetId);
        if (!stillPresent) break;
      } catch {
        // ignore and retry
      }
      await new Promise<void>((resolve) => setTimeout(resolve, 25));
    }

    // Release page-level resources on every exit path. Previously the
    // "target disappeared" path returned early after disposing only the network
    // manager, leaving console taps and listeners registered.
    this.networkManager.dispose();
    this.removeAllConsoleTaps();
    this.consoleListeners.clear();
  }

  /** Return the protocol-shaped frame tree rooted at the current main frame. */
  public getFullFrameTree(): Protocol.Page.FrameTree {
    const rootId = this.mainFrameId();
    return this.asProtocolFrameTree(rootId);
  }

  /** Delegate to the registry to build a protocol frame tree from the given root id. */
  public asProtocolFrameTree(rootMainFrameId: string): Protocol.Page.FrameTree {
    const { registry } = this;
    return registry.asProtocolFrameTree(rootMainFrameId);
  }

  /**
   * Enable the Network domain on `session`, then set its extra HTTP headers.
   * Rejects if either CDP command rejects.
   */
  private async applyExtraHTTPHeadersToSession(
    session: CDPSessionLike,
    headers: Record<string, string>,
  ): Promise<void> {
    await session.send("Network.enable");
    await session.send("Network.setExtraHTTPHeaders", { headers });
  }

  /**
   * Return the ordinal recorded for `frameId`, assigning the next unused
   * ordinal first when the frame has none yet.
   */
  private ensureOrdinal(frameId: string): number {
    let ordinal = this.frameOrdinals.get(frameId);
    if (ordinal === undefined) {
      ordinal = this.nextOrdinal++;
      this.frameOrdinals.set(frameId, ordinal);
    }
    return ordinal;
  }

  /** Public getter for snapshot code / handlers. */
  public getOrdinal(frameId: string): number {
    // Note: this allocates an ordinal when the frame does not have one yet.
    const ordinal = this.ensureOrdinal(frameId);
    return ordinal;
  }

  /** Return the frame ids listed by the frame registry. */
  public listAllFrameIds(): string[] {
    const { registry } = this;
    return registry.listAllFrames();
  }

  /**
   * Install a console tap on the main session and on every tracked session.
   * Does nothing while there are no console listeners.
   */
  private ensureConsoleTaps(): void {
    const hasListeners = this.consoleListeners.size > 0;
    if (!hasListeners) return;

    // Main session first, then the tracked sessions in map order.
    const tapTargets = [this.mainSession, ...this.sessions.values()];
    tapTargets.forEach((target) => {
      this.installConsoleTap(target);
    });
  }

  /**
   * Subscribe to `Runtime.consoleAPICalled` on `session` and record the handler
   * under the session's key. A session that already has a handler is skipped.
   */
  private installConsoleTap(session: CDPSessionLike): void {
    const tapKey = this.sessionKey(session);
    const alreadyTapped = this.consoleHandlers.has(tapKey);
    if (alreadyTapped) {
      return;
    }

    // Fire-and-forget: a failure to enable Runtime is ignored.
    void session.send("Runtime.enable").catch(() => {});

    const onConsoleCall = (
      event: Protocol.Runtime.ConsoleAPICalledEvent,
    ): void => {
      this.emitConsole(event);
    };
    session.on<Protocol.Runtime.ConsoleAPICalledEvent>(
      "Runtime.consoleAPICalled",
      onConsoleCall,
    );

    // Keep the handler reference so it can be unsubscribed later.
    this.consoleHandlers.set(tapKey, onConsoleCall);
  }

  /** Key used for console handler bookkeeping: the session id, or "__root__" when it has none. */
  private sessionKey(session: CDPSessionLike): string {
    const { id } = session;
    return id ?? "__root__";
  }

  /**
   * Map a console-handler key back to its session. The main session answers to
   * its own id when that id is truthy, otherwise to "__root__"; any other key
   * is looked up in the tracked sessions.
   */
  private resolveSessionByKey(key: string): CDPSessionLike | undefined {
    const main = this.mainSession;
    const mainKey = main.id ? main.id : "__root__";
    if (key === mainKey) {
      return main;
    }

    return this.sessions.get(key);
  }

  /**
   * Unsubscribe and forget the console handler stored under `key`.
   * No-op when no handler is recorded for that key.
   */
  private teardownConsoleTap(key: string): void {
    const tap = this.consoleHandlers.get(key);
    if (tap) {
      // The session may no longer be resolvable; the bookkeeping entry is removed either way.
      const owner = this.resolveSessionByKey(key);
      if (owner) {
        owner.off("Runtime.consoleAPICalled", tap);
      }
      this.consoleHandlers.delete(key);
    }
  }

  /** Tear down every recorded console tap. */
  private removeAllConsoleTaps(): void {
    // Copy the keys first: teardown deletes from the map being walked.
    const tapKeys = Array.from(this.consoleHandlers.keys());
    tapKeys.forEach((tapKey) => {
      this.teardownConsoleTap(tapKey);
    });
  }

  /**
   * Wrap a console event in a ConsoleMessage and deliver it to every listener.
   * A listener that throws is logged and does not stop the remaining listeners.
   */
  private emitConsole(evt: Protocol.Runtime.ConsoleAPICalledEvent): void {
    if (this.consoleListeners.size === 0) {
      return;
    }

    const message = new ConsoleMessage(evt, this);

    // Deliver to a copy so listeners may add or remove listeners while running.
    const recipients = Array.from(this.consoleListeners);
    recipients.forEach((notify) => {
      try {
        notify(message);
      } catch (error) {
        v3Logger({
          category: "page",
          message: "Console listener threw",
          level: 2,
          auxiliary: {
            error: { value: String(error), type: "string" },
            type: { value: evt.type, type: "string" },
          },
        });
      }
    });
  }

  // -------- Convenience APIs delegated to the current main frame --------

  /**
   * Navigate the page; optionally wait for a lifecycle state.
   * Waits on the **current** main frame and follows root swaps during navigation.
   */
  @FlowLogger.wrapWithLogging({ eventType: "PageGoto" })
  async goto(
    url: string,
    options?: { waitUntil?: LoadState; timeoutMs?: number },
  ): Promise<Response | null> {
    const waitUntil: LoadState = options?.waitUntil ?? "domcontentloaded";
    const timeoutMs = options?.timeoutMs ?? 15000;

    // Tag this navigation; the tracker and the watcher both receive the id.
    const navigationCommandId = this.beginNavigationCommand();

    const responseTracker = new NavigationResponseTracker({
      page: this,
      session: this.mainSession,
      navigationCommandId,
    });
    const lifecycleWatcher = new LifecycleWatcher({
      page: this,
      mainSession: this.mainSession,
      networkManager: this.networkManager,
      waitUntil,
      timeoutMs,
      navigationCommandId,
    });

    try {
      // When an API client is configured, navigation is delegated to it and
      // the local watcher/tracker are not awaited.
      if (this.apiClient) {
        const apiResult = await this.apiClient.goto(
          url,
          { waitUntil: options?.waitUntil },
          this.mainFrameId(),
        );
        this._currentUrl = url;

        if (isSerializableResponse(apiResult)) {
          return Response.fromSerializable(apiResult, {
            page: this,
            session: this.mainSession,
          });
        }
        return apiResult;
      }

      // Direct CDP navigation on the main session.
      const navigateResult =
        await this.mainSession.send<Protocol.Page.NavigateResponse>(
          "Page.navigate",
          { url },
        );
      this._currentUrl = url;

      // When the browser reports a loader id, give it to both observers.
      const loaderId = navigateResult?.loaderId;
      if (loaderId) {
        lifecycleWatcher.setExpectedLoaderId(loaderId);
        responseTracker.setExpectedLoaderId(loaderId);
      }

      await lifecycleWatcher.wait();
      return await responseTracker.navigationCompleted();
    } finally {
      // Both observers are disposed on every exit path.
      lifecycleWatcher.dispose();
      responseTracker.dispose();
    }
  }

  /**
   * Reload the page; optionally wait for a lifecycle state.
   */
  @FlowLogger.wrapWithLogging({ eventType: "PageReload" })
  async reload(options?: {
    waitUntil?: LoadState;
    timeoutMs?: number;
    ignoreCache?: boolean;
  }): Promise<Response | null> {
    const waitUntil = options?.waitUntil;
    const timeoutMs = options?.timeoutMs ?? 15000;
    const navigationCommandId = this.beginNavigationCommand();

    // Page.reload yields no loader id here, so the tracker is told up front.
    const responseTracker = new NavigationResponseTracker({
      page: this,
      session: this.mainSession,
      navigationCommandId,
    });
    responseTracker.expectNavigationWithoutKnownLoader();

    // A lifecycle watcher is created only when the caller asked for a state.
    let lifecycleWatcher: LifecycleWatcher | null = null;
    if (waitUntil) {
      lifecycleWatcher = new LifecycleWatcher({
        page: this,
        mainSession: this.mainSession,
        networkManager: this.networkManager,
        waitUntil,
        timeoutMs,
        navigationCommandId,
      });
    }

    try {
      const ignoreCache = options?.ignoreCache ?? false;
      await this.mainSession.send("Page.reload", { ignoreCache });

      if (lifecycleWatcher) {
        await lifecycleWatcher.wait();
      }
      return await responseTracker.navigationCompleted();
    } finally {
      lifecycleWatcher?.dispose();
      responseTracker.dispose();
    }
  }

  /**
   * Navigate back in history if possible; optionally wait for a lifecycle state.
   */
  @FlowLogger.wrapWithLogging({ eventType: "PageGoBack" })
  async goBack(options?: {
    waitUntil?: LoadState;
    timeoutMs?: number;
  }): Promise<Response | null> {
    const history =
      await this.mainSession.send<Protocol.Page.GetNavigationHistoryResponse>(
        "Page.getNavigationHistory",
      );
    const previousEntry = history.entries[history.currentIndex - 1];
    if (!previousEntry) {
      // Already at the oldest entry: nothing to do.
      return null;
    }

    const waitUntil = options?.waitUntil;
    const timeoutMs = options?.timeoutMs ?? 15000;
    const navigationCommandId = this.beginNavigationCommand();

    const responseTracker = new NavigationResponseTracker({
      page: this,
      session: this.mainSession,
      navigationCommandId,
    });
    responseTracker.expectNavigationWithoutKnownLoader();

    // A lifecycle watcher is created only when the caller asked for a state.
    let lifecycleWatcher: LifecycleWatcher | null = null;
    if (waitUntil) {
      lifecycleWatcher = new LifecycleWatcher({
        page: this,
        mainSession: this.mainSession,
        networkManager: this.networkManager,
        waitUntil,
        timeoutMs,
        navigationCommandId,
      });
    }

    try {
      await this.mainSession.send("Page.navigateToHistoryEntry", {
        entryId: previousEntry.id,
      });
      // Update the cached URL from the history entry, keeping the old value if it has none.
      this._currentUrl = previousEntry.url ?? this._currentUrl;

      if (lifecycleWatcher) {
        await lifecycleWatcher.wait();
      }
      return await responseTracker.navigationCompleted();
    } finally {
      lifecycleWatcher?.dispose();
      responseTracker.dispose();
    }
  }

  /**
   * Navigate forward in history if possible; optionally wait for a lifecycle state.
   */
  @FlowLogger.wrapWithLogging({
    eventType: "PageGoForward",
  })
  async goForward(options?: {
    waitUntil?: LoadState;
    timeoutMs?: number;
  }): Promise<Response | null> {
    const history =
      await this.mainSession.send<Protocol.Page.GetNavigationHistoryResponse>(
        "Page.getNavigationHistory",
      );
    const nextEntry = history.entries[history.currentIndex + 1];
    if (!nextEntry) {
      // Already at the newest entry: nothing to do.
      return null;
    }

    const waitUntil = options?.waitUntil;
    const timeoutMs = options?.timeoutMs ?? 15000;
    const navigationCommandId = this.beginNavigationCommand();

    const responseTracker = new NavigationResponseTracker({
      page: this,
      session: this.mainSession,
      navigationCommandId,
    });
    responseTracker.expectNavigationWithoutKnownLoader();

    // A lifecycle watcher is created only when the caller asked for a state.
    let lifecycleWatcher: LifecycleWatcher | null = null;
    if (waitUntil) {
      lifecycleWatcher = new LifecycleWatcher({
        page: this,
        mainSession: this.mainSession,
        networkManager: this.networkManager,
        waitUntil,
        timeoutMs,
        navigationCommandId,
      });
    }

    try {
      await this.mainSession.send("Page.navigateToHistoryEntry", {
        entryId: nextEntry.id,
      });
      // Update the cached URL from the history entry, keeping the old value if it has none.
      this._currentUrl = nextEntry.url ?? this._currentUrl;

      if (lifecycleWatcher) {
        await lifecycleWatcher.wait();
      }
      return await responseTracker.navigationCompleted();
    } finally {
      lifecycleWatcher?.dispose();
      responseTracker.dispose();
    }
  }

  /**
   * Return the current page URL (synchronous, cached from navigation events).
   */
  url(): string {
    // Reads the cached value only; no CDP round trip.
    const { _currentUrl: cachedUrl } = this;
    return cachedUrl;
  }

  /**
   * Allocate the next navigation command id and record it as the latest one.
   *
   * @returns the newly allocated id.
   */
  private beginNavigationCommand(): number {
    this.navigationCommandSeq += 1;
    const commandId = this.navigationCommandSeq;
    this.latestNavigationCommandId = commandId;
    return commandId;
  }

  /** True when `id` is the most recently begun navigation command. */
  public isCurrentNavigationCommand(id: number): boolean {
    const latest = this.latestNavigationCommandId;
    return id === latest;
  }

  /**
   * Return the current page title.
   * Prefers reading from the active document via Runtime.evaluate to reflect dynamic changes.
   * Falls back to navigation history title if evaluation is unavailable.
   */
  async title(): Promise<string> {
    // First choice: read document.title from the live document.
    try {
      await this.mainSession.send("Runtime.enable").catch(() => {});
      const contextId = await this.mainWorldExecutionContextId();
      const evaluation =
        await this.mainSession.send<Protocol.Runtime.EvaluateResponse>(
          "Runtime.evaluate",
          {
            expression: "document.title",
            contextId,
            returnByValue: true,
          },
        );
      return String(evaluation.result?.value ?? "");
    } catch {
      // Evaluation failed; fall through to the navigation history lookup.
    }

    // Second choice: the title stored on the current navigation history entry.
    try {
      const history =
        await this.mainSession.send<Protocol.Page.GetNavigationHistoryResponse>(
          "Page.getNavigationHistory",
        );
      return history.entries[history.currentIndex]?.title ?? "";
    } catch {
      return "";
    }
  }

  /**
   * Capture a screenshot with Playwright-style options.
   *
   * @param options Optional screenshot configuration.
   * @param options.animations Control CSS/Web animations during capture. Use
   * "disabled" to fast-forward finite animations and pause infinite ones.
   * @param options.caret Either hide the text caret (default) or leave it
   * visible via "initial".
   * @param options.clip Restrict capture to a specific rectangle (in CSS
   * pixels). Cannot be combined with `fullPage`.
   * @param options.fullPage Capture the full scrollable page instead of the
   * current viewport.
   * @param options.mask Array of locators that should be covered with an
   * overlay while the screenshot is taken.
   * @param options.maskColor CSS color used for the mask overlay (default
   * `#FF00FF`).
   * @param options.omitBackground Make the default page background transparent
   * (PNG only).
   * @param options.path File path to write the screenshot to. The file extension
   * determines the image type when `type` is not explicitly provided.
   * @param options.quality JPEG quality (0–100). Only applies when
   * `type === "jpeg"`.
   * @param options.scale Render scale: use "css" for one pixel per CSS pixel,
   * otherwise the default "device" leverages the current device pixel ratio.
   * @param options.style Additional CSS text injected into every frame before
   * capture (removed afterwards).
   * @param options.timeout Maximum capture duration in milliseconds before a
   * timeout error is thrown.
   * @param options.type Image format (`"png"` by default).
   */
  @FlowLogger.wrapWithLogging({
    eventType: "PageScreenshot",
  })
  async screenshot(options?: ScreenshotOptions): Promise<Buffer> {
    const opts = options ?? {};
    const imageType = opts.type ?? "png";

    // ---- Argument validation (order matters for which error is reported) ----
    const isSupportedType = imageType === "png" || imageType === "jpeg";
    if (!isSupportedType) {
      throw new StagehandInvalidArgumentError(
        `screenshot: unsupported image type "${imageType}"`,
      );
    }
    if (opts.fullPage && opts.clip) {
      throw new StagehandInvalidArgumentError(
        "screenshot: clip and fullPage cannot be used together",
      );
    }
    if (imageType === "png" && typeof opts.quality === "number") {
      throw new StagehandInvalidArgumentError(
        'screenshot: quality option is only valid for type="jpeg"',
      );
    }

    // ---- Resolve defaults and capture inputs ----
    const caretMode: ScreenshotCaretOption = opts.caret ?? "hide";
    const animationsMode: ScreenshotAnimationsOption =
      opts.animations ?? "allow";
    const scaleMode: ScreenshotScaleOption = opts.scale ?? "device";
    const targetFrames = collectFramesForScreenshot(this);
    const clipRect = opts.clip ? normalizeScreenshotClip(opts.clip) : undefined;
    const captureScale = await computeScreenshotScale(this, scaleMode);
    const maskLocators = (opts.mask ?? []).filter(
      (candidate): candidate is Locator => Boolean(candidate),
    );

    // Each preparation step contributes a cleanup that runs after the capture.
    const pendingCleanups: ScreenshotCleanup[] = [];

    const capture = async (): Promise<Buffer> => {
      try {
        if (opts.omitBackground) {
          const restoreBackground = await setTransparentBackground(
            this.mainSession,
          );
          pendingCleanups.push(restoreBackground);
        }

        if (animationsMode === "disabled") {
          const restoreAnimations = await disableAnimations(targetFrames);
          pendingCleanups.push(restoreAnimations);
        }

        if (caretMode === "hide") {
          const restoreCaret = await hideCaret(targetFrames);
          pendingCleanups.push(restoreCaret);
        }

        if (opts.style && opts.style.trim()) {
          const removeStyle = await applyStyleToFrames(
            targetFrames,
            opts.style,
            "custom",
          );
          pendingCleanups.push(removeStyle);
        }

        if (maskLocators.length > 0) {
          const removeMasks = await applyMaskOverlays(
            maskLocators,
            opts.maskColor ?? "#FF00FF",
          );
          pendingCleanups.push(removeMasks);
        }

        const image = await this.mainFrameWrapper.screenshot({
          fullPage: opts.fullPage,
          clip: clipRect,
          type: imageType,
          quality: imageType === "jpeg" ? opts.quality : undefined,
          scale: captureScale,
        });

        // Persist to disk only when a path was supplied.
        if (opts.path) {
          await fs.writeFile(opts.path, image);
        }

        return image;
      } finally {
        // Cleanups run whether the capture succeeded or threw.
        await runScreenshotCleanups(pendingCleanups);
      }
    };

    return await withTimeout(capture(), opts.timeout, "screenshot");
  }

  /**
   * specifies additional HTTP headers to be included in every request sent by
   * the root CDP session of the page, and all of its child CDP sessions.
   *
   * @param headers - the headers to be set.
   * @throws {StagehandSetExtraHTTPHeadersError}
   * Thrown when one or more CDP sessions fail to enable the Network domain or fail
   * to apply the headers (i.e. `Network.enable` and/or `Network.setExtraHTTPHeaders` rejects).
   * @return void
   */
  async setExtraHTTPHeaders(headers: Record<string, string>): Promise<void> {
    // Store a shallow copy so later edits to the caller's object are not picked up.
    const headerSnapshot = { ...headers };
    this.extraHTTPHeaders = headerSnapshot;

    // Main session first, then every other tracked session (main is not repeated).
    const targets: CDPSessionLike[] = [this.mainSession];
    this.sessions.forEach((candidate) => {
      if (candidate !== this.mainSession) targets.push(candidate);
    });

    // Apply to all sessions in parallel; one failure does not cancel the rest.
    const outcomes = await Promise.allSettled(
      targets.map((target) =>
        this.applyExtraHTTPHeadersToSession(target, headerSnapshot),
      ),
    );

    // Build one description per rejected session; outcomes align with targets by index.
    const failures: string[] = [];
    outcomes.forEach((outcome, index) => {
      if (outcome.status !== "rejected") return;
      const reason = outcome.reason;
      const sessId = targets[index].id ?? "root";
      const message = reason?.message ?? String(reason);
      failures.push(`session=${sessId} error=${message}`);
    });

    if (failures.length > 0) {
      throw new StagehandSetExtraHTTPHeadersError(failures);
    }
  }

  /**
   * Create a locator bound to the current main frame.
   */
  locator(selector: string): ReturnType<Frame["locator"]> {
    // Delegates to the Frame wrapper currently held for the main frame.
    const { mainFrameWrapper: rootFrame } = this;
    return rootFrame.locator(selector);
  }

  /**
   * Deep locator that supports cross-iframe traversal.
   * - Recognizes '>>' hop notation to enter iframe contexts.
   * - Supports deep XPath that includes iframe steps (e.g., '/html/body/iframe[2]//div').
   * Returns a Locator scoped to the appropriate frame.
   */
  deepLocator(selector: string) {
    // Resolution starts from the current main frame wrapper.
    const rootFrame = this.mainFrameWrapper;
    return deepLocatorFromPage(this, rootFrame, selector);
  }

  /**
   * Frame locator similar to Playwright: targets iframe elements and scopes
   * subsequent locators to that frame. Supports chaining.
   */
  frameLocator(selector: string): FrameLocator {
    // A new FrameLocator is built on every call.
    const scoped = new FrameLocator(this, selector);
    return scoped;
  }

  /**
   * List all frames belonging to this page as Frame objects bound to their owning sessions.
   * The list is ordered by a stable ordinal assigned during the page lifetime.
   */
  frames(): Frame[] {
    // Pair each id with its ordinal, sort ascending by ordinal, then resolve Frames.
    return this.listAllFrameIds()
      .map((frameId) => ({ frameId, ordinal: this.getOrdinal(frameId) }))
      .sort((left, right) => left.ordinal - right.ordinal)
      .map((entry) => this.frameForId(entry.frameId));
  }

  /**
   * Wait until the page reaches a lifecycle state on the current main frame.
   * Mirrors Playwright's API signatures.
   */
  @FlowLogger.wrapWithLogging({
    eventType: "PageWaitForLoadState",
  })
  async waitForLoadState(state: LoadState, timeoutMs?: number): Promise<void> {
    // Falls back to 15 seconds when no timeout is given.
    const effectiveTimeoutMs = timeoutMs ?? 15000;
    await this.waitForMainLoadState(state, effectiveTimeoutMs);
  }

  /**
   * Wait for a specified amount of time.
   *
   * @param ms The number of milliseconds to wait.
   */
  async waitForTimeout(ms: number): Promise<void> {
    // Resolves once the timer fires; never rejects.
    await new Promise<void>((done) => {
      setTimeout(done, ms);
    });
  }

  /**
   * Wait for an element matching the selector to appear in the DOM.
   * Uses MutationObserver for efficiency
   * Pierces shadow DOM by default.
   * Supports iframe hop notation with '>>' (e.g., 'iframe#checkout >> .submit-btn').
   *
   * @param selector CSS selector to wait for (supports '>>' for iframe hops)
   * @param options
   * @param options.state Element state to wait for: 'attached' | 'detached' | 'visible' | 'hidden' (default: 'visible')
   * @param options.timeout Maximum time to wait in milliseconds (default: 30000)
   * @param options.pierceShadow Whether to search inside shadow DOM (default: true)
   * @returns True when the condition is met
   * @throws Error if timeout is reached before the condition is met
   */
  @FlowLogger.wrapWithLogging({
    eventType: "PageWaitForSelector",
  })
  async waitForSelector(
    selector: string,
    options?: {
      state?: "attached" | "detached" | "visible" | "hidden";
      timeout?: number;
      pierceShadow?: boolean;
    },
  ): Promise<boolean> {
    const timeoutBudgetMs = options?.timeout ?? 30000;
    const desiredState = options?.state ?? "visible";
    const pierceShadow = options?.pierceShadow ?? true;

    // Resolving the target frame counts against the caller's timeout budget.
    const resolveStartedAt = Date.now();
    const resolved = await resolveLocatorTarget(
      this,
      this.mainFrameWrapper,
      selector,
    );
    const spentMs = Date.now() - resolveStartedAt;
    const remainingMs = Math.max(0, timeoutBudgetMs - spentMs);

    // Arguments are passed as source text to the expression builder.
    const invocationArgs = [
      JSON.stringify(resolved.selector),
      JSON.stringify(desiredState),
      String(remainingMs),
      String(pierceShadow),
    ];
    const expression = buildLocatorInvocation("waitForSelector", invocationArgs);
    return resolved.frame.evaluate(expression);
  }

  /**
   * Evaluate a function or expression in the current main frame's main world.
   * - If a string is provided, it is treated as a JS expression.
   * - If a function is provided, it is stringified and invoked with the optional argument.
   * - The return value should be JSON-serializable. Non-serializable objects will
   *   best-effort serialize via JSON.stringify inside the page context.
   */
  @FlowLogger.wrapWithLogging({ eventType: "PageEvaluate" })
  async evaluate<R = unknown, Arg = unknown>(
    pageFunctionOrExpression: string | ((arg: Arg) => R | Promise<R>),
    arg?: Arg,
  ): Promise<R> {
    // Enabling Runtime is best-effort; the context lookup follows regardless.
    await this.mainSession.send("Runtime.enable").catch(() => {});
    const contextId = await this.mainWorldExecutionContextId();

    let expression: string;
    if (typeof pageFunctionOrExpression === "string") {
      // Strings are evaluated verbatim as a JS expression.
      expression = pageFunctionOrExpression;
    } else {
      // Functions are shipped as source text and called with the JSON-encoded
      // argument; the result is round-tripped through JSON inside the page.
      const functionSource = pageFunctionOrExpression.toString();
      const serializedArg = JSON.stringify(arg);
      expression = `(() => {
          const __fn = ${functionSource};
          const __arg = ${serializedArg};
          try {
            const __res = __fn(__arg);
            return Promise.resolve(__res).then(v => {
              try { return JSON.parse(JSON.stringify(v)); } catch { return v; }
            });
          } catch (e) { throw e; }
        })()`;
    }

    const evaluation =
      await this.mainSession.send<Protocol.Runtime.EvaluateResponse>(
        "Runtime.evaluate",
        {
          expression,
          contextId,
          returnByValue: true,
          awaitPromise: true,
        },
      );

    const failure = evaluation.exceptionDetails;
    if (failure) {
      // Prefer the protocol's text, then the exception description, then a generic message.
      const reason =
        failure.text || failure.exception?.description || "Evaluation failed";
      throw new StagehandEvalError(reason);
    }

    return evaluation.result?.value as R;
  }

  /**
   * Force the page viewport to an exact CSS size and device scale factor.
   * Ensures screenshots match width x height pixels when deviceScaleFactor = 1.
   */
  // @FlowLogger.wrapWithLogging({ eventType: "PageSetViewportSize" })  // disabled because it's pretty noisy, can always re-enable if needed for debugging
  async setViewportSize(
    width: number,
    height: number,
    options?: { deviceScaleFactor?: number },
  ): Promise<void> {
    // Default the scale factor to 1 and clamp it to at least 0.01.
    const requestedScale = options?.deviceScaleFactor ?? 1;
    const deviceScaleFactor = Math.max(0.01, requestedScale);

    const metrics = {
      width,
      height,
      deviceScaleFactor,
      mobile: false,
      screenWidth: width,
      screenHeight: height,
      positionX: 0,
      positionY: 0,
      scale: 1,
    } as Protocol.Emulation.SetDeviceMetricsOverrideRequest;

    // Both commands are best-effort: a rejection is swallowed.
    await this.mainSession
      .send("Emulation.setDeviceMetricsOverride", metrics)
      .catch(() => {});

    // Best-effort ensure visible size in headless
    const visibleSize = { width, height };
    await this.mainSession
      .send("Emulation.setVisibleSize", visibleSize)
      .catch(() => {});
  }

  /**
   * Click at viewport-relative coordinates (CSS pixels) through the CDP Input
   * domain on the top-level page target's session. The page is not scrolled.
   *
   * Event sequence: a single `mouseMoved`, then for each click number from 1
   * to `clickCount` a `mousePressed`/`mouseReleased` pair carrying that
   * running click count.
   *
   * @param x - Horizontal offset from the viewport's left edge.
   * @param y - Vertical offset from the viewport's top edge.
   * @param options.button - Mouse button to press; defaults to `"left"`.
   * @param options.clickCount - Number of press/release pairs; defaults to 1.
   * @param options.returnXpath - When truthy, try to resolve the XPath of the
   *   node at (x, y) before clicking.
   * @returns The resolved absolute XPath, or `""` when it was not requested
   *   or could not be resolved.
   */
  @FlowLogger.wrapWithLogging({ eventType: "PageClick" })
  async click(
    x: number,
    y: number,
    options?: {
      button?: "left" | "right" | "middle";
      clickCount?: number;
      returnXpath?: boolean;
    },
  ): Promise<string> {
    const button = options?.button ?? "left";
    const clickCount = options?.clickCount ?? 1;

    let resolvedXpath: string | undefined;
    if (options?.returnXpath) {
      // XPath resolution is best-effort: any failure leaves the result empty
      // and the click still goes ahead.
      try {
        const target = await resolveXpathForLocation(this, x, y);
        if (target) {
          v3Logger({
            category: "page",
            message: "click resolved hit",
            level: 2,
            auxiliary: {
              frameId: { value: String(target.frameId), type: "string" },
              backendNodeId: {
                value: String(target.backendNodeId),
                type: "string",
              },
              x: { value: String(x), type: "integer" },
              y: { value: String(y), type: "integer" },
            },
          });
          resolvedXpath = target.absoluteXPath;
          v3Logger({
            category: "page",
            message: "click resolved xpath",
            level: 2,
            auxiliary: {
              xpath: { value: String(resolvedXpath ?? ""), type: "string" },
            },
          });
        }
      } catch {
        // ignored on purpose (see above)
      }
    }

    await this.updateCursor(x, y);

    // Build the full event list first, then fire every command back-to-back
    // without awaiting in between, so consecutive clicks are not spaced out
    // by round-trip latency.
    const events: Protocol.Input.DispatchMouseEventRequest[] = [
      {
        type: "mouseMoved",
        x,
        y,
        button: "none",
      } as Protocol.Input.DispatchMouseEventRequest,
    ];
    for (let nth = 1; nth <= clickCount; nth++) {
      for (const type of ["mousePressed", "mouseReleased"] as const) {
        events.push({
          type,
          x,
          y,
          button,
          clickCount: nth,
        } as Protocol.Input.DispatchMouseEventRequest);
      }
    }

    const pending: Array<Promise<unknown>> = events.map((event) =>
      this.mainSession.send<never>("Input.dispatchMouseEvent", event),
    );
    await Promise.all(pending);

    return resolvedXpath ?? "";
  }

  /**
   * Hover at viewport-relative coordinates (CSS pixels) by dispatching a
   * single `mouseMoved` event through the CDP Input domain on the top-level
   * page target's session.
   *
   * @param x - Horizontal coordinate in CSS pixels.
   * @param y - Vertical coordinate in CSS pixels.
   * @param options.returnXpath - When truthy, try to resolve the XPath of the
   *   node at (x, y) before moving the mouse; a failure is logged and ignored.
   * @returns The resolved absolute XPath, or `""` when it was not requested
   *   or could not be resolved.
   */
  @FlowLogger.wrapWithLogging({ eventType: "PageHover" })
  async hover(
    x: number,
    y: number,
    options?: { returnXpath?: boolean },
  ): Promise<string> {
    let resolvedXpath: string | undefined;

    if (options?.returnXpath) {
      // Coordinates attached to both the success and the failure log entry.
      const point = {
        x: { value: String(x), type: "integer" as const },
        y: { value: String(y), type: "integer" as const },
      };
      try {
        const target = await resolveXpathForLocation(this, x, y);
        if (target) {
          v3Logger({
            category: "page",
            message: "hover resolved hit",
            level: 2,
            auxiliary: {
              frameId: { value: String(target.frameId), type: "string" },
              backendNodeId: {
                value: String(target.backendNodeId),
                type: "string",
              },
              ...point,
            },
          });
          resolvedXpath = target.absoluteXPath;
        }
      } catch {
        v3Logger({
          category: "page",
          message: "Failed to resolve xpath for hover",
          level: 2,
          auxiliary: { ...point },
        });
      }
    }

    await this.updateCursor(x, y);

    const move = {
      type: "mouseMoved",
      x,
      y,
      button: "none",
    } as Protocol.Input.DispatchMouseEventRequest;
    await this.mainSession.send<never>("Input.dispatchMouseEvent", move);

    return resolvedXpath ?? "";
  }

  /**
   * Scroll with the mouse wheel at viewport-relative coordinates (CSS pixels).
   * Dispatches `mouseMoved` to position the pointer, then a `mouseWheel`
   * event carrying the requested deltas, both through the CDP Input domain on
   * the main session.
   *
   * @param x - Horizontal pointer coordinate in CSS pixels.
   * @param y - Vertical pointer coordinate in CSS pixels.
   * @param deltaX - Horizontal wheel delta passed to the `mouseWheel` event.
   * @param deltaY - Vertical wheel delta passed to the `mouseWheel` event.
   * @param options.returnXpath - When truthy, try to resolve the XPath of the
   *   node at (x, y) before scrolling (best-effort).
   * @returns The resolved absolute XPath, or `""` when it was not requested
   *   or could not be resolved.
   */
  @FlowLogger.wrapWithLogging({ eventType: "PageScroll" })
  async scroll(
    x: number,
    y: number,
    deltaX: number,
    deltaY: number,
    options?: { returnXpath?: boolean },
  ): Promise<string> {
    let resolvedXpath: string | undefined;
    if (options?.returnXpath) {
      try {
        const target = await resolveXpathForLocation(this, x, y);
        if (target) {
          resolvedXpath = target.absoluteXPath;
        }
      } catch {
        // Resolution failures never block the scroll itself.
      }
    }

    await this.updateCursor(x, y);

    // Put the pointer over the target first so the wheel event lands there.
    const pointerMove = {
      type: "mouseMoved",
      x,
      y,
      button: "none",
    } as Protocol.Input.DispatchMouseEventRequest;
    await this.mainSession.send<never>("Input.dispatchMouseEvent", pointerMove);

    // The actual scroll: a wheel event with the caller's deltas.
    const wheel = {
      type: "mouseWheel",
      x,
      y,
      button: "none",
      deltaX,
      deltaY,
    } as Protocol.Input.DispatchMouseEventRequest;
    await this.mainSession.send<never>("Input.dispatchMouseEvent", wheel);

    return resolvedXpath ?? "";
  }

  /**
   * Drag from (fromX, fromY) to (toX, toY) with synthetic mouse events:
   * `mouseMoved` to the start, `mousePressed`, `steps` interpolated
   * `mouseMoved` events (the last one lands on the end point), then
   * `mouseReleased` at the end point.
   *
   * @param fromX - Start X coordinate.
   * @param fromY - Start Y coordinate.
   * @param toX - End X coordinate.
   * @param toY - End Y coordinate.
   * @param options.button - Button held during the drag; defaults to `"left"`.
   * @param options.steps - Number of intermediate moves; floored, minimum 1.
   * @param options.delay - Milliseconds to wait after each intermediate move;
   *   negative values are treated as 0.
   * @param options.returnXpath - When truthy, try to resolve the XPaths under
   *   the start and end points before dragging (best-effort, independently).
   * @returns `[fromXpath, toXpath]`, each `""` when not requested or not
   *   resolvable.
   */
  @FlowLogger.wrapWithLogging({
    eventType: "PageDragAndDrop",
  })
  async dragAndDrop(
    fromX: number,
    fromY: number,
    toX: number,
    toY: number,
    options?: {
      button?: "left" | "right" | "middle";
      steps?: number;
      delay?: number;
      returnXpath?: boolean;
    },
  ): Promise<[string, string]> {
    const button = options?.button ?? "left";
    const steps = Math.max(1, Math.floor(options?.steps ?? 1));
    const delay = Math.max(0, options?.delay ?? 0);

    // Value sent in the CDP `buttons` field: left = 1, right = 2, middle = 4;
    // anything else falls back to 1.
    const buttons = button === "right" ? 2 : button === "middle" ? 4 : 1;

    // Sends one mouse event on the main session.
    const dispatch = (
      event: Partial<Protocol.Input.DispatchMouseEventRequest>,
    ) =>
      this.mainSession.send<never>(
        "Input.dispatchMouseEvent",
        event as Protocol.Input.DispatchMouseEventRequest,
      );

    // Resolves the XPath under a point, swallowing any failure.
    const xpathAt = async (
      px: number,
      py: number,
    ): Promise<string | undefined> => {
      try {
        const located = await resolveXpathForLocation(this, px, py);
        return located ? located.absoluteXPath : undefined;
      } catch {
        return undefined;
      }
    };

    let fromXpath: string | undefined;
    let toXpath: string | undefined;
    if (options?.returnXpath) {
      fromXpath = await xpathAt(fromX, fromY);
      toXpath = await xpathAt(toX, toY);
    }

    // Position the pointer on the drag source.
    await this.updateCursor(fromX, fromY);
    await dispatch({ type: "mouseMoved", x: fromX, y: fromY, button: "none" });

    // Button down at the source.
    await dispatch({
      type: "mousePressed",
      x: fromX,
      y: fromY,
      button,
      buttons,
      clickCount: 1,
    });

    // Linear interpolation towards the destination with the button held.
    for (let step = 1; step <= steps; step++) {
      const progress = step / steps;
      const x = fromX + (toX - fromX) * progress;
      const y = fromY + (toY - fromY) * progress;
      await this.updateCursor(x, y);
      await dispatch({ type: "mouseMoved", x, y, button, buttons });
      if (delay) {
        await new Promise<void>((wake) => setTimeout(wake, delay));
      }
    }

    // Button up at the destination.
    await this.updateCursor(toX, toY);
    await dispatch({
      type: "mouseReleased",
      x: toX,
      y: toY,
      button,
      buttons,
      clickCount: 1,
    });

    return [fromXpath ?? "", toXpath ?? ""];
  }

  /**
   * Type `text` one character at a time by dispatching keyDown/keyUp pairs
   * through CDP `Input.dispatchKeyEvent`; `Input.insertText` is never used.
   * Focus must already be on the desired element.
   *
   * Character handling:
   * - "\n" and "\r" are each sent as an Enter keystroke (so "\r\n" presses
   *   Enter twice); "\t" is sent as Tab.
   * - Every other character is sent as a printable key with `text` set.
   *   Letters, digits and space additionally carry `code` and a virtual key
   *   code.
   *
   * @param text - The characters to type.
   * @param options.delay - Milliseconds to wait after each keystroke;
   *   negative values are treated as 0.
   * @param options.withMistakes - When truthy, each printable character has a
   *   12% chance of being preceded by a random wrong character that is then
   *   removed with Backspace.
   */
  @FlowLogger.wrapWithLogging({ eventType: "PageType" })
  async type(
    text: string,
    options?: { delay?: number; withMistakes?: boolean },
  ): Promise<void> {
    const delay = Math.max(0, options?.delay ?? 0);
    const withMistakes = !!options?.withMistakes;

    const sleep = (ms: number) =>
      new Promise<void>((r) => (ms > 0 ? setTimeout(r, ms) : r()));

    const keyStroke = async (
      ch: string,
      override?: {
        key?: string;
        code?: string;
        windowsVirtualKeyCode?: number;
        /** Text the key generates (e.g. "\r" for Enter); keyDown only. */
        text?: string;
      },
    ) => {
      if (override) {
        // Named key: identity comes from the override, not from `ch`.
        const { text: generatedText, ...identity } = override;
        await this.mainSession.send("Input.dispatchKeyEvent", {
          type: "keyDown",
          ...identity,
          ...(generatedText
            ? { text: generatedText, unmodifiedText: generatedText }
            : {}),
        } as Protocol.Input.DispatchKeyEventRequest);
        // `text` is deliberately left off the keyUp event.
        await this.mainSession.send("Input.dispatchKeyEvent", {
          type: "keyUp",
          ...identity,
        } as Protocol.Input.DispatchKeyEventRequest);
        return;
      }

      // Printable character: include key, code, and text for maximum compatibility
      // Some sites (like Wordle) check event.key rather than relying on text input
      const isLetter = /^[a-zA-Z]$/.test(ch);
      const isDigit = /^[0-9]$/.test(ch);

      let key = ch;
      let code = "";
      let windowsVirtualKeyCode: number | undefined;

      if (isLetter) {
        // For letters, key is the character, code is KeyX where X is uppercase
        key = ch;
        code = `Key${ch.toUpperCase()}`;
        windowsVirtualKeyCode = ch.toUpperCase().charCodeAt(0);
      } else if (isDigit) {
        key = ch;
        code = `Digit${ch}`;
        windowsVirtualKeyCode = ch.charCodeAt(0);
      } else if (ch === " ") {
        key = " ";
        code = "Space";
        windowsVirtualKeyCode = 32;
      }

      const down: Protocol.Input.DispatchKeyEventRequest = {
        type: "keyDown",
        key,
        code: code || undefined,
        text: ch,
        unmodifiedText: ch,
        windowsVirtualKeyCode,
      };
      await this.mainSession.send("Input.dispatchKeyEvent", down);
      await this.mainSession.send("Input.dispatchKeyEvent", {
        type: "keyUp",
        key,
        code: code || undefined,
        windowsVirtualKeyCode,
      } as Protocol.Input.DispatchKeyEventRequest);
    };

    const pressBackspace = async () =>
      keyStroke("\b", {
        key: "Backspace",
        code: "Backspace",
        windowsVirtualKeyCode: 8,
      });

    // Picks a random character from the pool that differs from `avoid`.
    const randomPrintable = (avoid: string): string => {
      const pool =
        "abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ0123456789 .,;:'\"!?@#$%^&*()-_=+[]{}<>/\\|`~";
      let c = avoid;
      while (c === avoid) {
        c = pool[Math.floor(Math.random() * pool.length)];
      }
      return c;
    };

    for (const ch of text) {
      // Control keys that we explicitly map
      if (ch === "\n" || ch === "\r") {
        // Enter must carry text "\r", matching the Enter entry in
        // getNamedKeys(): a keyDown without text is expected to produce no
        // keypress/char event in Chromium, so it would neither insert a
        // newline nor trigger implicit form submission.
        await keyStroke(ch, {
          key: "Enter",
          code: "Enter",
          windowsVirtualKeyCode: 13,
          text: "\r",
        });
      } else if (ch === "\t") {
        await keyStroke(ch, {
          key: "Tab",
          code: "Tab",
          windowsVirtualKeyCode: 9,
        });
      } else {
        if (withMistakes && Math.random() < 0.12) {
          // Type a wrong character, then backspace to correct
          const wrong = randomPrintable(ch);
          await keyStroke(wrong);
          if (delay) await sleep(delay);
          await pressBackspace();
          if (delay) await sleep(delay);
        }
        await keyStroke(ch);
      }

      if (delay) await sleep(delay);
    }
  }

  /**
   * Press and release a single key or a "+"-separated key combination such as
   * "Cmd+A", "Ctrl+C" or "Shift+Tab".
   *
   * The last token is the main key; every preceding token is treated as a
   * modifier. Modifiers go down left to right, then the main key is pressed
   * and released, then the modifiers are released right to left. If any step
   * throws, the tracked modifier state is cleared before the error is
   * rethrown, so later calls do not inherit stuck modifiers.
   *
   * @param key - Key name or combination.
   * @param options.delay - Milliseconds to hold the main key down before
   *   releasing it; negative values are treated as 0.
   */
  @FlowLogger.wrapWithLogging({ eventType: "PageKeyPress" })
  async keyPress(key: string, options?: { delay?: number }): Promise<void> {
    const delay = Math.max(0, options?.delay ?? 0);

    // Splits on "+", except that a "+" with no token in progress starts a
    // token itself, so "+" and "Ctrl++" keep "+" as a key.
    const tokenize = (combo: string): string[] => {
      if (combo === "+") return ["+"];

      const parts: string[] = [];
      let current = "";
      for (const symbol of combo) {
        const isSeparator = symbol === "+" && current !== "";
        if (isSeparator) {
          parts.push(current);
          current = "";
          continue;
        }
        current += symbol;
      }
      if (current !== "") parts.push(current);
      return parts;
    };

    const parts = tokenize(key);
    const primary = parts[parts.length - 1];
    const heldModifiers = parts.slice(0, -1);

    try {
      for (const modifier of heldModifiers) {
        await this.keyDown(modifier);
      }

      await this.keyDown(primary);
      if (delay) {
        await new Promise<void>((wake) => setTimeout(wake, delay));
      }
      await this.keyUp(primary);

      for (const modifier of [...heldModifiers].reverse()) {
        await this.keyUp(modifier);
      }
    } catch (failure) {
      // Drop any tracked modifiers so the failure cannot leak into later calls.
      this._pressedModifiers.clear();
      throw failure;
    }
  }

  /**
   * Capture a hybrid snapshot of the page (shadow DOM always pierced) and
   * return its formatted tree together with the XPath and URL maps.
   *
   * @param options - `includeIframes` is forwarded to the capture routine.
   * @throws StagehandSnapshotError wrapping any error raised while capturing.
   */
  @FlowLogger.wrapWithLogging({ eventType: "PageSnapshot" })
  async snapshot(options?: PageSnapshotOptions): Promise<SnapshotResult> {
    try {
      const captured = await captureHybridSnapshot(this, {
        pierceShadow: true,
        includeIframes: options?.includeIframes,
      });

      const snapshot: SnapshotResult = {
        formattedTree: captured.combinedTree,
        xpathMap: captured.combinedXpathMap,
        urlMap: captured.combinedUrlMap,
      };
      return snapshot;
    } catch (cause) {
      throw new StagehandSnapshotError(cause);
    }
  }

  // Canonical names ("Alt", "Control", "Meta", "Shift") of the modifier keys
  // currently held down: keyDown() adds to the set, keyUp() removes from it,
  // and keyPress() clears it when a combination fails part-way through.
  private _pressedModifiers = new Set<string>();

  /**
   * Press a key down without releasing it.
   *
   * The key name is first canonicalised with normalizeModifierKey(). Modifier
   * keys are recorded in `_pressedModifiers` before the event is built, so the
   * event for a modifier already carries its own modifier bit.
   *
   * Dispatch strategy:
   * - single character with Alt/Control/Meta held: `rawKeyDown` without text
   *   (accelerator), plus mac editing commands on macOS;
   * - single character otherwise: `keyDown` carrying only text and modifiers;
   * - named key from getNamedKeys(): `keyDown` with text when the entry has
   *   text and no modifier is held, `rawKeyDown` otherwise;
   * - anything else: `keyDown` with just the key name and modifiers.
   */
  private async keyDown(key: string): Promise<void> {
    const normalizedKey = this.normalizeModifierKey(key);

    const modifierKeys = ["Alt", "Control", "Meta", "Shift"];
    if (modifierKeys.includes(normalizedKey)) {
      this._pressedModifiers.add(normalizedKey);
    }

    // Modifier bitmask sent with the event: Alt=1, Control=2, Meta=4, Shift=8.
    let modifiers = 0;
    if (this._pressedModifiers.has("Alt")) modifiers |= 1;
    if (this._pressedModifiers.has("Control")) modifiers |= 2;
    if (this._pressedModifiers.has("Meta")) modifiers |= 4;
    if (this._pressedModifiers.has("Shift")) modifiers |= 8;

    const named = this.getNamedKeys();

    // Single-character keys (this includes " ", which "space" normalizes to).
    if (normalizedKey.length === 1) {
      const hasNonShiftModifier =
        this._pressedModifiers.has("Alt") ||
        this._pressedModifiers.has("Control") ||
        this._pressedModifiers.has("Meta");
      if (hasNonShiftModifier) {
        // For accelerators (e.g., Cmd/Ctrl/Alt + key), do not send text. Use rawKeyDown with key/code/VK.
        const desc = this.describePrintableKey(normalizedKey);
        const macCommands = this.isMacOS()
          ? this.macCommandsFor(desc.code ?? "")
          : [];
        // Optional fields are only included when a value is available.
        const req: Protocol.Input.DispatchKeyEventRequest = {
          type: "rawKeyDown",
          modifiers,
          key: desc.key,
          ...(desc.code ? { code: desc.code } : {}),
          ...(typeof desc.vk === "number"
            ? { windowsVirtualKeyCode: desc.vk }
            : {}),
          ...(macCommands.length ? { commands: macCommands } : {}),
        } as Protocol.Input.DispatchKeyEventRequest;
        await this.mainSession.send("Input.dispatchKeyEvent", req);
      } else {
        // Typing path (no non-Shift modifiers): send text to generate input
        await this.mainSession.send("Input.dispatchKeyEvent", {
          type: "keyDown",
          text: normalizedKey,
          unmodifiedText: normalizedKey,
          modifiers,
        } as Protocol.Input.DispatchKeyEventRequest);
      }
      return;
    }

    // Named (multi-character) keys with known key/code/VK metadata.
    const entry = named[normalizedKey] ?? null;
    if (entry) {
      const macCommands = this.isMacOS() ? this.macCommandsFor(entry.code) : [];
      // Text (e.g. "\r" for Enter) is only sent when no modifier is held.
      const includeText = !!entry.text && modifiers === 0;
      const keyDown: Protocol.Input.DispatchKeyEventRequest = {
        type: includeText ? "keyDown" : "rawKeyDown",
        key: entry.key,
        code: entry.code,
        windowsVirtualKeyCode: entry.vk,
        modifiers,
        ...(includeText
          ? {
              text: entry.text,
              unmodifiedText: entry.unmodifiedText ?? entry.text,
            }
          : {}),
        ...(macCommands.length ? { commands: macCommands } : {}),
      } as Protocol.Input.DispatchKeyEventRequest;
      await this.mainSession.send("Input.dispatchKeyEvent", keyDown);
      return;
    }

    // Fallback: send with key property only
    await this.mainSession.send("Input.dispatchKeyEvent", {
      type: "keyDown",
      key: normalizedKey,
      modifiers,
    } as Protocol.Input.DispatchKeyEventRequest);
  }

  /**
   * Release a pressed key.
   *
   * The key name is canonicalised with normalizeModifierKey(). The modifier
   * bitmask is computed BEFORE a released modifier is removed from
   * `_pressedModifiers`, so the keyUp event of a modifier still carries that
   * modifier's own bit.
   *
   * Single characters are described via describePrintableKey(), named keys via
   * getNamedKeys(); any other name is sent with only `key` and `modifiers`.
   */
  private async keyUp(key: string): Promise<void> {
    const normalizedKey = this.normalizeModifierKey(key);

    // Modifier bitmask sent with the event: Alt=1, Control=2, Meta=4, Shift=8.
    let modifiers = 0;
    if (this._pressedModifiers.has("Alt")) modifiers |= 1;
    if (this._pressedModifiers.has("Control")) modifiers |= 2;
    if (this._pressedModifiers.has("Meta")) modifiers |= 4;
    if (this._pressedModifiers.has("Shift")) modifiers |= 8;

    // Stop tracking the modifier only after the bitmask above was captured.
    const modifierKeys = ["Alt", "Control", "Meta", "Shift"];
    if (modifierKeys.includes(normalizedKey)) {
      this._pressedModifiers.delete(normalizedKey);
    }

    const named = this.getNamedKeys();

    // Single-character keys: key/code/VK come from describePrintableKey().
    if (normalizedKey.length === 1) {
      const desc = this.describePrintableKey(normalizedKey);
      await this.mainSession.send("Input.dispatchKeyEvent", {
        type: "keyUp",
        key: desc.key,
        code: desc.code,
        windowsVirtualKeyCode:
          typeof desc.vk === "number" ? desc.vk : undefined,
        modifiers,
      } as Protocol.Input.DispatchKeyEventRequest);
      return;
    }

    // Named (multi-character) keys with known key/code/VK metadata.
    const entry = named[normalizedKey] ?? null;
    if (entry) {
      await this.mainSession.send("Input.dispatchKeyEvent", {
        type: "keyUp",
        key: entry.key,
        code: entry.code,
        windowsVirtualKeyCode: entry.vk,
        modifiers,
      } as Protocol.Input.DispatchKeyEventRequest);
      return;
    }

    // Fallback: send with key property only
    await this.mainSession.send("Input.dispatchKeyEvent", {
      type: "keyUp",
      key: normalizedKey,
      modifiers,
    } as Protocol.Input.DispatchKeyEventRequest);
  }

  /**
   * Map a user-supplied key name (case-insensitive) to the canonical name used
   * by the key helpers in this class, e.g. "ctrl" -> "Control",
   * "esc" -> "Escape", "space" -> " ", "pgdn" -> "PageDown".
   *
   * "cmd", "command" and "controlormeta" are platform dependent: "Meta" on
   * macOS, "Control" everywhere else. Names without an alias are returned
   * unchanged, with their original casing.
   */
  private normalizeModifierKey(key: string): string {
    const alias = key.toLowerCase();

    // On Mac, Cmd is Meta; elsewhere map to Control for common shortcuts.
    if (alias === "cmd" || alias === "command" || alias === "controlormeta") {
      return this.isMacOS() ? "Meta" : "Control";
    }

    const canonicalNames = new Map<string, string>([
      // Modifier keys
      ["win", "Meta"],
      ["windows", "Meta"],
      ["meta", "Meta"],
      ["ctrl", "Control"],
      ["control", "Control"],
      ["option", "Alt"],
      ["alt", "Alt"],
      ["shift", "Shift"],
      // Action keys
      ["enter", "Enter"],
      ["return", "Enter"],
      ["esc", "Escape"],
      ["escape", "Escape"],
      ["backspace", "Backspace"],
      ["tab", "Tab"],
      ["space", " "],
      ["spacebar", " "],
      ["delete", "Delete"],
      ["del", "Delete"],
      // Arrow keys
      ["left", "ArrowLeft"],
      ["arrowleft", "ArrowLeft"],
      ["right", "ArrowRight"],
      ["arrowright", "ArrowRight"],
      ["up", "ArrowUp"],
      ["arrowup", "ArrowUp"],
      ["down", "ArrowDown"],
      ["arrowdown", "ArrowDown"],
      // Navigation keys
      ["home", "Home"],
      ["end", "End"],
      ["pageup", "PageUp"],
      ["pgup", "PageUp"],
      ["pagedown", "PageDown"],
      ["pgdn", "PageDown"],
    ]);

    return canonicalNames.get(alias) ?? key;
  }

  /**
   * Build the lookup table of named (non-printable and modifier) keys.
   * Each entry provides the `key`, `code` and virtual key code to send;
   * Enter additionally carries the text it generates ("\r").
   * A fresh object is returned on every call.
   */
  private getNamedKeys(): Record<
    string,
    {
      key: string;
      code: string;
      vk: number;
      text?: string;
      unmodifiedText?: string;
    }
  > {
    // Entry whose `code` equals its `key` unless stated otherwise.
    const entry = (name: string, vk: number, code: string = name) => ({
      key: name,
      code,
      vk,
    });

    return {
      Enter: { ...entry("Enter", 13), text: "\r", unmodifiedText: "\r" },
      Tab: entry("Tab", 9),
      Backspace: entry("Backspace", 8),
      Escape: entry("Escape", 27),
      Delete: entry("Delete", 46),
      ArrowLeft: entry("ArrowLeft", 37),
      ArrowUp: entry("ArrowUp", 38),
      ArrowRight: entry("ArrowRight", 39),
      ArrowDown: entry("ArrowDown", 40),
      Home: entry("Home", 36),
      End: entry("End", 35),
      PageUp: entry("PageUp", 33),
      PageDown: entry("PageDown", 34),
      // Modifier keys report the left-hand physical key as their code.
      Alt: entry("Alt", 18, "AltLeft"),
      Control: entry("Control", 17, "ControlLeft"),
      Meta: entry("Meta", 91, "MetaLeft"),
      Shift: entry("Shift", 16, "ShiftLeft"),
    };
  }

  /**
   * Describe a printable key so that events which do not carry text (the
   * accelerator path used when a non-Shift modifier is held, and keyUp) can
   * still provide `key`, `code` and a Windows virtual key code.
   *
   * Covered: letters, digits, space, US-layout punctuation and the shifted
   * digit symbols (e.g. "!" is reported as Digit1). For any other character
   * only `key` is returned: guessing a virtual key code from the character
   * code is unsafe because ASCII punctuation collides with navigation and
   * editing keys ("." is 46 = Delete, "-" is 45 = Insert, "%" is 37 =
   * ArrowLeft), which could make an accelerator act as a different key.
   *
   * @param ch - The character to describe (expected to be a single character).
   * @returns `key` always; `code` and `vk` only when they are known.
   */
  private describePrintableKey(ch: string): {
    key: string;
    code?: string;
    vk?: number;
  } {
    const shiftDown = this._pressedModifiers.has("Shift");
    const isLetter = /^[a-zA-Z]$/.test(ch);
    const isDigit = /^[0-9]$/.test(ch);

    if (isLetter) {
      const upper = ch.toUpperCase();
      return {
        key: shiftDown ? upper : upper.toLowerCase(),
        code: `Key${upper}`,
        vk: upper.charCodeAt(0), // 'A'..'Z' => 65..90
      };
    }

    if (isDigit) {
      return {
        key: ch,
        code: `Digit${ch}`,
        vk: ch.charCodeAt(0), // '0'..'9' => 48..57
      };
    }

    if (ch === " ") {
      return { key: " ", code: "Space", vk: 32 };
    }

    if (ch.length === 1) {
      // Symbols produced by Shift+digit on a US layout, indexed by the digit.
      const shiftedDigit = ")!@#$%^&*(".indexOf(ch);
      if (shiftedDigit !== -1) {
        return { key: ch, code: `Digit${shiftedDigit}`, vk: 48 + shiftedDigit };
      }

      // US-layout punctuation keys: [unshifted, shifted, code, virtual key].
      const punctuation: ReadonlyArray<
        readonly [string, string, string, number]
      > = [
        [";", ":", "Semicolon", 186],
        ["=", "+", "Equal", 187],
        [",", "<", "Comma", 188],
        ["-", "_", "Minus", 189],
        [".", ">", "Period", 190],
        ["/", "?", "Slash", 191],
        ["`", "~", "Backquote", 192],
        ["[", "{", "BracketLeft", 219],
        ["\\", "|", "Backslash", 220],
        ["]", "}", "BracketRight", 221],
        ["'", '"', "Quote", 222],
      ];
      const match = punctuation.find(
        ([plain, shifted]) => ch === plain || ch === shifted,
      );
      if (match) {
        return { key: ch, code: match[2], vk: match[3] };
      }
    }

    // Unknown character: report the key only. Callers already handle a
    // missing `code`/`vk`.
    return { key: shiftDown ? ch.toUpperCase() : ch };
  }

  /**
   * Report whether the current process runs on macOS
   * (`process.platform === "darwin"`). Returns false when reading the
   * platform throws, e.g. if `process` is not defined.
   */
  private isMacOS(): boolean {
    let platform: string | undefined;
    try {
      platform = process.platform;
    } catch {
      platform = undefined;
    }
    return platform === "darwin";
  }

  /**
   * Look up the Chromium mac editing commands for a key `code` (such as
   * "KeyA") combined with the currently tracked modifiers. Only used on macOS
   * to trigger system editing shortcuts (selectAll, copy, cut, paste, undo).
   *
   * The lookup key is built as "Shift+Control+Alt+Meta+<code>", keeping only
   * the modifiers that are held, in that order. Commands starting with
   * "insert" are dropped and the trailing ":" is stripped.
   *
   * @returns The matching command names, or `[]` off macOS or without a match.
   */
  private macCommandsFor(code: string): string[] {
    if (!this.isMacOS()) return [];

    const held = ["Shift", "Control", "Alt", "Meta"].filter((modifier) =>
      this._pressedModifiers.has(modifier),
    );
    const shortcut = [...held, code].join("+");

    const commandsByShortcut: Record<string, string | string[]> = {
      "Meta+KeyA": "selectAll:",
      "Meta+KeyC": "copy:",
      "Meta+KeyX": "cut:",
      "Meta+KeyV": "paste:",
      "Meta+KeyZ": "undo:",
    };

    const found = commandsByShortcut[shortcut];
    if (!found) return [];

    const candidates = Array.isArray(found) ? found : [found];
    const commands: string[] = [];
    for (const candidate of candidates) {
      if (candidate.startsWith("insert")) continue;
      commands.push(candidate.slice(0, -1)); // drop the trailing ':'
    }
    return commands;
  }

  // ---- Page-level lifecycle waiter that follows main frame id swaps ----

  /**
   * Resolve the main-world execution context id of the current main frame by
   * delegating to `executionContexts.waitForMainWorld`, passing 1000 as its
   * third argument.
   */
  private async mainWorldExecutionContextId(): Promise<number> {
    const session = this.mainSession;
    const frameId = this.mainFrameId();
    return executionContexts.waitForMainWorld(session, frameId, 1000);
  }

  /**
   * Check `document.readyState` in the main frame's main world against the
   * requested load state.
   *
   * - "domcontentloaded" is satisfied by "interactive" or "complete".
   * - "load" is satisfied only by "complete".
   *
   * @returns false whenever the context lookup or the evaluation fails.
   */
  private async isMainLoadStateReady(
    state: "domcontentloaded" | "load",
  ): Promise<boolean> {
    let readyState: string;
    try {
      const contextId = await this.mainWorldExecutionContextId();
      const response =
        await this.mainSession.send<Protocol.Runtime.EvaluateResponse>(
          "Runtime.evaluate",
          {
            expression: "document.readyState",
            contextId,
            returnByValue: true,
          },
        );
      readyState = String(response.result?.value ?? "");
    } catch {
      return false;
    }

    if (readyState === "complete") return true;
    return state === "domcontentloaded" && readyState === "interactive";
  }

  /**
   * Wait until the **current** main frame reaches a lifecycle state.
   * - Fast path via `document.readyState`.
   * - Event path listens at the session level and compares incoming `frameId`
   *   to `mainFrameId()` **at event time** to follow root swaps.
   * - Polling path re-checks `document.readyState` every 100ms in case the
   *   matching event was missed.
   *
   * @param state - Load state to wait for. The readyState fast path and the
   *   polling only apply to "domcontentloaded" and "load"; other states can
   *   only complete through a matching `Page.lifecycleEvent`.
   * @param timeoutMs - Maximum time to wait in milliseconds (default 15000).
   * @throws Error when the state is not reached within `timeoutMs`.
   */
  async waitForMainLoadState(
    state: LoadState,
    timeoutMs = 15000,
  ): Promise<void> {
    // Best-effort: a failure to enable lifecycle events is ignored.
    await this.mainSession
      .send("Page.setLifecycleEventsEnabled", { enabled: true })
      .catch(() => {});

    // Fast path: check the *current* main frame's readyState.
    if (
      (state === "domcontentloaded" || state === "load") &&
      (await this.isMainLoadStateReady(state))
    ) {
      return;
    }

    // Lifecycle event name to wait for (looked up in LIFECYCLE_NAME, which is
    // defined outside this method).
    const wanted = LIFECYCLE_NAME[state];
    return new Promise<void>((resolve, reject) => {
      // `done` guards against settling twice (event vs. poll vs. timeout).
      let done = false;
      let timer: ReturnType<typeof setTimeout> | null = null;
      let pollTimer: ReturnType<typeof setTimeout> | null = null;
      // Prevents overlapping readyState polls.
      let pollInFlight = false;

      // Detach all three session listeners registered below.
      const off = () => {
        this.mainSession.off("Page.lifecycleEvent", onLifecycle);
        this.mainSession.off("Page.domContentEventFired", onDomContent);
        this.mainSession.off("Page.loadEventFired", onLoad);
      };
      const clearPollTimer = () => {
        if (pollTimer) {
          clearTimeout(pollTimer);
          pollTimer = null;
        }
      };

      // Success path: stop timers, detach listeners, resolve exactly once.
      const finish = () => {
        if (done) return;
        done = true;
        if (timer) {
          clearTimeout(timer);
          timer = null;
        }
        clearPollTimer();
        off();
        resolve();
      };

      const onLifecycle = (evt: Protocol.Page.LifecycleEventEvent) => {
        if (evt.name !== wanted) return;
        // Compare against the *current* main frame id when the event arrives.
        if (evt.frameId === this.mainFrameId()) finish();
      };

      // The two backup handlers below do not compare a frame id.
      const onDomContent = () => {
        if (state === "domcontentloaded") finish();
      };

      const onLoad = () => {
        if (state === "load") finish();
      };

      this.mainSession.on("Page.lifecycleEvent", onLifecycle);
      // Backups for sites that don't emit lifecycle consistently
      this.mainSession.on("Page.domContentEventFired", onDomContent);
      this.mainSession.on("Page.loadEventFired", onLoad);

      // Fallback polling closes lifecycle-event races in remote environments
      // where readyState has advanced but the corresponding event was missed.
      const pollReadyState = async () => {
        if (done || pollInFlight) return;
        pollInFlight = true;
        try {
          if (done) return;
          if (
            (state === "domcontentloaded" || state === "load") &&
            (await this.isMainLoadStateReady(state))
          ) {
            finish();
            return;
          }
        } finally {
          pollInFlight = false;
        }
        // Not ready yet: schedule the next poll in 100ms.
        if (!done) {
          clearPollTimer();
          pollTimer = setTimeout(() => {
            void pollReadyState();
          }, 100);
        }
      };
      void pollReadyState();

      // Failure path: reject once the overall deadline passes.
      timer = setTimeout(() => {
        if (done) return;
        done = true;
        clearPollTimer();
        off();
        reject(
          new Error(
            `waitForMainLoadState(${state}) timed out after ${timeoutMs}ms`,
          ),
        );
      }, timeoutMs);
    });
  }
}


================================================
FILE: packages/core/lib/v3/understudy/piercer.ts
================================================
import type { Protocol } from "devtools-protocol";
import { v3Logger } from "../logger.js";
import type { CDPSessionLike } from "./cdp.js";
import { v3ScriptContent } from "../dom/build/scriptV3Content.js";
import { reRenderScriptContent } from "../dom/build/reRenderScriptContent.js";

/**
 * Install the v3 piercer script into a CDP session.
 *
 * Steps, in order:
 * 1. `Page.enable` — if this fails, nothing is installed and `false` is returned.
 * 2. `Runtime.enable` — failures ignored.
 * 3. Register the piercer via `Page.addScriptToEvaluateOnNewDocument`
 *    (`runImmediately: true`). If the session no longer exists, return
 *    `false`; other errors are ignored.
 * 4. Evaluate the piercer script directly — failures ignored.
 * 5. Evaluate the re-render script — failures ignored.
 *
 * @returns `true` when the sequence ran to the end, `false` when the session
 *   could not be prepared or vanished during installation.
 */
export async function installV3PiercerIntoSession(
  session: CDPSessionLike,
): Promise<boolean> {
  const ignoreFailure = (): void => {};

  const pageEnabled = await session.send("Page.enable").then(
    () => true,
    () => false,
  );
  if (!pageEnabled) {
    return false;
  }

  await session.send("Runtime.enable").catch(ignoreFailure);

  try {
    await session.send<Protocol.Page.AddScriptToEvaluateOnNewDocumentResponse>(
      "Page.addScriptToEvaluateOnNewDocument",
      { source: v3ScriptContent, runImmediately: true },
    );
  } catch (err) {
    // If the session vanished during attach (common with short-lived OOPIFs),
    // report failure so callers can early-return. Any other error is
    // tolerated because the direct evaluation below is idempotent.
    const reason = String((err as Error)?.message ?? err ?? "");
    if (reason.includes("Session with given id not found")) {
      return false;
    }
  }

  // First the piercer itself, then the re-render pass: custom elements whose
  // shadow roots were created before attachShadow was patched get their
  // closed roots recreated under the hook.
  const evaluations = [
    { expression: v3ScriptContent, returnByValue: true, awaitPromise: true },
    {
      expression: reRenderScriptContent,
      returnByValue: true,
      awaitPromise: false,
    },
  ];
  for (const params of evaluations) {
    await session
      .send<Protocol.Runtime.EvaluateResponse>("Runtime.evaluate", params)
      .catch(ignoreFailure);
  }

  return true;
}

/**
 * (Optional) Forward piercer console output to the node-side logger during
 * bring-up. Console calls whose first argument starts with "[v3-piercer]" are
 * logged under the "piercer" category, prefixed with `label`; the second
 * console argument (stringified) is attached as auxiliary data.
 */
export function tapPiercerConsole(
  session: CDPSessionLike,
  label: string,
): void {
  const forward = (evt: Protocol.Runtime.ConsoleAPICalledEvent): void => {
    const head = evt.args?.[0]?.value as string | undefined;
    if (!head?.startsWith?.("[v3-piercer]")) return;

    const detail = String(evt.args?.[1]?.value ?? "");
    v3Logger({
      category: "piercer",
      message: `[${label}] ${head}`,
      level: 2,
      auxiliary: {
        value: { value: detail, type: "string" },
      },
    });
  };

  session.on<Protocol.Runtime.ConsoleAPICalledEvent>(
    "Runtime.consoleAPICalled",
    forward,
  );
}


================================================
FILE: packages/core/lib/v3/understudy/response.ts
================================================
/**
 * Response
 * -----------------
 *
 * This module implements a Playwright-inspired response wrapper that exposes
 * navigation metadata and helpers for retrieving HTTP response bodies. The
 * abstraction is consumed by navigation routines (e.g. `Page.goto`) so callers
 * can synchronously inspect status codes, lazily fetch body text, or await the
 * network layer finishing the request. The implementation is built directly on
 * Chrome DevTools Protocol primitives – it holds the originating `requestId`
 * so it can request payloads via `Network.getResponseBody`, and it listens for
 * `responseReceivedExtraInfo`, `loadingFinished`, and `loadingFailed` events to
 * hydrate the richer header view and resolve callers waiting on completion.
 */

import type { Protocol } from "devtools-protocol";
import type { SerializableResponse } from "../types/private/index.js";
import {
  ResponseBodyError,
  ResponseParseError,
} from "../types/public/sdkErrors.js";
import type { CDPSessionLike } from "./cdp.js";
import type { Frame } from "./frame.js";
import type { Page } from "./page.js";

/** Remote endpoint (IP address and port) reported by Chrome for a response. */
type ServerAddr = { ipAddress: string; port: number };

/**
 * Structural type guard for serialized response payloads.
 *
 * Accepts any non-null object that carries a string `requestId` and a non-null
 * object `response`; no deeper validation of either field is performed.
 */
export function isSerializableResponse(
  value: unknown,
): value is SerializableResponse {
  if (typeof value !== "object" || value === null) return false;
  const candidate = value as Partial<SerializableResponse>;
  return (
    typeof candidate.requestId === "string" &&
    typeof candidate.response === "object" &&
    candidate.response !== null
  );
}

/**
 * A promise bundled with its own settle functions. Navigation tracking hands
 * the promise to callers and settles it later from event callbacks; each
 * response owns one deferred backing its "finished" promise, mirroring
 * Playwright's `response.finished()`.
 */
type Deferred<T> = {
  promise: Promise<T>;
  resolve: (value: T) => void;
  reject: (error: Error) => void;
};

/** Creates a pending promise together with the functions that settle it. */
function createDeferred<T>(): Deferred<T> {
  // The executor runs synchronously, so both handles are assigned before the
  // object below is built.
  let settleOk!: (value: T) => void;
  let settleErr!: (error: Error) => void;
  const pending = new Promise<T>((onResolve, onReject) => {
    settleOk = onResolve;
    settleErr = onReject;
  });
  return { promise: pending, resolve: settleOk, reject: settleErr };
}

/** Lowercases a header name so lookups can ignore the casing used on the wire. */
function normaliseHeaderName(name: string): string {
  const lowered = name.toLowerCase();
  return lowered;
}

/**
 * Breaks a newline-separated header value into its individual values. Each
 * piece is trimmed and empty pieces are dropped.
 */
function splitHeaderValues(value: string): string[] {
  const values: string[] = [];
  for (const rawPiece of value.split(/\r?\n/)) {
    const piece = rawPiece.trim();
    if (piece) values.push(piece);
  }
  return values;
}

/**
 * Turns a raw HTTP header text block (as emitted by CDP) into an ordered list
 * of name/value pairs, keeping the casing found in the text. Empty lines,
 * lines starting with "HTTP/" (the status line) and lines without a colon are
 * skipped; names and values are trimmed.
 */
function parseHeadersText(
  headersText: string | undefined,
): Array<{ name: string; value: string }> {
  if (!headersText) return [];
  return headersText.split(/\r?\n/).flatMap((line) => {
    if (line === "" || line.startsWith("HTTP/")) return [];
    // Only the first colon separates name from value; later ones belong to the value.
    const colonAt = line.indexOf(":");
    if (colonAt < 0) return [];
    return [
      {
        name: line.slice(0, colonAt).trim(),
        value: line.slice(colonAt + 1).trim(),
      },
    ];
  });
}

/**
 * Thin wrapper around CDP response metadata that mirrors the ergonomics of
 * Playwright's `Response` class. The class intentionally keeps the same method
 * names so upstream integrations can transition with minimal code changes.
 *
 * Header data is kept in three views:
 *  - `headersObject` / `headerValuesMap`: lowercase-keyed lookups, rebuilt
 *    whenever extra header info arrives;
 *  - `allHeadersCache` / `headersArrayCache`: lazily computed snapshots that
 *    are invalidated by `applyExtraInfo`.
 */
export class Response {
  private readonly page: Page;
  private readonly session: CDPSessionLike;
  private readonly requestId: string;
  private readonly frameId?: string;
  private readonly loaderId?: string;
  private readonly response: Protocol.Network.Response;
  private readonly fromServiceWorkerFlag: boolean;
  private readonly serverAddress?: ServerAddr | null;

  private headersObject: Record<string, string>;
  private headersArrayCache: Array<{ name: string; value: string }> | null =
    null;
  private allHeadersCache: Record<string, string> | null = null;
  private readonly headerValuesMap = new Map<string, string[]>();

  private finishedDeferred = createDeferred<null | Error>();
  private finishedSettled = false;

  private extraInfoHeaders: Protocol.Network.Headers | null = null;
  private extraInfoHeadersText: string | undefined;

  /**
   * Build a response wrapper from the CDP notification associated with a
   * navigation. The constructor captures the owning page/session so follow-up
   * methods (body/text/json) can query CDP on-demand. The `response` payload is
   * the raw `Protocol.Network.Response` object emitted by Chrome.
   */
  constructor(params: {
    page: Page;
    session: CDPSessionLike;
    requestId: string;
    frameId?: string;
    loaderId?: string;
    response: Protocol.Network.Response;
    fromServiceWorker: boolean;
  }) {
    this.page = params.page;
    this.session = params.session;
    this.requestId = params.requestId;
    this.frameId = params.frameId;
    this.loaderId = params.loaderId;
    this.response = params.response;
    this.fromServiceWorkerFlag = params.fromServiceWorker;

    // Only expose a server address when both halves are present.
    const { remoteIPAddress, remotePort } = params.response;
    this.serverAddress =
      remoteIPAddress && remotePort !== undefined
        ? { ipAddress: remoteIPAddress, port: remotePort }
        : null;

    this.headersObject = {};
    this.indexHeaders(this.response.headers);
  }

  /** URL associated with the navigation request. */
  url(): string {
    return this.response.url;
  }

  /** HTTP status code reported by Chrome. */
  status(): number {
    return this.response.status;
  }

  /** Human-readable status text that accompanied the response. */
  statusText(): string {
    return this.response.statusText;
  }

  /** Convenience predicate that checks for 2xx statuses. */
  ok(): boolean {
    const status = this.status();
    return status >= 200 && status <= 299;
  }

  /**
   * Returns the Stagehand frame object that initiated the navigation, or
   * `null` when no frame id was recorded or the page lookup throws.
   */
  frame(): Frame | null {
    if (!this.frameId) return null;
    try {
      return this.page.frameForId(this.frameId);
    } catch {
      return null;
    }
  }

  /** Indicates whether the response was serviced by a Service Worker. */
  fromServiceWorker(): boolean {
    return this.fromServiceWorkerFlag;
  }

  /**
   * Returns TLS security metadata when provided by the browser. In practice
   * this includes certificate issuer, protocol, and validity interval.
   */
  async securityDetails(): Promise<Protocol.Network.SecurityDetails | null> {
    return this.response.securityDetails ?? null;
  }

  /** Returns the resolved server address for the navigation when available. */
  async serverAddr(): Promise<ServerAddr | null> {
    return this.serverAddress ?? null;
  }

  /**
   * Returns the response headers normalised to lowercase keys. Matches the
   * behaviour of Playwright's `headers()` by eliding duplicate header entries.
   * A fresh object is returned on every call.
   */
  headers(): Record<string, string> {
    return { ...this.headersObject };
  }

  /**
   * Returns all headers including those only surfaced through
   * `responseReceivedExtraInfo` such as `set-cookie`. Values are reported as the
   * browser sends them (no further splitting or concatenation).
   */
  async allHeaders(): Promise<Record<string, string>> {
    if (this.allHeadersCache) return { ...this.allHeadersCache };
    const source = this.extraInfoHeaders ?? this.response.headers ?? {};
    const map: Record<string, string> = {};
    for (const [name, value] of Object.entries(source)) {
      map[name] = String(value);
    }
    this.allHeadersCache = map;
    return { ...map };
  }

  /**
   * Returns a concatenated header string for the supplied header name, or
   * `null` when the header is absent.
   */
  async headerValue(name: string): Promise<string | null> {
    const values = await this.headerValues(name);
    if (!values.length) return null;
    return values.join(", ");
  }

  /** Returns all values for a header (case-insensitive lookup). */
  async headerValues(name: string): Promise<string[]> {
    const lower = normaliseHeaderName(name);
    if (this.extraInfoHeaders) {
      // Try the caller's casing first, then lowercase; any other casing is
      // covered by the lowercase index below.
      const raw = this.extraInfoHeaders[name] ?? this.extraInfoHeaders[lower];
      if (raw !== undefined) {
        return splitHeaderValues(String(raw));
      }
    }
    const values = this.headerValuesMap.get(lower);
    return values ? [...values] : [];
  }

  /**
   * Returns header entries preserving their original wire casing and ordering.
   * Falls back to the CDP object when the raw header text is unavailable.
   *
   * Every call returns freshly copied entries, so callers may mutate the
   * result without affecting what later calls observe.
   */
  async headersArray(): Promise<Array<{ name: string; value: string }>> {
    let entries = this.headersArrayCache;
    if (!entries) {
      const entriesFromText = parseHeadersText(this.extraInfoHeadersText);
      if (entriesFromText.length > 0) {
        entries = entriesFromText;
      } else {
        entries = [];
        const source = this.extraInfoHeaders ?? this.response.headers ?? {};
        for (const [name, value] of Object.entries(source)) {
          for (const val of splitHeaderValues(String(value))) {
            entries.push({ name, value: val });
          }
        }
      }
      this.headersArrayCache = entries;
    }
    // Copy each entry: a shallow array copy would still share the entry
    // objects with the cache and let callers corrupt it.
    return entries.map((entry) => ({ ...entry }));
  }

  /**
   * Requests the raw response body from Chrome DevTools Protocol. The method is
   * intentionally lazy because not every caller needs the payload, and CDP only
   * allows retrieving it once the response completes.
   *
   * @throws ResponseBodyError when the CDP request rejects.
   */
  async body(): Promise<Buffer> {
    const result = await this.session
      .send<Protocol.Network.GetResponseBodyResponse>(
        "Network.getResponseBody",
        { requestId: this.requestId },
      )
      .catch((error) => {
        throw new ResponseBodyError(String(error));
      });

    const encoding = result.base64Encoded ? "base64" : "utf-8";
    return Buffer.from(result.body, encoding);
  }

  /** Decodes the response body as UTF-8 text. */
  async text(): Promise<string> {
    const buffer = await this.body();
    return buffer.toString("utf-8");
  }

  /**
   * Parses the response body as JSON.
   *
   * @throws ResponseParseError when the body is not valid JSON.
   */
  async json<T = unknown>(): Promise<T> {
    const text = await this.text();
    try {
      return JSON.parse(text) as T;
    } catch (error) {
      throw new ResponseParseError(String(error));
    }
  }

  /**
   * Resolves once the underlying network request completes or fails. Mirrors
   * Playwright's behaviour by resolving to `null` on success and to an `Error`
   * instance when Chrome reports `Network.loadingFailed`.
   */
  async finished(): Promise<null | Error> {
    return this.finishedDeferred.promise;
  }

  /**
   * Internal helper invoked by the navigation tracker when CDP reports extra
   * header information. Replaces the header source, drops the cached
   * snapshots and rebuilds the lowercase lookups from the new headers.
   */
  public applyExtraInfo(
    event: Protocol.Network.ResponseReceivedExtraInfoEvent,
  ): void {
    this.extraInfoHeaders = event.headers;
    this.extraInfoHeadersText = event.headersText;
    this.allHeadersCache = null;
    this.headersArrayCache = null;
    this.indexHeaders(event.headers);
  }

  /**
   * Internal helper for creating a Response object from a Serializable
   * goto response from the Stagehand API
   */
  public static fromSerializable(
    serialized: SerializableResponse,
    context: { page: Page; session: CDPSessionLike },
  ): Response {
    const reconstructed = new Response({
      page: context.page,
      session: context.session,
      requestId: serialized.requestId,
      frameId: serialized.frameId,
      loaderId: serialized.loaderId,
      response: serialized.response as Protocol.Network.Response,
      fromServiceWorker: serialized.fromServiceWorkerFlag ?? false,
    });

    if (serialized.extraInfoHeaders) {
      reconstructed.applyExtraInfo({
        requestId: serialized.requestId,
        headers: serialized.extraInfoHeaders,
        headersText: serialized.extraInfoHeadersText,
      } as Protocol.Network.ResponseReceivedExtraInfoEvent);
    }

    if (serialized.finishedSettled) {
      reconstructed.markFinished(null);
    }

    return reconstructed;
  }

  /**
   * Marks the response as finished and resolves the `finished()` promise with
   * the supplied error (or `null` on success). Only the first call has any
   * effect.
   */
  public markFinished(error: Error | null): void {
    if (this.finishedSettled) return;
    this.finishedSettled = true;
    this.finishedDeferred.resolve(error ?? null);
  }

  /**
   * Rebuilds the lowercase header lookups (`headersObject` and
   * `headerValuesMap`) from a CDP header map. Entries whose value is
   * `undefined` are skipped so they never surface as the string "undefined".
   */
  private indexHeaders(source: Protocol.Network.Headers | undefined): void {
    this.headersObject = {};
    this.headerValuesMap.clear();
    for (const [name, value] of Object.entries(source ?? {})) {
      if (value === undefined) continue;
      const lower = normaliseHeaderName(name);
      const values = splitHeaderValues(String(value));
      this.headerValuesMap.set(lower, values);
      this.headersObject[lower] = values.join(", ");
    }
  }
}


================================================
FILE: packages/core/lib/v3/understudy/screenshotUtils.ts
================================================
import { Protocol } from "devtools-protocol";
import type { CDPSessionLike } from "./cdp.js";
import type { Frame } from "./frame.js";
import type { Locator } from "./locator.js";
import type { Page } from "./page.js";
import type {
  ScreenshotClip,
  ScreenshotScaleOption,
} from "../types/public/screenshotTypes.js";
import { StagehandInvalidArgumentError } from "../types/public/sdkErrors.js";
import { screenshotScriptSources } from "../dom/build/screenshotScripts.generated.js";

/**
 * Undo callback returned by the screenshot preparation helpers in this module.
 * May be synchronous or return a promise.
 */
export type ScreenshotCleanup = () => Promise<void> | void;

/**
 * Lists the page's frames with one entry per `frameId`, main frame first.
 * When several frames share an id, the last one reported wins but keeps the
 * position of the first occurrence.
 */
export function collectFramesForScreenshot(page: Page): Frame[] {
  const byId = new Map<string, Frame>();
  for (const frame of [page.mainFrame(), ...page.frames()]) {
    byId.set(frame.frameId, frame);
  }
  return [...byId.values()];
}

/**
 * Coerces every clip field to a number and validates the result.
 *
 * @returns a new clip object containing only `x`, `y`, `width` and `height`.
 * @throws StagehandInvalidArgumentError when any field is not a finite number
 *   (the first offending field, in x/y/width/height order, is named) or when
 *   width/height is not positive.
 */
export function normalizeScreenshotClip(clip: ScreenshotClip): ScreenshotClip {
  const normalized = {
    x: Number(clip.x),
    y: Number(clip.y),
    width: Number(clip.width),
    height: Number(clip.height),
  };

  const offending = Object.entries(normalized).find(
    ([, value]) => !Number.isFinite(value),
  );
  if (offending) {
    throw new StagehandInvalidArgumentError(
      `screenshot: clip.${offending[0]} must be a finite number`,
    );
  }

  // All fields are finite here, so this is the same as rejecting <= 0.
  if (!(normalized.width > 0 && normalized.height > 0)) {
    throw new StagehandInvalidArgumentError(
      "screenshot: clip width/height must be positive",
    );
  }

  return normalized;
}

/**
 * Computes the scale factor to use for a screenshot.
 *
 * For any mode other than "css" the result is `undefined`. For "css" the
 * main frame's `devicePixelRatio` is read and its reciprocal returned, clamped
 * to the range [0.1, 2]. A failed or unusable ratio is treated as 1, and any
 * unexpected error yields 1.
 */
export async function computeScreenshotScale(
  page: Page,
  mode: ScreenshotScaleOption,
): Promise<number | undefined> {
  if (mode !== "css") return undefined;
  try {
    const reportedRatio = await page
      .mainFrame()
      .evaluate(() => {
        const reported = Number(window.devicePixelRatio || 1);
        if (!Number.isFinite(reported) || reported <= 0) return 1;
        return reported;
      })
      .catch(() => 1);
    // Re-validate on the Node side; the evaluated value is not trusted.
    const usable = Number.isFinite(reportedRatio) && reportedRatio > 0;
    const cssScale = 1 / (usable ? reportedRatio : 1);
    return Math.min(2, Math.max(0.1, cssScale));
  } catch {
    return 1;
  }
}

/**
 * Overrides the default page background with fully transparent black via
 * `Emulation.setDefaultBackgroundColorOverride`.
 *
 * @returns a cleanup that sends the same command with no colour to clear the
 *   override. Rejections from either command are ignored.
 */
export async function setTransparentBackground(
  session: CDPSessionLike,
): Promise<ScreenshotCleanup> {
  const overrideBackground = (params: object) =>
    session
      .send("Emulation.setDefaultBackgroundColorOverride", params)
      .catch(() => {});

  await overrideBackground({ color: { r: 0, g: 0, b: 0, a: 0 } });

  return async () => {
    await overrideBackground({});
  };
}

/**
 * Injects a `<style>` element carrying `css` into every given frame.
 *
 * Each injected element is tagged with a per-call `data-stagehand-style`
 * token (built from `label`, the current time and a random suffix) so the
 * returned cleanup can find and remove exactly those elements again.
 * Blank CSS results in a no-op cleanup and no frame is touched. Failures in
 * individual frames are ignored.
 */
export async function applyStyleToFrames(
  frames: Frame[],
  css: string,
  label: string,
): Promise<ScreenshotCleanup> {
  const styleText = css.trim();
  if (styleText === "") return async () => {};

  const stamp = Date.now();
  const nonce = Math.random().toString(36).slice(2);
  const token = `__v3_style_${label}_${stamp}_${nonce}`;

  const injections = frames.map((frame) =>
    frame
      .evaluate(
        ({ css, token }) => {
          try {
            if (!document) return;
            const styleEl = document.createElement("style");
            styleEl.setAttribute("data-stagehand-style", token);
            styleEl.textContent = css;
            const host =
              document.head || document.documentElement || document.body;
            host?.appendChild(styleEl);
          } catch {
            // ignore
          }
        },
        { css: styleText, token },
      )
      .catch(() => {}),
  );
  await Promise.all(injections);

  return async () => {
    const removals = frames.map((frame) =>
      frame
        .evaluate((token) => {
          try {
            if (!document) return;
            document
              .querySelectorAll(`[data-stagehand-style="${token}"]`)
              .forEach((styleEl) => styleEl.remove());
          } catch {
            // ignore
          }
        }, token)
        .catch(() => {}),
    );
    await Promise.all(removals);
  };
}

/**
 * Freezes CSS animations and transitions in the given frames.
 *
 * First injects a stylesheet that zeroes animation/transition timing, then
 * walks `document.getAnimations()` in each frame: animations with a finite
 * iteration count are finished, everything else (including ones whose timing
 * cannot be read) is cancelled. Per-frame failures are ignored.
 *
 * @returns the cleanup that removes the injected stylesheet.
 */
export async function disableAnimations(
  frames: Frame[],
): Promise<ScreenshotCleanup> {
  const css = `
*,
*::before,
*::after {
  animation-delay: 0s !important;
  animation-duration: 0s !important;
  animation-iteration-count: 1 !important;
  animation-play-state: paused !important;
  transition-property: none !important;
  transition-duration: 0s !important;
  transition-delay: 0s !important;
}`;

  const removeStyle = await applyStyleToFrames(frames, css, "animations");

  const settled = frames.map((frame) =>
    frame
      .evaluate(() => {
        try {
          if (typeof document.getAnimations !== "function") return;
          for (const animation of document.getAnimations()) {
            try {
              const timing = animation.effect?.getComputedTiming?.();
              if (!timing || timing.iterations === Infinity) {
                animation.cancel?.();
              } else {
                animation.finish?.();
              }
            } catch {
              animation.cancel?.();
            }
          }
        } catch {
          // ignore
        }
      })
      .catch(() => {}),
  );
  await Promise.all(settled);

  return removeStyle;
}

/**
 * Makes the text caret transparent in editable and focused elements of the
 * given frames by injecting a stylesheet.
 *
 * @returns the cleanup that removes the injected stylesheet.
 */
export async function hideCaret(frames: Frame[]): Promise<ScreenshotCleanup> {
  const selectors = [
    "input",
    "textarea",
    "[contenteditable]",
    '[contenteditable=""]',
    '[contenteditable="true"]',
    '[contenteditable="plaintext-only"]',
    "*:focus",
  ];
  const caretCss = `\n${selectors.join(",\n")} {\n  caret-color: transparent !important;\n}`;

  return applyStyleToFrames(frames, caretCss, "caret");
}

/**
 * Covers the elements matched by `locators` with solid-colour overlay boxes.
 *
 * Steps:
 *  1. Resolve each locator to rectangles (sequentially, via
 *     `resolveMaskRects`) and group them by owning frame. A locator that fails
 *     or yields no rectangles is skipped.
 *  2. In each frame, append one absolutely positioned `<div>` per rectangle,
 *     tagged with a per-call `data-stagehand-mask` token.
 *  3. Return a cleanup that removes those overlays and undoes the changes made
 *     to the root elements.
 *
 * A rectangle may carry a `rootToken`; the overlay is then appended to the
 * element marked `data-stagehand-mask-root="<rootToken>"` instead of the
 * document root. NOTE(review): that attribute is not set in this function —
 * presumably the `resolveMaskRect` page script adds it; confirm there.
 *
 * @param locators elements to mask.
 * @param color    CSS colour assigned to each overlay's background.
 * @returns cleanup callback; a no-op when nothing could be resolved.
 */
export async function applyMaskOverlays(
  locators: Locator[],
  color: string,
): Promise<ScreenshotCleanup> {
  type MaskRectSpec = ScreenshotClip & { rootToken?: string | null };
  // Per frame: the rectangles to draw and the distinct root tokens seen, so
  // the cleanup knows which root elements to restore.
  const rectsByFrame = new Map<
    Frame,
    { rects: MaskRectSpec[]; rootTokens: Set<string> }
  >();

  // Unique per call so the cleanup only removes overlays created here.
  const token = `__v3_mask_${Date.now()}_${Math.random().toString(36).slice(2)}`;

  for (const locator of locators) {
    try {
      const info = await resolveMaskRects(locator, token);
      if (!info) continue;
      const entry = rectsByFrame.get(info.frame) ?? {
        rects: [],
        rootTokens: new Set<string>(),
      };
      entry.rects.push(...info.rects);
      for (const rect of info.rects) {
        if (rect.rootToken) entry.rootTokens.add(rect.rootToken);
      }
      rectsByFrame.set(info.frame, entry);
    } catch {
      // ignore individual locator failures
    }
  }

  if (rectsByFrame.size === 0) {
    return async () => {};
  }

  await Promise.all(
    Array.from(rectsByFrame.entries()).map(([frame, { rects }]) =>
      frame
        .evaluate(
          // Runs inside the page: everything it needs arrives via the argument.
          ({ rects, color, token }) => {
            try {
              const doc = document;
              if (!doc) return;
              for (const rect of rects) {
                const defaultRoot = doc.documentElement || doc.body;
                if (!defaultRoot) return;
                // Prefer the tagged root element; fall back to the document
                // root when the tag cannot be found.
                const root = rect.rootToken
                  ? doc.querySelector(
                      `[data-stagehand-mask-root="${rect.rootToken}"]`,
                    ) || defaultRoot
                  : defaultRoot;
                if (!root) continue;
                if (rect.rootToken) {
                  try {
                    // A statically positioned root is switched to `relative`
                    // (the overlay below uses absolute positioning). The
                    // previous inline value is stashed once in an attribute so
                    // the cleanup can restore it.
                    const style = window.getComputedStyle(root as Element);
                    if (style && style.position === "static") {
                      const rootEl = root as HTMLElement;
                      if (
                        !rootEl.hasAttribute("data-stagehand-mask-root-pos")
                      ) {
                        rootEl.setAttribute(
                          "data-stagehand-mask-root-pos",
                          rootEl.style.position || "",
                        );
                      }
                      rootEl.style.position = "relative";
                    }
                  } catch {
                    // ignore
                  }
                }
                // The overlay itself: opaque, non-interactive, on top.
                const el = doc.createElement("div");
                el.setAttribute("data-stagehand-mask", token);
                el.style.position = "absolute";
                el.style.left = `${rect.x}px`;
                el.style.top = `${rect.y}px`;
                el.style.width = `${rect.width}px`;
                el.style.height = `${rect.height}px`;
                el.style.backgroundColor = color;
                el.style.pointerEvents = "none";
                el.style.zIndex = "2147483647";
                el.style.opacity = "1";
                el.style.mixBlendMode = "normal";
                (root as Element).appendChild(el);
              }
            } catch {
              // ignore
            }
          },
          { rects, color, token },
        )
        .catch(() => {}),
    ),
  );

  // Cleanup: remove every overlay created above, then restore each tagged
  // root's inline position and strip the bookkeeping attributes.
  return async () => {
    await Promise.all(
      Array.from(rectsByFrame.entries()).map(([frame, { rootTokens }]) =>
        frame
          .evaluate(
            ({ token, rootTokens }) => {
              try {
                const doc = document;
                if (!doc) return;
                const nodes = doc.querySelectorAll(
                  `[data-stagehand-mask="${token}"]`,
                );
                nodes.forEach((node) => node.remove());
                for (const rootToken of rootTokens) {
                  const root = doc.querySelector(
                    `[data-stagehand-mask-root="${rootToken}"]`,
                  ) as HTMLElement | null;
                  if (!root) continue;
                  // Present only when the position was overridden above.
                  const prev = root.getAttribute(
                    "data-stagehand-mask-root-pos",
                  );
                  if (prev !== null) {
                    root.style.position = prev;
                    root.removeAttribute("data-stagehand-mask-root-pos");
                  }
                  root.removeAttribute("data-stagehand-mask-root");
                }
              } catch {
                // ignore
              }
            },
            // The Set is converted to an array before being passed to the page.
            { token, rootTokens: Array.from(rootTokens) },
          )
          .catch(() => {}),
      ),
    );
  };
}

/**
 * Resolves a locator to the rectangles that should be masked.
 *
 * Every node returned by `locator.resolveNodesForMask()` is measured in turn
 * and its remote object released afterwards, whether or not measuring
 * succeeded. Nodes that cannot be measured are skipped.
 *
 * @returns the locator's frame plus the collected rectangles, or `null` when
 *   nothing could be measured or resolution failed.
 */
async function resolveMaskRects(
  locator: Locator,
  maskToken: string,
): Promise<{
  frame: Frame;
  rects: Array<ScreenshotClip & { rootToken?: string | null }>;
} | null> {
  const frame = locator.getFrame();
  const { session } = frame;
  try {
    const handles: Array<{
      objectId: Protocol.Runtime.RemoteObjectId;
      nodeId: Protocol.DOM.NodeId | null;
    }> = await locator.resolveNodesForMask();
    const rects: Array<ScreenshotClip & { rootToken?: string | null }> = [];

    for (const handle of handles) {
      try {
        // A failure for one element must not abort the remaining ones.
        const measured = await resolveMaskRectForObject(
          session,
          handle.objectId,
          maskToken,
        ).catch(() => null);
        if (measured) rects.push(measured);
      } finally {
        await session
          .send<never>("Runtime.releaseObject", { objectId: handle.objectId })
          .catch(() => {});
      }
    }

    return rects.length > 0 ? { frame, rects } : null;
  } catch {
    return null;
  }
}

/**
 * Measures a single remote object by invoking the `resolveMaskRect` page
 * script on it with `maskToken` as its argument.
 *
 * @returns the rectangle (plus `rootToken` when the script supplied a
 *   non-empty string), or `null` when the script threw, returned nothing, or
 *   reported a non-finite or non-positive size.
 */
async function resolveMaskRectForObject(
  session: CDPSessionLike,
  objectId: Protocol.Runtime.RemoteObjectId,
  maskToken: string,
): Promise<(ScreenshotClip & { rootToken?: string | null }) | null> {
  const response = await session.send<Protocol.Runtime.CallFunctionOnResponse>(
    "Runtime.callFunctionOn",
    {
      objectId,
      functionDeclaration: screenshotScriptSources.resolveMaskRect,
      arguments: [{ value: maskToken }],
      returnByValue: true,
    },
  );
  if (response.exceptionDetails) return null;

  const measured = response.result.value as
    | (ScreenshotClip & { rootToken?: string | null })
    | null;
  if (!measured) return null;

  const { x, y, width, height } = measured;
  const allFinite = [x, y, width, height].every((n) => Number.isFinite(n));
  if (!allFinite || width <= 0 || height <= 0) return null;

  // Only a non-empty string counts as a root token.
  const { rootToken } = measured;
  const hasRootToken = typeof rootToken === "string" && rootToken !== "";
  return {
    x,
    y,
    width,
    height,
    rootToken: hasRootToken ? rootToken : undefined,
  };
}

/**
 * Runs the cleanups in reverse registration order, one at a time. Missing
 * entries are skipped, thenable results are awaited, and any error — thrown
 * or rejected — is swallowed so the remaining cleanups still run.
 */
export async function runScreenshotCleanups(
  cleanups: ScreenshotCleanup[],
): Promise<void> {
  let remaining = cleanups.length;
  while (remaining > 0) {
    remaining -= 1;
    const cleanup = cleanups[remaining];
    if (!cleanup) continue;
    try {
      const outcome = cleanup();
      const isThenable =
        Boolean(outcome) &&
        typeof (outcome as Promise<void>).then === "function";
      if (isThenable) {
        await outcome;
      }
    } catch {
      // ignore cleanup errors
    }
  }
}


================================================
FILE: packages/core/lib/v3/understudy/selectorResolver.ts
================================================
import type { Protocol } from "devtools-protocol";
import {
  locatorScriptBootstrap,
  locatorScriptGlobalRefs,
  type LocatorScriptName,
} from "../dom/build/locatorScripts.generated.js";
import { v3Logger } from "../logger.js";
import type { Frame } from "./frame.js";
import { executionContexts } from "./executionContextRegistry.js";

/**
 * A selector tagged with the engine that should evaluate it. As produced by
 * `FrameSelectorResolver.parseSelector`, `value` is the selector text with any
 * `css=` / `text=` / `xpath=` prefix removed.
 */
export type SelectorQuery =
  | { kind: "css"; value: string }
  | { kind: "text"; value: string }
  | { kind: "xpath"; value: string };

/**
 * Handle to a matched DOM node: its CDP remote object id and, when one is
 * available, its DOM node id.
 */
export interface ResolvedNode {
  objectId: Protocol.Runtime.RemoteObjectId;
  nodeId: Protocol.DOM.NodeId | null;
}

/** Options accepted by `FrameSelectorResolver.resolveAll`. */
export interface ResolveManyOptions {
  // Maximum number of matches to resolve. Omitted means no limit; a value of
  // zero or less makes resolveAll return an empty list.
  limit?: number;
}

export class FrameSelectorResolver {
  constructor(private readonly frame: Frame) {}

  /**
   * Classifies a raw selector string.
   *
   * - `text=...` → text query; one pair of matching surrounding quotes is
   *   stripped.
   * - `xpath=...`, or anything starting with "/" or "(" → XPath query.
   * - everything else → CSS query; an optional `css=` prefix is removed and
   *   `>>`-separated parts are joined with a single space.
   *
   * Prefixes are matched case-insensitively and the input is trimmed first.
   */
  public static parseSelector(raw: string): SelectorQuery {
    const input = raw.trim();

    if (/^text=/i.test(input)) {
      const body = input.replace(/^text=/i, "").trim();
      const isQuoted = ['"', "'"].some(
        (quote) => body.startsWith(quote) && body.endsWith(quote),
      );
      return { kind: "text", value: isQuoted ? body.slice(1, -1) : body };
    }

    const xpathLike =
      /^xpath=/i.test(input) || input.startsWith("/") || input.startsWith("(");
    if (xpathLike) {
      return { kind: "xpath", value: input.replace(/^xpath=/i, "") };
    }

    // Removing the prefix is a no-op when it is absent.
    const css = input.replace(/^css=/i, "");
    if (!css.includes(">>")) {
      return { kind: "css", value: css };
    }

    const flattened = css
      .split(">>")
      .map((segment) => segment.trim())
      .filter(Boolean)
      .join(" ");
    return { kind: "css", value: flattened };
  }

  /** Resolves the first match for the query, or `null` when there is none. */
  public async resolveFirst(
    query: SelectorQuery,
  ): Promise<ResolvedNode | null> {
    const firstIndex = 0;
    return this.resolveAtIndex(query, firstIndex);
  }

  /**
   * Resolves up to `limit` matches for the query, dispatching on its kind.
   * A non-positive limit or an unrecognised kind yields an empty list.
   */
  public async resolveAll(
    query: SelectorQuery,
    { limit = Infinity }: ResolveManyOptions = {},
  ): Promise<ResolvedNode[]> {
    if (limit <= 0) return [];

    const { kind, value } = query;
    if (kind === "css") return this.resolveCss(value, limit);
    if (kind === "text") return this.resolveText(value, limit);
    if (kind === "xpath") return this.resolveXPath(value, limit);
    return [];
  }

  /**
   * Counts the matches for the query, dispatching on its kind. An
   * unrecognised kind counts as zero.
   */
  public async count(query: SelectorQuery): Promise<number> {
    const { kind, value } = query;
    if (kind === "css") return this.countCss(value);
    if (kind === "text") return this.countText(value);
    if (kind === "xpath") return this.countXPath(value);
    return 0;
  }

  /**
   * Resolves the match at a zero-based position by resolving the first
   * `index + 1` matches and picking the last slot.
   *
   * @returns `null` for a negative or non-finite index, or when fewer matches
   *   exist.
   */
  public async resolveAtIndex(
    query: SelectorQuery,
    index: number,
  ): Promise<ResolvedNode | null> {
    const usableIndex = Number.isFinite(index) && index >= 0;
    if (!usableIndex) return null;

    const matches = await this.resolveAll(query, { limit: index + 1 });
    const hit = matches[index];
    return hit ?? null;
  }

  /**
   * Builds a self-invoking expression that first runs the locator bootstrap
   * script and then returns the result of calling the named locator function.
   *
   * @param args already-serialised argument source fragments; they are joined
   *   verbatim with ", ".
   */
  private buildLocatorInvocation(
    name: LocatorScriptName,
    args: string[],
  ): string {
    const fnRef = locatorScriptGlobalRefs[name];
    const argList = args.join(", ");
    return `(() => { ${locatorScriptBootstrap}; return ${fnRef}(${argList}); })()`;
  }

  /**
   * Resolves up to `limit` matches for a CSS selector, one index at a time.
   *
   * For each index the `resolveCssSelector` script is tried in an isolated
   * world named "v3-world". When it finds nothing, the
   * `resolveCssSelectorPierce` script is tried in the frame's main-world
   * context instead (presumably to reach into shadow roots — confirm against
   * the locator scripts). The first index where both come back empty ends the
   * search. The switch to the fallback is logged once per call.
   */
  private async resolveCss(
    selector: string,
    limit: number,
  ): Promise<ResolvedNode[]> {
    if (limit <= 0) return [];

    const session = this.frame.session;
    const isolatedWorld = await session.send<{
      executionContextId: Protocol.Runtime.ExecutionContextId;
    }>("Page.createIsolatedWorld", {
      frameId: this.frame.frameId,
      worldName: "v3-world",
    });
    const mainWorldCtx = await executionContexts.waitForMainWorld(
      session,
      this.frame.frameId,
      1000,
    );

    const selectorArg = JSON.stringify(selector);
    const matches: ResolvedNode[] = [];
    let fallbackAnnounced = false;

    for (let position = 0; position < limit; position += 1) {
      const scriptArgs = [selectorArg, String(position)];

      const isolatedHit = await this.evaluateElement(
        this.buildLocatorInvocation("resolveCssSelector", scriptArgs),
        isolatedWorld.executionContextId,
      );
      if (isolatedHit) {
        matches.push(isolatedHit);
        continue;
      }

      if (!fallbackAnnounced) {
        fallbackAnnounced = true;
        v3Logger({
          category: "locator",
          message: "css pierce-fallback",
          level: 2,
          auxiliary: {
            frameId: { value: String(this.frame.frameId), type: "string" },
            selector: { value: selector, type: "string" },
          },
        });
      }

      const piercedHit = await this.evaluateElement(
        this.buildLocatorInvocation("resolveCssSelectorPierce", scriptArgs),
        mainWorldCtx,
      );
      if (!piercedHit) break;
      matches.push(piercedHit);
    }

    return matches;
  }

  /**
   * Resolves up to `limit` matches for a text selector by calling the
   * `resolveTextSelector` script in the frame's main-world context once per
   * index, stopping at the first index that yields nothing.
   */
  private async resolveText(
    value: string,
    limit: number,
  ): Promise<ResolvedNode[]> {
    if (limit <= 0) return [];

    const { session, frameId } = this.frame;
    const mainWorldCtx = await executionContexts.waitForMainWorld(
      session,
      frameId,
      1000,
    );

    const textArg = JSON.stringify(value);
    const matches: ResolvedNode[] = [];
    let position = 0;
    while (position < limit) {
      const node = await this.evaluateElement(
        this.buildLocatorInvocation("resolveTextSelector", [
          textArg,
          String(position),
        ]),
        mainWorldCtx,
      );
      if (!node) break;
      matches.push(node);
      position += 1;
    }

    return matches;
  }

  /**
   * Resolves up to `limit` matches for an XPath expression by calling the
   * `resolveXPathMainWorld` script in the frame's main-world context once per
   * index, stopping at the first index that yields nothing.
   */
  private async resolveXPath(
    value: string,
    limit: number,
  ): Promise<ResolvedNode[]> {
    if (limit <= 0) return [];

    const { session, frameId } = this.frame;
    const mainWorldCtx = await executionContexts.waitForMainWorld(
      session,
      frameId,
      1000,
    );

    const xpathArg = JSON.stringify(value);
    const matches: ResolvedNode[] = [];
    let position = 0;
    while (position < limit) {
      const node = await this.evaluateElement(
        this.buildLocatorInvocation("resolveXPathMainWorld", [
          xpathArg,
          String(position),
        ]),
        mainWorldCtx,
      );
      if (!node) break;
      matches.push(node);
      position += 1;
    }

    return matches;
  }

  /**
   * Counts CSS matches two ways and reports the larger number: the
   * `countCssMatchesPrimary` script runs in an isolated world named
   * "v3-world", the `countCssMatchesPierce` script in the frame's main-world
   * context.
   */
  private async countCss(selector: string): Promise<number> {
    const session = this.frame.session;
    const selectorArg = JSON.stringify(selector);

    const isolatedWorld = await session.send<{
      executionContextId: Protocol.Runtime.ExecutionContextId;
    }>("Page.createIsolatedWorld", {
      frameId: this.frame.frameId,
      worldName: "v3-world",
    });
    const primaryCount = await this.evaluateCount(
      this.buildLocatorInvocation("countCssMatchesPrimary", [selectorArg]),
      isolatedWorld.executionContextId,
    );

    const mainWorldCtx = await executionContexts.waitForMainWorld(
      session,
      this.frame.frameId,
      1000,
    );
    const piercedCount = await this.evaluateCount(
      this.buildLocatorInvocation("countCssMatchesPierce", [selectorArg]),
      mainWorldCtx,
    );

    return Math.max(primaryCount, piercedCount);
  }

  /**
   * Count elements matching a text selector in this frame's main world.
   *
   * Invokes the injected `countTextMatches` locator function and reads the
   * `count` property of the by-value result. A page-side exception is logged
   * through `v3Logger` and reported as 0; a failure of the CDP call itself, or
   * a non-finite count, is also reported as 0.
   *
   * @param value Text to search for (passed to the page JSON-encoded).
   * @returns A non-negative integer count.
   */
  private async countText(value: string): Promise<number> {
    const { session, frameId } = this.frame;
    // 1000 is forwarded as the final argument (presumably a timeout in ms).
    const mainWorldId = await executionContexts.waitForMainWorld(
      session,
      frameId,
      1000,
    );

    const expression = this.buildLocatorInvocation("countTextMatches", [
      JSON.stringify(value),
    ]);

    try {
      const response = await session.send<Protocol.Runtime.EvaluateResponse>(
        "Runtime.evaluate",
        {
          expression,
          contextId: mainWorldId,
          returnByValue: true,
          awaitPromise: true,
        },
      );

      const failure = response.exceptionDetails;
      if (failure) {
        // Prefer the short exception text; otherwise fall back to whatever the
        // thrown object exposes.
        const reason =
          failure.text ??
          String(
            failure.exception?.description ?? failure.exception?.value ?? "",
          );
        v3Logger({
          category: "locator",
          message: "count text evaluate exception",
          level: 0,
          auxiliary: {
            frameId: { value: String(this.frame.frameId), type: "string" },
            selector: { value: value, type: "string" },
            exception: { value: reason, type: "string" },
          },
        });
        return 0;
      }

      const payload = (response.result.value ?? {}) as {
        count?: unknown;
      };
      const rawCount = payload.count;
      const count = typeof rawCount === "number" ? rawCount : Number(rawCount);
      return Number.isFinite(count) ? Math.max(0, Math.floor(count)) : 0;
    } catch {
      return 0;
    }
  }

  /**
   * Count elements matching an XPath expression in this frame's main world.
   *
   * Builds a `countXPathMatchesMainWorld` invocation and hands it to
   * `evaluateCount`, which performs the `Runtime.evaluate` call and coerces
   * the result to a non-negative integer (0 on any failure).
   *
   * @param value XPath expression (passed to the page JSON-encoded).
   * @returns A non-negative integer count.
   */
  private async countXPath(value: string): Promise<number> {
    const { session, frameId } = this.frame;

    // 1000 is forwarded as the final argument (presumably a timeout in ms).
    const mainWorldId = await executionContexts.waitForMainWorld(
      session,
      frameId,
      1000,
    );

    const expression = this.buildLocatorInvocation(
      "countXPathMatchesMainWorld",
      [JSON.stringify(value)],
    );

    return this.evaluateCount(expression, mainWorldId);
  }

  /**
   * Pair a remote object id with its DOM node id.
   *
   * Asks the browser for the node id via `DOM.requestNode`. If that request
   * fails for any reason the node id is reported as `null`, but the object id
   * is still returned, so this implementation never resolves to `null` itself.
   *
   * @param objectId Remote object handle of the element.
   * @returns `{ objectId, nodeId }`, with `nodeId` possibly `null`.
   */
  private async resolveFromObjectId(
    objectId: Protocol.Runtime.RemoteObjectId,
  ): Promise<ResolvedNode | null> {
    const session = this.frame.session;

    const requestNodeId = async (): Promise<Protocol.DOM.NodeId | null> => {
      const { nodeId: requested } = await session.send<{
        nodeId: Protocol.DOM.NodeId;
      }>("DOM.requestNode", { objectId });
      return requested ?? null;
    };

    // Best-effort: any failure while requesting the node maps to a null id.
    const nodeId = await requestNodeId().catch((): null => null);

    return { objectId, nodeId };
  }

  /**
   * Evaluate an expression that yields a count and normalise the result.
   *
   * The expression is run with `Runtime.evaluate` (by value, awaiting
   * promises) in the given execution context.
   *
   * @param expression JavaScript source to evaluate in the page.
   * @param contextId Execution context to evaluate in.
   * @returns The result floored to a non-negative integer, or 0 when the
   *   evaluation throws, the CDP call fails, or the value is not finite.
   */
  private async evaluateCount(
    expression: string,
    contextId: Protocol.Runtime.ExecutionContextId,
  ): Promise<number> {
    const session = this.frame.session;

    try {
      const response = await session.send<Protocol.Runtime.EvaluateResponse>(
        "Runtime.evaluate",
        {
          expression,
          contextId,
          returnByValue: true,
          awaitPromise: true,
        },
      );

      if (response.exceptionDetails) return 0;

      const raw = response.result.value;
      const count = typeof raw === "number" ? raw : Number(raw);
      return Number.isFinite(count) ? Math.max(0, Math.floor(count)) : 0;
    } catch {
      return 0;
    }
  }

  /**
   * Evaluate an expression that yields an element and resolve it to a node.
   *
   * The expression is run with `Runtime.evaluate` (by reference, awaiting
   * promises) in the given execution context; the resulting remote object id
   * is then passed to `resolveFromObjectId`.
   *
   * @param expression JavaScript source to evaluate in the page.
   * @param contextId Execution context to evaluate in.
   * @returns The resolved node, or `null` when the evaluation throws, the CDP
   *   call fails, or the result carries no remote object id.
   */
  private async evaluateElement(
    expression: string,
    contextId: Protocol.Runtime.ExecutionContextId,
  ): Promise<ResolvedNode | null> {
    const session = this.frame.session;

    try {
      const response = await session.send<Protocol.Runtime.EvaluateResponse>(
        "Runtime.evaluate",
        {
          expression,
          contextId,
          returnByValue: false,
          awaitPromise: true,
        },
      );

      if (response.exceptionDetails) return null;

      const handle = response.result.objectId;
      if (!handle) return null;

      return this.resolveFromObjectId(handle);
    } catch {
      return null;
    }
  }
}


================================================
FILE: packages/core/lib/v3/v3.ts
================================================
import fs from "fs";
import os from "os";
import path from "path";
import process from "process";
import { v7 as uuidv7 } from "uuid";
import { z } from "zod";
import {
  InferStagehandSchema,
  StagehandZodSchema,
  toJsonSchema,
} from "./zodCompat.js";
import { loadApiKeyFromEnv } from "../utils.js";
import { extractModelName } from "../modelUtils.js";
import { StagehandLogger, LoggerOptions } from "../logger.js";
import { ActCache } from "./cache/ActCache.js";
import { AgentCache } from "./cache/AgentCache.js";
import { CacheStorage } from "./cache/CacheStorage.js";
import { ActHandler } from "./handlers/actHandler.js";
import { ExtractHandler } from "./handlers/extractHandler.js";
import { ObserveHandler } from "./handlers/observeHandler.js";
import { V3AgentHandler } from "./handlers/v3AgentHandler.js";
import { V3CuaAgentHandler } from "./handlers/v3CuaAgentHandler.js";
import { CAPTCHA_CUA_SYSTEM_PROMPT_NOTE } from "./agent/utils/captchaSolver.js";
import { createBrowserbaseSession } from "./launch/browserbase.js";
import { launchLocalChrome } from "./launch/local.js";
import { LLMClient } from "./llm/LLMClient.js";
import { LLMProvider } from "./llm/LLMProvider.js";
import {
  bindInstanceLogger,
  unbindInstanceLogger,
  withInstanceLogContext,
} from "./logger.js";
import { cleanupLocalBrowser } from "./shutdown/cleanupLocal.js";
import { startShutdownSupervisor } from "./shutdown/supervisorClient.js";
import { resolveTools } from "./mcp/utils.js";
import {
  ActHandlerParams,
  ExtractHandlerParams,
  ObserveHandlerParams,
  AgentReplayStep,
  InitState,
  AgentCacheContext,
} from "./types/private/index.js";
import type {
  ShutdownSupervisorConfig,
  ShutdownSupervisorHandle,
} from "./types/private/shutdown.js";
import {
  AgentConfig,
  AgentExecuteCallbacks,
  AgentExecuteOptions,
  AgentStreamExecuteOptions,
  AgentResult,
  AVAILABLE_CUA_MODELS,
  LogLine,
  StagehandMetrics,
  Action,
  ActOptions,
  ActResult,
  defaultExtractSchema,
  ExtractOptions,
  HistoryEntry,
  ObserveOptions,
  pageTextSchema,
  V3FunctionName,
  AvailableModel,
  ClientOptions,
  ModelConfiguration,
  LocalBrowserLaunchOptions,
  V3Options,
  AnyPage,
  PatchrightPage,
  PlaywrightPage,
  PuppeteerPage,
  CuaModelRequiredError,
  StagehandInvalidArgumentError,
  StagehandNotInitializedError,
  MissingEnvironmentVariableError,
  StagehandInitError,
  AgentStreamResult,
} from "./types/public/index.js";
import { V3Context } from "./understudy/context.js";
import { Page } from "./understudy/page.js";
import { resolveModel } from "../modelUtils.js";
import { StagehandAPIClient } from "./api.js";
import { validateExperimentalFeatures } from "./agent/utils/validateExperimentalFeatures.js";
import { flattenVariables } from "./agent/utils/variables.js";
import { FlowLogger, type FlowLoggerContext } from "./flowlogger/FlowLogger.js";
import { EventEmitterWithWildcardSupport } from "./flowlogger/EventEmitter.js";
import { EventStore } from "./flowlogger/EventStore.js";
import { createTimeoutGuard } from "./handlers/handlerUtils/timeoutGuard.js";
import { ActTimeoutError } from "./types/public/sdkErrors.js";

// Model used by resolveModelConfiguration() when the caller supplies no model.
const DEFAULT_MODEL_NAME = "openai/gpt-4.1-mini";
// Viewport applied by V3.init() to local launches that do not configure one.
const DEFAULT_VIEWPORT = { width: 1288, height: 711 };
// NOTE(review): not referenced in this part of the file; presumably the
// per-tool timeout (in ms) for agent tool calls — confirm at the usage site.
const DEFAULT_AGENT_TOOL_TIMEOUT_MS = 45000;

/**
 * Normalised form of `V3Options["model"]`: the model name plus any
 * provider-client options that accompanied it.
 */
type ResolvedModelConfiguration = {
  modelName: AvailableModel;
  clientOptions?: ClientOptions;
};

/**
 * Normalise the `model` option into a model name plus optional client options.
 *
 * - A falsy value (nothing configured) selects `DEFAULT_MODEL_NAME`.
 * - A string is taken as the model name verbatim.
 * - An object is split into its `modelName` and the remaining properties,
 *   which become the client options.
 * - Any other runtime type falls back to `DEFAULT_MODEL_NAME`.
 *
 * @param model The `model` value from `V3Options`.
 * @returns The resolved model name and, for object input, client options.
 * @throws StagehandInvalidArgumentError when an object is given without a
 *   `modelName`.
 */
function resolveModelConfiguration(
  model?: V3Options["model"],
): ResolvedModelConfiguration {
  const useDefault = (): ResolvedModelConfiguration => ({
    modelName: DEFAULT_MODEL_NAME,
  });

  if (!model) return useDefault();

  switch (typeof model) {
    case "string":
      return { modelName: model as AvailableModel };

    case "object": {
      const { modelName, ...clientOptions } = model;
      if (!modelName) {
        throw new StagehandInvalidArgumentError(
          "model.modelName is required when providing client options.",
        );
      }
      return {
        modelName,
        clientOptions: clientOptions as ClientOptions,
      };
    }

    default:
      return useDefault();
  }
}

/**
 * V3
 *
 * Purpose:
 * A high-level orchestrator for Stagehand V3. Abstracts away whether the browser
 * runs **locally via Chrome** or remotely on **Browserbase**, and exposes simple
 * entrypoints (`act`, `extract`, `observe`) that delegate to the corresponding
 * handler classes.
 *
 * Responsibilities:
 * - Bootstraps Chrome or Browserbase, ensures a working CDP WebSocket, and builds a `V3Context`.
 * - Manages lifecycle: init, context access, cleanup.
 * - Bridges external page objects (Playwright/Puppeteer) into internal frameIds for handlers.
 * - Provides a stable API surface for downstream code regardless of runtime environment.
 */
export class V3 {
  // Options passed to the constructor, kept for later lookups.
  private readonly opts: V3Options;
  // Launch state; starts UNINITIALIZED and is replaced by init().
  private state: InitState = { kind: "UNINITIALIZED" };
  // Handlers and CDP context are created by init(); null until then.
  private actHandler: ActHandler | null = null;
  private extractHandler: ExtractHandler | null = null;
  private observeHandler: ObserveHandler | null = null;
  private ctx: V3Context | null = null;
  // Default LLM client: either the caller-supplied one or one obtained from
  // llmProvider in the constructor.
  public llmClient!: LLMClient;

  /**
   * Event bus for internal communication.
   * Emits events like 'screenshot' when screenshots are captured during agent execution.
   */
  public readonly bus: EventEmitterWithWildcardSupport =
    new EventEmitterWithWildcardSupport();
  // Default model name and client options resolved from opts.model.
  private modelName: AvailableModel;
  private modelClientOptions: ClientOptions;
  private llmProvider: LLMProvider;
  // Clients created for per-call model overrides, keyed by the JSON of the
  // model name and merged client options (see resolveLlmClient).
  private overrideLlmClients: Map<string, LLMClient> = new Map();
  // Copied from opts.domSettleTimeout.
  private readonly domSettleTimeoutMs?: number;
  // NOTE(review): not read in this part of the file; presumably guards against
  // re-entrant close() — confirm at the usage site.
  private _isClosing = false;
  // Browserbase session metadata; exposed through the getters below.
  public browserbaseSessionId?: string;
  private browserbaseSessionUrl?: string;
  private browserbaseDebugUrl?: string;
  /** Alias for `browserbaseSessionId` using the upper-case `ID` spelling. */
  public get browserbaseSessionID(): string | undefined {
    return this.browserbaseSessionId;
  }
  /** Read-only access to the private `browserbaseSessionUrl` field. */
  public get browserbaseSessionURL(): string | undefined {
    return this.browserbaseSessionUrl;
  }
  /** Read-only access to the private `browserbaseDebugUrl` field. */
  public get browserbaseDebugURL(): string | undefined {
    return this.browserbaseDebugUrl;
  }
  /**
   * Returns true if the browser is running on Browserbase, i.e. the current
   * init state is of kind "BROWSERBASE". This reflects the live state rather
   * than the requested `opts.env`, so it is false before initialization.
   */
  public get isBrowserbase(): boolean {
    return this.state.kind === "BROWSERBASE";
  }

  /**
   * Whether Browserbase captcha auto-solving is in effect.
   *
   * Always false when not running on Browserbase. On Browserbase it is true
   * unless `browserSettings.solveCaptchas` was explicitly set to `false`.
   */
  public get isCaptchaAutoSolveEnabled(): boolean {
    if (!this.isBrowserbase) return false;

    const browserSettings =
      this.opts.browserbaseSessionCreateParams?.browserSettings;
    return browserSettings?.solveCaptchas !== false;
  }

  /**
   * Whether `advancedStealth` was explicitly enabled (strictly `true`) in the
   * Browserbase browser settings. The current environment is not consulted.
   */
  public get isAdvancedStealth(): boolean {
    const browserSettings =
      this.opts.browserbaseSessionCreateParams?.browserSettings;
    return browserSettings?.advancedStealth === true;
  }

  /**
   * Viewport dimensions taken from the launch options.
   *
   * For `env === "BROWSERBASE"` the Browserbase browser settings are
   * consulted; otherwise the local browser launch options are. Width and
   * height fall back independently to 1288 and 711 when not configured.
   */
  public get configuredViewport(): { width: number; height: number } {
    const fallbackWidth = 1288;
    const fallbackHeight = 711;

    const viewport =
      this.opts.env === "BROWSERBASE"
        ? this.opts.browserbaseSessionCreateParams?.browserSettings?.viewport
        : this.opts.localBrowserLaunchOptions?.viewport; // LOCAL env

    return {
      width: viewport?.width ?? fallbackWidth,
      height: viewport?.height ?? fallbackHeight,
    };
  }

  /**
   * Handler registered for CDP transport closure. On Browserbase it first
   * kicks off a (non-awaited) session status log, then always triggers an
   * immediate shutdown whose failures are ignored.
   */
  private _onCdpClosed = (why: string) => {
    const onBrowserbase = this.state.kind === "BROWSERBASE";
    if (onBrowserbase) {
      void this._logBrowserbaseSessionStatus();
    }

    // This is the one place that reacts to the transport going away.
    const shutdown = this._immediateShutdown(`CDP transport closed: ${why}`);
    shutdown.catch(() => {});
  };
  // Feature flags copied from the constructor options (each defaults to
  // false). disableAPI is additionally forced to true when a custom llmClient
  // is supplied.
  public readonly experimental: boolean = false;
  public readonly logInferenceToFile: boolean = false;
  public readonly disableAPI: boolean = false;
  // Caller-supplied logger (opts.logger), if any.
  private externalLogger?: (logLine: LogLine) => void;
  // Verbosity level; opts.verbose, defaulting to 1.
  public verbose: 0 | 1 | 2 = 1;
  // Per-instance logger created in the constructor.
  private stagehandLogger: StagehandLogger;
  // Entries appended by addToHistory(); read through the `history` getter.
  private _history: Array<HistoryEntry> = [];
  // instanceId is a fresh UUIDv7; sessionId is opts.sessionId or, failing
  // that, the instanceId.
  private readonly instanceId: string;
  private readonly sessionId: string;
  // Flow-logging plumbing wired up at the end of the constructor.
  public readonly eventStore: EventStore;
  public readonly flowLoggerContext: FlowLoggerContext;
  // NOTE(review): not read in this part of the file; presumably records that
  // process-level handlers were installed once — confirm at the usage site.
  private static _processGuardsInstalled = false;
  // Every constructed instance registers itself here.
  private static _instances: Set<V3> = new Set();
  // Cache storage and the act/agent caches built on top of it.
  private cacheStorage: CacheStorage;
  private actCache: ActCache;
  private agentCache: AgentCache;
  // When non-null, the `metrics` getter fetches metrics through this client.
  private apiClient: StagehandAPIClient | null = null;
  // opts.keepAlive, falling back to browserbaseSessionCreateParams.keepAlive.
  private keepAlive?: boolean;
  // Handle returned by startShutdownSupervisor(); cleared by
  // stopShutdownSupervisor().
  private shutdownSupervisor: ShutdownSupervisorHandle | null = null;

  /**
   * Locally accumulated token and inference-time counters, grouped per
   * function (act / extract / observe / agent) plus running totals.
   * Incremented by updateMetrics() and returned by the `metrics` getter when
   * no API client is set (or when fetching from the API fails).
   */
  public stagehandMetrics: StagehandMetrics = {
    actPromptTokens: 0,
    actCompletionTokens: 0,
    actReasoningTokens: 0,
    actCachedInputTokens: 0,
    actInferenceTimeMs: 0,
    extractPromptTokens: 0,
    extractCompletionTokens: 0,
    extractReasoningTokens: 0,
    extractCachedInputTokens: 0,
    extractInferenceTimeMs: 0,
    observePromptTokens: 0,
    observeCompletionTokens: 0,
    observeReasoningTokens: 0,
    observeCachedInputTokens: 0,
    observeInferenceTimeMs: 0,
    agentPromptTokens: 0,
    agentCompletionTokens: 0,
    agentReasoningTokens: 0,
    agentCachedInputTokens: 0,
    agentInferenceTimeMs: 0,
    totalPromptTokens: 0,
    totalCompletionTokens: 0,
    totalReasoningTokens: 0,
    totalCachedInputTokens: 0,
    totalInferenceTimeMs: 0,
  };

  /**
   * Configure a V3 instance. No browser is launched here; that happens in
   * `init()`.
   *
   * Work done, in order:
   *  - set up logging (per-instance StagehandLogger plus the instance-bound
   *    logger used by `v3Logger()`);
   *  - resolve the default model and its client options;
   *  - pick the default LLM client: the caller's `opts.llmClient` (which also
   *    forces `disableAPI` to true) or one obtained from the LLM provider;
   *  - build cache storage and the act/agent caches;
   *  - wire the flow-logging event store onto the instance bus;
   *  - register the instance in the static instance set.
   *
   * @param opts Stagehand V3 options.
   * @throws Rethrows any error raised while loading the API key from the
   *   environment, and whatever `resolveModelConfiguration` throws for an
   *   invalid `opts.model`.
   */
  constructor(opts: V3Options) {
    this.externalLogger = opts.logger;
    this.verbose = opts.verbose ?? 1;
    this.instanceId = uuidv7();
    this.sessionId = opts.sessionId ?? this.instanceId;
    this.keepAlive =
      opts.keepAlive ?? opts.browserbaseSessionCreateParams?.keepAlive;

    // Create per-instance StagehandLogger (handles usePino, verbose, externalLogger)
    // This gives each V3 instance independent logger configuration
    // while still sharing the underlying Pino worker thread via StagehandLogger.sharedPinoLogger
    const loggerOptions: LoggerOptions = {
      pretty: true,
      level: "info", // Most permissive - filtering happens at instance level
    };

    if (opts.disablePino !== undefined) {
      loggerOptions.usePino = !opts.disablePino;
    }

    this.stagehandLogger = new StagehandLogger(loggerOptions, opts.logger);
    this.stagehandLogger.setVerbosity(this.verbose);

    // Also bind to AsyncLocalStorage for v3Logger() calls from handlers
    // This maintains backward compatibility with code that uses v3Logger() directly
    try {
      if (this.externalLogger) {
        // Use external logger directly when provided
        bindInstanceLogger(this.instanceId, this.externalLogger);
      } else {
        // Fall back to stagehandLogger when no external logger
        bindInstanceLogger(this.instanceId, (line) => {
          this.stagehandLogger.log(line);
        });
      }
    } catch {
      // ignore
    }
    const { modelName, clientOptions } = resolveModelConfiguration(opts.model);
    this.modelName = modelName;
    this.experimental = opts.experimental ?? false;
    this.logInferenceToFile = opts.logInferenceToFile ?? false;
    this.llmProvider = new LLMProvider(this.logger);
    this.domSettleTimeoutMs = opts.domSettleTimeout;
    this.disableAPI = opts.disableAPI ?? false;

    const baseClientOptions: ClientOptions = clientOptions
      ? ({ ...clientOptions } as ClientOptions)
      : ({} as ClientOptions);
    if (opts.llmClient) {
      // A caller-supplied client is used as-is and implies API mode is off.
      this.llmClient = opts.llmClient;
      this.modelClientOptions = baseClientOptions;
      this.disableAPI = true;
    } else {
      // Ensure API key is set
      let apiKey = (baseClientOptions as { apiKey?: string }).apiKey;
      if (!apiKey) {
        try {
          apiKey = loadApiKeyFromEnv(
            this.modelName.split("/")[0], // "openai", "anthropic", etc
            this.logger,
          );
        } catch (error) {
          // The error is rethrown below, so the log must not claim that
          // construction carries on.
          this.logger({
            category: "init",
            message: `Error loading API key for model ${this.modelName}: ${error}. Aborting initialization.`,
            level: 0,
          });
          throw error;
        }
      }
      this.modelClientOptions = {
        ...baseClientOptions,
        apiKey,
      } as ClientOptions;

      // Get the default client for this model
      this.llmClient = this.llmProvider.getClient(
        this.modelName,
        this.modelClientOptions,
        { experimental: this.experimental, disableAPI: this.disableAPI },
      );
    }

    this.cacheStorage = CacheStorage.create(opts.cacheDir, this.logger, {
      label: "cache directory",
    });
    // The caches receive accessors rather than values because the handlers
    // and context they need do not exist until init() runs.
    this.actCache = new ActCache({
      storage: this.cacheStorage,
      logger: this.logger,
      getActHandler: () => this.actHandler,
      getDefaultLlmClient: () => this.resolveLlmClient(),
      domSettleTimeoutMs: this.domSettleTimeoutMs,
    });
    this.agentCache = new AgentCache({
      storage: this.cacheStorage,
      logger: this.logger,
      getActHandler: () => this.actHandler,
      getContext: () => this.ctx,
      getDefaultLlmClient: () => this.resolveLlmClient(),
      getBaseModelName: () => this.modelName,
      getSystemPrompt: () => opts.systemPrompt,
      domSettleTimeoutMs: this.domSettleTimeoutMs,
      act: this.act.bind(this),
    });

    this.opts = opts;

    // FlowLogger always gets a per-instance session context and shared event
    // bus. The attached EventStore decides which sinks are active:
    // `BROWSERBASE_FLOW_LOGS=1` enables pretty stderr output,
    // and `BROWSERBASE_CONFIG_DIR` enables the pretty/jsonl file sinks for this session.
    this.eventStore = new EventStore(this.sessionId, opts);
    this.flowLoggerContext = FlowLogger.init(this.sessionId, this.bus);
    // Flow event pipeline:
    // FlowLogger -> this.bus -> this.eventStore -> configured sinks/query history.
    // V3 owns the bus for this session. EventStore is not another bus; it just
    // receives already-emitted FlowEvents here, then fans them out to sinks and
    // keeps the queryable per-session history used by /v4/log, parent/ancestor lookups, and tests.
    // `on()` stores a strong reference to the handler, so the EventStore
    // stays alive until this bus is garbage-collected with the rest of the V3
    // object graph.
    this.bus.on("*", this.eventStore.emit);

    // Track instance for global process guard handling
    V3._instances.add(this);
  }
  /**
   * Metrics as a promise, so callers can write `await v3.metrics`.
   *
   * Without an API client the locally accumulated metrics are returned. With
   * one, metrics are fetched from the API; if that fetch fails the failure is
   * logged and the local metrics are returned instead.
   */
  public get metrics(): Promise<StagehandMetrics> {
    const client = this.apiClient;
    if (!client) {
      // Local mode: wrap in a promise so both paths have the same shape.
      return Promise.resolve(this.stagehandMetrics);
    }

    return client.getReplayMetrics().catch((error) => {
      this.logger({
        category: "metrics",
        message: `Failed to fetch metrics from API: ${error}`,
        level: 0,
      });
      // The API is unavailable, so report what was counted locally.
      return this.stagehandMetrics;
    });
  }

  /**
   * Pick the LLM client for an optional per-call model override.
   *
   * The default client is returned when no override is given, or when the
   * override names the default model and carries no client options.
   * Otherwise a client is looked up in (or created and added to) the
   * override cache. Options for the new client are the default client
   * options (only if the override uses the same provider prefix as the
   * default model) overlaid with the override's own options; a missing
   * `apiKey` is filled from the environment when one is available.
   *
   * @param model Model name, or an object with `modelName` plus client options.
   * @returns The LLM client to use.
   */
  private resolveLlmClient(model?: ModelConfiguration): LLMClient {
    if (!model) {
      return this.llmClient;
    }

    let requestedName: AvailableModel | string;
    let overrides: ClientOptions | undefined;

    if (typeof model !== "string") {
      const { modelName: nameFromConfig, ...remaining } = model;
      requestedName = nameFromConfig;
      overrides = remaining as ClientOptions;
    } else {
      requestedName = model;
    }

    const hasOverrides =
      overrides !== undefined && Object.keys(overrides).length > 0;
    if (requestedName === this.modelName && !hasOverrides) {
      return this.llmClient;
    }

    // The provider is the part of the model name before the first "/".
    const requestedProvider = String(requestedName).split("/")[0];
    const defaultProvider = String(this.modelName).split("/")[0];

    // Default client options are only meaningful for the same provider.
    const inherited =
      requestedProvider === defaultProvider ? this.modelClientOptions : {};
    const effectiveOptions = {
      ...inherited,
      ...(overrides ?? {}),
    } as ClientOptions;

    const withKey = effectiveOptions as { apiKey?: string };
    if (!withKey.apiKey) {
      const envKey = loadApiKeyFromEnv(requestedProvider, this.logger);
      if (envKey) {
        withKey.apiKey = envKey;
      }
    }

    const cacheKey = JSON.stringify({
      modelName: requestedName,
      clientOptions: effectiveOptions,
    });

    const existing = this.overrideLlmClients.get(cacheKey);
    if (existing) {
      return existing;
    }

    const created = this.llmProvider.getClient(
      requestedName as AvailableModel,
      effectiveOptions,
      { experimental: this.experimental, disableAPI: this.disableAPI },
    );
    this.overrideLlmClients.set(cacheKey, created);
    return created;
  }

  /** Start recording agent replay steps; delegates to the agent cache. */
  private beginAgentReplayRecording(): void {
    this.agentCache.beginRecording();
  }

  /**
   * End the current agent replay recording; delegates to the agent cache.
   *
   * @returns The steps returned by the agent cache's `endRecording()`.
   */
  private endAgentReplayRecording(): AgentReplayStep[] {
    return this.agentCache.endRecording();
  }

  /** Discard the current agent replay recording; delegates to the agent cache. */
  private discardAgentReplayRecording(): void {
    this.agentCache.discardRecording();
  }

  /** Whether the agent cache reports that a replay recording is in progress. */
  private isAgentReplayRecording(): boolean {
    return this.agentCache.isRecording();
  }

  /** Whether the agent cache reports that a replay is currently active. */
  public isAgentReplayActive(): boolean {
    return this.agentCache.isReplayActive();
  }

  /**
   * Hand a replay step to the agent cache for recording.
   *
   * @param step The step to record.
   */
  public recordAgentReplayStep(step: AgentReplayStep): void {
    this.agentCache.recordStep(step);
  }

  /**
   * History as a promise, so callers can write `await v3.history`.
   * Resolves to a frozen shallow copy, so the internal list cannot be
   * modified through the returned array.
   */
  public get history(): Promise<ReadonlyArray<HistoryEntry>> {
    const snapshot = Object.freeze(this._history.slice());
    return Promise.resolve(snapshot);
  }

  /**
   * Append an entry to the call history.
   *
   * @param method Name of the method that was called.
   * @param parameters Parameters the method was called with.
   * @param result Result of the call; stored as `null` when null/undefined.
   */
  public addToHistory(
    method: HistoryEntry["method"],
    parameters: unknown,
    result?: unknown,
  ): void {
    // Stamp the entry with the time it was recorded, as an ISO-8601 string.
    const recordedAt = new Date().toISOString();
    const storedResult = result ?? null;

    this._history.push({
      method,
      parameters,
      result: storedResult,
      timestamp: recordedAt,
    });
  }

  /**
   * Add one inference's usage to the per-function counters and to the totals.
   *
   * A `functionName` other than ACT, EXTRACT, OBSERVE or AGENT touches no
   * per-function counter but still contributes to the totals.
   *
   * @param functionName Which function the usage belongs to.
   * @param promptTokens Prompt tokens consumed.
   * @param completionTokens Completion tokens produced.
   * @param reasoningTokens Reasoning tokens consumed.
   * @param cachedInputTokens Input tokens served from cache.
   * @param inferenceTimeMs Inference time in milliseconds.
   */
  public updateMetrics(
    functionName: V3FunctionName,
    promptTokens: number,
    completionTokens: number,
    reasoningTokens: number,
    cachedInputTokens: number,
    inferenceTimeMs: number,
  ): void {
    const counters = this.stagehandMetrics;

    if (functionName === V3FunctionName.ACT) {
      counters.actPromptTokens += promptTokens;
      counters.actCompletionTokens += completionTokens;
      counters.actReasoningTokens += reasoningTokens;
      counters.actCachedInputTokens += cachedInputTokens;
      counters.actInferenceTimeMs += inferenceTimeMs;
    } else if (functionName === V3FunctionName.EXTRACT) {
      counters.extractPromptTokens += promptTokens;
      counters.extractCompletionTokens += completionTokens;
      counters.extractReasoningTokens += reasoningTokens;
      counters.extractCachedInputTokens += cachedInputTokens;
      counters.extractInferenceTimeMs += inferenceTimeMs;
    } else if (functionName === V3FunctionName.OBSERVE) {
      counters.observePromptTokens += promptTokens;
      counters.observeCompletionTokens += completionTokens;
      counters.observeReasoningTokens += reasoningTokens;
      counters.observeCachedInputTokens += cachedInputTokens;
      counters.observeInferenceTimeMs += inferenceTimeMs;
    } else if (functionName === V3FunctionName.AGENT) {
      counters.agentPromptTokens += promptTokens;
      counters.agentCompletionTokens += completionTokens;
      counters.agentReasoningTokens += reasoningTokens;
      counters.agentCachedInputTokens += cachedInputTokens;
      counters.agentInferenceTimeMs += inferenceTimeMs;
    }

    this.updateTotalMetrics(
      promptTokens,
      completionTokens,
      reasoningTokens,
      cachedInputTokens,
      inferenceTimeMs,
    );
  }

  /**
   * Add one inference's usage to the `total*` counters.
   *
   * @param promptTokens Prompt tokens consumed.
   * @param completionTokens Completion tokens produced.
   * @param reasoningTokens Reasoning tokens consumed.
   * @param cachedInputTokens Input tokens served from cache.
   * @param inferenceTimeMs Inference time in milliseconds.
   */
  private updateTotalMetrics(
    promptTokens: number,
    completionTokens: number,
    reasoningTokens: number,
    cachedInputTokens: number,
    inferenceTimeMs: number,
  ): void {
    const totals = this.stagehandMetrics;
    totals.totalPromptTokens += promptTokens;
    totals.totalCompletionTokens += completionTokens;
    totals.totalReasoningTokens += reasoningTokens;
    totals.totalCachedInputTokens += cachedInputTokens;
    totals.totalInferenceTimeMs += inferenceTimeMs;
  }

  /**
   * Log the shutdown reason and force-close this instance.
   *
   * Never rejects: failures from logging and from `close()` are swallowed.
   * Logging is isolated from the close call so that a logger that throws
   * cannot prevent resources from being released.
   *
   * @param reason Human-readable cause, included in both log lines.
   */
  private async _immediateShutdown(reason: string): Promise<void> {
    // Logging here is best-effort; it must never abort the shutdown.
    const logBestEffort = (message: string): void => {
      try {
        this.logger({
          category: "v3",
          message,
          level: 0,
        });
      } catch {
        // ignore logging failures
      }
    };

    logBestEffort(`initiating shutdown → ${reason}`);
    logBestEffort(`closing resources → ${reason}`);

    try {
      await this.close({ force: true });
    } catch {
      // swallow — already shutting down
    }
  }

  /**
   * Spawn a crash-only supervisor that cleans up when this process dies.
   *
   * Idempotent: if a supervisor handle is already held it is returned and no
   * new supervisor is started. Errors reported by the supervisor are logged
   * (logging failures themselves are ignored).
   *
   * @param config Supervisor configuration.
   * @returns The stored supervisor handle, which may be `null`.
   */
  private startShutdownSupervisor(
    config: ShutdownSupervisorConfig,
  ): ShutdownSupervisorHandle | null {
    const existing = this.shutdownSupervisor;
    if (existing) return existing;

    const handle = startShutdownSupervisor(config, {
      onError: (error, context) => {
        try {
          const message =
            "Shutdown supervisor unavailable; crash cleanup disabled. " +
            "If this process exits unexpectedly, local Chrome or Browserbase " +
            "sessions may remain running even with keepAlive=false.";
          this.logger({
            category: "v3",
            message,
            level: 0,
            auxiliary: {
              context: { value: context, type: "string" },
              error: { value: error.message, type: "string" },
            },
          });
        } catch {
          // ignore logging failures
        }
      },
    });

    this.shutdownSupervisor = handle;
    return handle;
  }

  /**
   * Stop the supervisor during a normal shutdown. Does nothing when no
   * supervisor is held; otherwise the handle is cleared even if stopping it
   * throws.
   */
  private stopShutdownSupervisor(): void {
    const supervisor = this.shutdownSupervisor;
    if (!supervisor) return;

    try {
      supervisor.stop();
    } catch {
      // best-effort
    }

    this.shutdownSupervisor = null;
  }

  /**
   * Entrypoint: initializes handlers, launches Chrome or Browserbase,
   * and sets up a CDP context.
   */
  async init(): Promise<void> {
    try {
      return await withInstanceLogContext(this.instanceId, async () => {
        this.actHandler = new ActHandler(
          this.llmClient,
          this.modelName,
          this.modelClientOptions,
          (model) => this.resolveLlmClient(model),
          this.opts.systemPrompt ?? "",
          this.logInferenceToFile,
          this.opts.selfHeal ?? true,
          (
            functionName,
            promptTokens,
            completionTokens,
            reasoningTokens,
            cachedInputTokens,
            inferenceTimeMs,
          ) =>
            this.updateMetrics(
              functionName,
              promptTokens,
              completionTokens,
              reasoningTokens,
              cachedInputTokens,
              inferenceTimeMs,
            ),
          this.domSettleTimeoutMs,
        );
        this.extractHandler = new ExtractHandler(
          this.llmClient,
          this.modelName,
          this.modelClientOptions,
          (model) => this.resolveLlmClient(model),
          this.opts.systemPrompt ?? "",
          this.logInferenceToFile,
          this.experimental,
          (
            functionName,
            promptTokens,
            completionTokens,
            reasoningTokens,
            cachedInputTokens,
            inferenceTimeMs,
          ) =>
            this.updateMetrics(
              functionName,
              promptTokens,
              completionTokens,
              reasoningTokens,
              cachedInputTokens,
              inferenceTimeMs,
            ),
        );
        this.observeHandler = new ObserveHandler(
          this.llmClient,
          this.modelName,
          this.modelClientOptions,
          (model) => this.resolveLlmClient(model),
          this.opts.systemPrompt ?? "",
          this.logInferenceToFile,
          this.experimental,
          (
            functionName,
            promptTokens,
            completionTokens,
            reasoningTokens,
            cachedInputTokens,
            inferenceTimeMs,
          ) =>
            this.updateMetrics(
              functionName,
              promptTokens,
              completionTokens,
              reasoningTokens,
              cachedInputTokens,
              inferenceTimeMs,
            ),
        );
        if (this.opts.env === "LOCAL") {
          // chrome-launcher conditionally adds --headless when the environment variable
          // HEADLESS is set, without parsing its value.
          // if it is not equal to true, then we delete it from the process
          const envHeadless = process.env.HEADLESS;
          if (envHeadless !== undefined) {
            const normalized = envHeadless.trim().toLowerCase();
            if (normalized !== "true") {
              delete process.env.HEADLESS;
            }
          }
          const lbo: LocalBrowserLaunchOptions =
            this.opts.localBrowserLaunchOptions ?? {};

          if (lbo.cdpHeaders && !lbo.cdpUrl) {
            this.logger({
              category: "init",
              message:
                "`cdpHeaders` was provided but `cdpUrl` is not set — cdpHeaders will be ignored. Set `cdpUrl` to connect to an existing browser via CDP.",
              level: 2,
            });
          }

          // If a CDP URL is provided, attach instead of launching.
          if (lbo.cdpUrl) {
            this.logger({
              category: "init",
              message: "Connecting to local browser",
              level: 1,
            });
            this.ctx = await V3Context.create(lbo.cdpUrl, {
              env: "LOCAL",
              cdpHeaders: lbo.cdpHeaders,
            });
            this.ctx.conn.flowLoggerContext = this.flowLoggerContext;
            this.ctx.conn.onTransportClosed(this._onCdpClosed);
            this.state = {
              kind: "LOCAL",
              // no LaunchedChrome when attaching externally; create a stub kill
              chrome: {
                kill: async () => {},
              } as unknown as import("chrome-launcher").LaunchedChrome,
              ws: lbo.cdpUrl,
            };
            this.resetBrowserbaseSessionMetadata();
            // Post-connect settings (downloads and viewport) if provided
            await this._applyPostConnectLocalOptions(lbo);
            return;
          }
          this.logger({
            category: "init",
            message: "Launching local browser",
            level: 1,
          });

          // Determine or create user data dir
          let userDataDir = lbo.userDataDir;
          let createdTemp = false;
          if (!userDataDir) {
            const base = path.join(os.tmpdir(), "stagehand-v3");
            fs.mkdirSync(base, { recursive: true });
            userDataDir = fs.mkdtempSync(path.join(base, "profile-"));
            createdTemp = true;
          }

          // Build chrome flags
          const defaults = [
            "--remote-allow-origins=*",
            "--no-first-run",
            "--no-default-browser-check",
            "--disable-dev-shm-usage",
            "--site-per-process",
          ];
          let chromeFlags: string[];
          const ignore = lbo.ignoreDefaultArgs;
          if (ignore === true) {
            // drop defaults
            chromeFlags = [];
          } else if (Array.isArray(ignore)) {
            chromeFlags = defaults.filter(
              (f) => !ignore.some((ex) => f.includes(ex)),
            );
          } else {
            chromeFlags = [...defaults];
          }

          // headless handled by launchLocalChrome
          if (lbo.devtools) chromeFlags.push("--auto-open-devtools-for-tabs");
          if (lbo.locale) chromeFlags.push(`--lang=${lbo.locale}`);
          if (!lbo.viewport) {
            lbo.viewport = DEFAULT_VIEWPORT;
          }
          if (lbo.viewport?.width && lbo.viewport?.height) {
            chromeFlags.push(
              `--window-size=${lbo.viewport.width},${lbo.viewport.height + 87}`, // Added pixels to the window to account for the address bar
            );
          }
          if (typeof lbo.deviceScaleFactor === "number") {
            chromeFlags.push(
              `--force-device-scale-factor=${Math.max(0.1, lbo.deviceScaleFactor)}`,
            );
          }
          if (lbo.hasTouch) chromeFlags.push("--touch-events=enabled");
          if (lbo.ignoreHTTPSErrors)
            chromeFlags.push("--ignore-certificate-errors");
          if (lbo.proxy?.server)
            chromeFlags.push(`--proxy-server=${lbo.proxy.server}`);
          if (lbo.proxy?.bypass)
            chromeFlags.push(`--proxy-bypass-list=${lbo.proxy.bypass}`);

          // add user-supplied args last
          if (Array.isArray(lbo.args)) chromeFlags.push(...lbo.args);

          const keepAlive = this.keepAlive === true;
          const { ws, chrome } = await launchLocalChrome({
            chromePath: lbo.executablePath,
            chromeFlags,
            port: lbo.port,
            headless: lbo.headless,
            userDataDir,
            connectTimeoutMs: lbo.connectTimeoutMs,
            handleSIGINT: !keepAlive,
          });
          if (keepAlive) {
            try {
              chrome.process?.unref?.();
            } catch {
              // best-effort: avoid keeping the event loop alive
            }
          }
          this.ctx = await V3Context.create(ws, {
            env: "LOCAL",
            localBrowserLaunchOptions: lbo,
          });
          this.ctx.conn.flowLoggerContext = this.flowLoggerContext;
          this.ctx.conn.onTransportClosed(this._onCdpClosed);
          this.state = {
            kind: "LOCAL",
            chrome,
            ws,
            userDataDir,
            createdTempProfile: createdTemp,
            preserveUserDataDir: !!lbo.preserveUserDataDir,
          };
          this.resetBrowserbaseSessionMetadata();
          const chromePid = chrome.process?.pid ?? chrome.pid;
          if (!keepAlive && chromePid) {
            this.startShutdownSupervisor({
              kind: "LOCAL",
              pid: chromePid,
              userDataDir,
              createdTempProfile: createdTemp,
              preserveUserDataDir: !!lbo.preserveUserDataDir,
            });
          }

          // Post-connect settings (downloads and viewport) if provided
          await this._applyPostConnectLocalOptions(lbo);
          return;
        }

        if (this.opts.env === "BROWSERBASE") {
          const { apiKey, projectId } = this.requireBrowserbaseCreds();
          this.logger({
            category: "init",
            message: "Starting browserbase session",
            level: 1,
          });
          const baseSessionParams =
            this.opts.browserbaseSessionCreateParams ?? {};
          const resolvedKeepAlive = this.keepAlive;
          const keepAlive = this.keepAlive === true;
          let effectiveSessionParams = baseSessionParams;
          if (resolvedKeepAlive !== undefined) {
            effectiveSessionParams = {
              ...baseSessionParams,
              keepAlive: resolvedKeepAlive,
            };
          }
          if (!this.disableAPI && !this.experimental) {
            this.apiClient = new StagehandAPIClient({
              apiKey,
              projectId,
              logger: this.logger,
              serverCache: this.opts.serverCache,
            });
            const {
              projectId: overrideProjectId,
              browserSettings,
              userMetadata,
              ...restSessionParams
            } = effectiveSessionParams;
            const resolvedProjectId = overrideProjectId ?? projectId;
            const createSessionPayload = {
              ...(resolvedProjectId ? { projectId: resolvedProjectId } : {}),
              ...restSessionParams,
              browserSettings: {
                ...(browserSettings ?? {}),
                viewport: browserSettings?.viewport ?? {
                  width: 1288,
                  height: 711,
                },
              },
              userMetadata: {
                ...(userMetadata ?? {}),
                stagehand: "true",
              },
            };
            const { sessionId, available } = await this.apiClient.init({
              modelName: this.modelName,
              modelApiKey: this.modelClientOptions.apiKey,
              domSettleTimeoutMs: this.domSettleTimeoutMs,
              verbose: this.verbose,
              systemPrompt: this.opts.systemPrompt,
              selfHeal: this.opts.selfHeal,
              browserbaseSessionCreateParams: createSessionPayload,
              browserbaseSessionID: this.opts.browserbaseSessionID,
            });
            if (!available) {
              this.apiClient = null;
            }
            this.opts.browserbaseSessionID = sessionId;
          }
          const { ws, sessionId, bb } = await createBrowserbaseSession(
            apiKey,
            projectId,
            effectiveSessionParams,
            this.opts.browserbaseSessionID,
          );
          this.ctx = await V3Context.create(ws, {
            env: "BROWSERBASE",
            apiClient: this.apiClient,
          });
          this.ctx.conn.flowLoggerContext = this.flowLoggerContext;
          this.ctx.conn.onTransportClosed(this._onCdpClosed);
          this.state = { kind: "BROWSERBASE", sessionId, ws, bb };
          this.browserbaseSessionId = sessionId;
          if (!keepAlive && !this.disableAPI) {
            this.startShutdownSupervisor({
              kind: "STAGEHAND_API",
              sessionId,
              apiKey,
              projectId,
            });
          }

          await this._ensureBrowserbaseDownloadsEnabled();

          const resumed = !!this.opts.browserbaseSessionID;
          let debugUrl: string | undefined;
          try {
            const dbg = (await bb.sessions.debug(sessionId)) as unknown as {
              debuggerUrl?: string;
            };
            debugUrl = dbg?.debuggerUrl;
          } catch {
            // Ignore debug fetch failures; continue with sessionUrl only
          }
          const sessionUrl = `https://www.browserbase.com/sessions/${sessionId}`;
          this.browserbaseSessionUrl = sessionUrl;
          this.browserbaseDebugUrl = debugUrl;

          try {
            this.logger({
              category: "init",
              message: resumed
                ? this.apiClient
                  ? "Browserbase session started"
                  : "Browserbase session resumed"
                : "Browserbase session started",
              level: 1,
              auxiliary: {
                sessionUrl: { value: sessionUrl, type: "string" },
                ...(debugUrl && {
                  debugUrl: { value: debugUrl, type: "string" },
                }),
                sessionId: { value: sessionId, type: "string" },
              },
            });
          } catch {
            // best-effort logging — ignore failures
          }
          return;
        }

        const neverEnv: never = this.opts.env;
        throw new StagehandInitError(`Unsupported env: ${neverEnv}`);
      });
    } catch (error) {
      // Cleanup instanceLoggers map on init failure to prevent memory leak
      if (this.externalLogger) {
        try {
          unbindInstanceLogger(this.instanceId);
        } catch {
          // ignore cleanup errors
        }
      }
      throw error;
    }
  }

  /**
   * Applies the local-browser settings that have to be sent over CDP once a
   * connection exists. At the moment that is only the download behavior.
   *
   * The whole step is best-effort: nothing is sent when neither
   * `downloadsPath` nor `acceptDownloads` is configured or when there is no
   * context, and any failure is swallowed.
   */
  private async _applyPostConnectLocalOptions(
    lbo: LocalBrowserLaunchOptions,
  ): Promise<void> {
    try {
      const downloadsConfigured =
        Boolean(lbo.downloadsPath) || lbo.acceptDownloads !== undefined;
      if (!downloadsConfigured) return;

      const connection = this.ctx?.conn;
      if (!connection) return;

      try {
        await connection.send("Browser.setDownloadBehavior", {
          // Only an explicit `false` denies downloads; everything else allows.
          behavior: lbo.acceptDownloads === false ? "deny" : "allow",
          downloadPath: lbo.downloadsPath,
          eventsEnabled: true,
        });
      } catch {
        // a failed CDP command is ignored on purpose
      }
    } catch {
      // best-effort only
    }
  }

  /**
   * Best-effort: sends `Browser.setDownloadBehavior` so downloads are allowed
   * into the "downloads" path with download events enabled. Does nothing when
   * there is no connection, and ignores any error from the command.
   */
  private async _ensureBrowserbaseDownloadsEnabled(): Promise<void> {
    const connection = this.ctx?.conn;
    if (connection) {
      try {
        await connection.send("Browser.setDownloadBehavior", {
          behavior: "allow",
          downloadPath: "downloads",
          eventsEnabled: true,
        });
      } catch {
        // best-effort only
      }
    }
  }

  /** Clears the cached Browserbase session id, session URL and debug URL. */
  private resetBrowserbaseSessionMetadata(): void {
    this.browserbaseSessionId =
      this.browserbaseSessionUrl =
      this.browserbaseDebugUrl =
        undefined;
  }

  /**
   * Run an "act" instruction through the ActHandler.
   *
   * New API:
   * - act(instruction: string, options?: ActOptions)
   * - act(action: Action, options?: ActOptions)
   *
   * When an API client is present the call is delegated to it; otherwise the
   * local ActHandler performs the action. Every completed call is appended to
   * the instance history.
   *
   * @param input - A natural-language instruction, or an Action for which
   *   `isObserveResult(input)` is true (executed without the act cache).
   * @param options - Optional page, model, timeout and variables.
   * @returns The result of the action.
   * @throws StagehandNotInitializedError when no ActHandler is set.
   * @throws StagehandInvalidArgumentError when `input` is not an
   *   ObserveResult and is not a non-blank string.
   */
  async act(instruction: string, options?: ActOptions): Promise<ActResult>;
  async act(action: Action, options?: ActOptions): Promise<ActResult>;

  @FlowLogger.wrapWithLogging({
    eventType: "StagehandAct",
  })
  async act(input: string | Action, options?: ActOptions): Promise<ActResult> {
    return await withInstanceLogContext(this.instanceId, async () => {
      if (!this.actHandler) throw new StagehandNotInitializedError("act()");

      let actResult: ActResult;

      // --- Action (ObserveResult) path: no cache lookup, no cache store ---
      if (isObserveResult(input)) {
        // Resolve page: use provided page if any, otherwise default active page
        const v3Page = await this.resolvePage(options?.page);

        // Use selector as provided to support XPath, CSS, and other engines
        const selector = input.selector;
        if (this.apiClient) {
          actResult = await this.apiClient.act({
            input,
            options,
            frameId: v3Page.mainFrameId(),
          });
        } else {
          // Guard built from options.timeout; it produces an ActTimeoutError
          // and is handed to the handler.
          const ensureTimeRemaining = createTimeoutGuard(
            options?.timeout,
            (ms) => new ActTimeoutError(ms),
          );
          actResult = await this.actHandler.takeDeterministicAction(
            { ...input, selector },
            v3Page,
            this.domSettleTimeoutMs,
            this.resolveLlmClient(options?.model),
            ensureTimeRemaining,
            options?.variables,
          );
        }

        // history: record ObserveResult-based act call
        this.addToHistory(
          "act",
          {
            observeResult: input,
          },
          actResult,
        );
        return actResult;
      }
      // instruction path
      // Anything that is not an ObserveResult must be a non-blank string.
      if (typeof input !== "string" || !input.trim()) {
        throw new StagehandInvalidArgumentError(
          "act(): instruction string is required unless passing an Action",
        );
      }

      // Resolve page from options or default
      const page = await this.resolvePage(options?.page);
      // Only resolve a dedicated client when the caller overrides the model;
      // otherwise `undefined` is passed to the cache replay below.
      const actCacheLlmClient = options?.model
        ? this.resolveLlmClient(options.model)
        : undefined;

      let actCacheContext: Awaited<
        ReturnType<typeof this.actCache.prepareContext>
      > | null = null;
      // The cache is skipped while an agent replay is being recorded or when
      // the act cache is disabled.
      const canUseCache =
        typeof input === "string" &&
        !this.isAgentReplayRecording() &&
        this.actCache.enabled;
      if (canUseCache) {
        actCacheContext = await this.actCache.prepareContext(
          input,
          page,
          flattenVariables(options?.variables),
        );
        // prepareContext may yield a falsy value, in which case neither the
        // replay below nor the store at the end of this method runs.
        if (actCacheContext) {
          const cachedResult = await this.actCache.tryReplay(
            actCacheContext,
            page,
            options?.timeout,
            actCacheLlmClient,
          );
          // Cache hit: record it (flagged with cacheHit) and return without
          // calling the API client or the handler.
          if (cachedResult) {
            this.addToHistory(
              "act",
              {
                instruction: input,
                variables: options?.variables,
                timeout: options?.timeout,
                cacheHit: true,
              },
              cachedResult,
            );
            return cachedResult;
          }
        }
      }

      const handlerParams: ActHandlerParams = {
        instruction: input,
        page,
        variables: options?.variables,
        timeout: options?.timeout,
        model: options?.model,
      };
      // Delegate to the API client when one exists; handlerParams is only
      // used by the local handler.
      if (this.apiClient) {
        const frameId = page.mainFrameId();
        actResult = await this.apiClient.act({ input, options, frameId });
      } else {
        actResult = await this.actHandler.act(handlerParams);
      }
      // history: record instruction-based act call (omit page object)
      this.addToHistory(
        "act",
        {
          instruction: input,
          variables: options?.variables,
          timeout: options?.timeout,
        },
        actResult,
      );

      // Store only successful results that contain at least one action, and
      // only when a cache context was prepared above.
      if (
        actCacheContext &&
        actResult.success &&
        Array.isArray(actResult.actions) &&
        actResult.actions.length > 0
      ) {
        await this.actCache.store(actCacheContext, actResult);
      }
      return actResult;
    });
  }

  /**
   * Run an "extract" instruction through the ExtractHandler (or through the
   * API client when one is present) and record the call in history.
   *
   * Accepted forms:
   * - extract() → pageText
   * - extract(options) → pageText
   * - extract(instruction) → defaultExtractSchema
   * - extract(instruction, schema) → schema-inferred
   * - extract(instruction, schema, options)
   *
   * @throws StagehandNotInitializedError when no ExtractHandler is set.
   * @throws StagehandInvalidArgumentError when a schema is supplied together
   *   with an empty instruction.
   */
  async extract(): Promise<z.infer<typeof pageTextSchema>>;
  async extract(
    options: ExtractOptions,
  ): Promise<z.infer<typeof pageTextSchema>>;
  async extract(
    instruction: string,
    options?: ExtractOptions,
  ): Promise<z.infer<typeof defaultExtractSchema>>;
  async extract<T extends StagehandZodSchema>(
    instruction: string,
    schema: T,
    options?: ExtractOptions,
  ): Promise<InferStagehandSchema<T>>;

  @FlowLogger.wrapWithLogging({
    eventType: "StagehandExtract",
  })
  async extract(
    a?: string | ExtractOptions,
    b?: StagehandZodSchema | ExtractOptions,
    c?: ExtractOptions,
  ): Promise<unknown> {
    return await withInstanceLogContext(this.instanceId, async () => {
      if (!this.extractHandler) {
        throw new StagehandNotInitializedError("extract()");
      }

      // A schema is recognised structurally: any object that carries both
      // `parse` and `safeParse`.
      const looksLikeSchema = (
        candidate: unknown,
      ): candidate is StagehandZodSchema =>
        typeof candidate === "object" &&
        candidate !== null &&
        "parse" in candidate &&
        "safeParse" in candidate;

      // Untangle the positional arguments.
      let instruction: string | undefined;
      let schema: StagehandZodSchema | undefined;
      let options: ExtractOptions | undefined;

      if (typeof a !== "string") {
        // No instruction: the first argument is the options bag (or absent).
        options = (a as ExtractOptions) || undefined;
      } else {
        instruction = a;
        if (looksLikeSchema(b)) {
          schema = b as StagehandZodSchema;
          options = c as ExtractOptions | undefined;
        } else {
          options = b as ExtractOptions | undefined;
        }
      }

      if (schema && !instruction) {
        throw new StagehandInvalidArgumentError(
          "extract(): schema provided without instruction",
        );
      }

      // An instruction with no explicit schema falls back to
      // defaultExtractSchema; with neither, the schema stays undefined.
      const effectiveSchema =
        schema ?? (instruction ? defaultExtractSchema : undefined);

      // Page supplied in options, otherwise the active page.
      const targetPage = await this.resolvePage(options?.page);

      const handlerParams: ExtractHandlerParams<StagehandZodSchema> = {
        instruction,
        schema: effectiveSchema as StagehandZodSchema | undefined,
        model: options?.model,
        timeout: options?.timeout,
        selector: options?.selector,
        page: targetPage,
      };

      let result: z.infer<typeof effectiveSchema> | { pageText: string };
      if (!this.apiClient) {
        result =
          await this.extractHandler.extract<StagehandZodSchema>(handlerParams);
      } else {
        result = await this.apiClient.extract({
          instruction: handlerParams.instruction,
          schema: handlerParams.schema,
          options,
          frameId: targetPage.mainFrameId(),
        });
      }

      // History stores a JSON-schema rendering of the schema, not the schema
      // object itself.
      this.addToHistory(
        "extract",
        {
          instruction,
          selector: options?.selector,
          timeout: options?.timeout,
          schema: effectiveSchema ? toJsonSchema(effectiveSchema) : undefined,
        },
        result,
      );
      return result;
    });
  }

  /**
   * Run an "observe" instruction through the ObserveHandler (or through the
   * API client when one is present) and record the call in history.
   *
   * Accepted forms: observe(), observe(options), observe(instruction, options?).
   *
   * @throws StagehandNotInitializedError when no ObserveHandler is set.
   */
  async observe(): Promise<Action[]>;
  async observe(options: ObserveOptions): Promise<Action[]>;
  async observe(
    instruction: string,
    options?: ObserveOptions,
  ): Promise<Action[]>;
  @FlowLogger.wrapWithLogging({
    eventType: "StagehandObserve",
  })
  async observe(
    a?: string | ObserveOptions,
    b?: ObserveOptions,
  ): Promise<Action[]> {
    return await withInstanceLogContext(this.instanceId, async () => {
      if (!this.observeHandler) {
        throw new StagehandNotInitializedError("observe()");
      }

      // A string first argument is the instruction and the second argument is
      // the options; otherwise the first argument is the options.
      const instruction: string | undefined =
        typeof a === "string" ? a : undefined;
      const options: ObserveOptions | undefined =
        typeof a === "string" ? b : (a as ObserveOptions | undefined);

      // Page supplied in options, otherwise the active page.
      const targetPage = await this.resolvePage(options?.page);

      let results: Action[];
      if (!this.apiClient) {
        const handlerParams: ObserveHandlerParams = {
          instruction,
          model: options?.model,
          timeout: options?.timeout,
          selector: options?.selector,
          page: targetPage,
        };
        results = await this.observeHandler.observe(handlerParams);
      } else {
        results = await this.apiClient.observe({
          instruction,
          options,
          frameId: targetPage.mainFrameId(),
        });
      }

      // The history entry keeps the instruction and timeout only.
      this.addToHistory(
        "observe",
        {
          instruction,
          timeout: options?.timeout,
        },
        results,
      );
      return results;
    });
  }

  /**
   * Returns the browser-level CDP WebSocket endpoint of the current session.
   *
   * @throws StagehandNotInitializedError while the instance is uninitialized.
   */
  connectURL(): string {
    const current = this.state;
    if (current.kind !== "UNINITIALIZED") {
      return current.ws;
    }
    throw new StagehandNotInitializedError("connectURL()");
  }

  /**
   * The CDP-backed context currently held by this instance.
   * Note: close() resets the underlying field to null.
   */
  public get context(): V3Context {
    const activeContext = this.ctx;
    return activeContext;
  }

  /**
   * Best-effort cleanup of context and launched resources.
   *
   * Every step is wrapped so that a failure in one does not prevent the
   * others; the final state reset always runs.
   *
   * @param opts.force - When true, proceed even if another close() is already
   *   in progress (bypasses the `_isClosing` guard).
   */
  async close(opts?: { force?: boolean }): Promise<void> {
    // If we're already closing and this isn't a forced close, no-op.
    if (this._isClosing && !opts?.force) return;
    this._isClosing = true;

    // With keepAlive the API session is not ended and local Chrome is not
    // killed below; everything else is still torn down.
    const keepAlive = this.keepAlive === true;

    // Unhook CDP transport close handler BEFORE ending the API session.
    // apiClient.end() can cause the hosted API to terminate the Browserbase
    // session, which closes the CDP WebSocket. If the handler is still
    // registered, _onCdpClosed fires and re-enters close() with force=true,
    // causing a double-close cascade.
    try {
      if (this.ctx?.conn && this._onCdpClosed) {
        this.ctx.conn.offTransportClosed?.(this._onCdpClosed);
      }
    } catch {
      // ignore
    }

    // End Browserbase session via API when keepAlive is not enabled
    if (!keepAlive && this.apiClient) {
      try {
        await this.apiClient.end();
      } catch {
        // best-effort cleanup
      }
    }

    try {
      // Close session file logger
      try {
        await FlowLogger.close(this.flowLoggerContext);
      } catch {
        // ignore
      }

      // Close CDP context
      try {
        await this.ctx?.close();
      } catch {
        // ignore
      }

      // Kill local Chrome and clean up temp profile when keepAlive is not enabled
      if (!keepAlive && this.state.kind === "LOCAL") {
        // Snapshot the narrowed LOCAL state so the kill callback can use it.
        const localState = this.state;
        await cleanupLocalBrowser({
          killChrome: () => localState.chrome.kill(),
          userDataDir: localState.userDataDir,
          createdTempProfile: localState.createdTempProfile,
          preserveUserDataDir: localState.preserveUserDataDir,
        });
      }
    } finally {
      // Runs even if the cleanup above throws.
      this.stopShutdownSupervisor();

      // Reset internal state
      this.state = { kind: "UNINITIALIZED" };
      this.ctx = null;
      // Clear the guard so a later close() call is not short-circuited.
      this._isClosing = false;
      this.resetBrowserbaseSessionMetadata();
      try {
        unbindInstanceLogger(this.instanceId);
      } catch {
        // ignore
      }
      try {
        await this.eventStore.destroy();
      } catch {
        // ignore
      }
      try {
        this.bus.removeAllListeners();
      } catch {
        // ignore
      }
      // Drop history and handlers; act()/extract()/observe() throw
      // StagehandNotInitializedError while their handler is null.
      this._history = [];
      this.actHandler = null;
      this.extractHandler = null;
      this.observeHandler = null;
      V3._instances.delete(this);
    }
  }

  /**
   * Resolves the Browserbase API key from options or environment variables.
   * Returns undefined if no key is found (does not throw).
   *
   * Lookup order: `opts.apiKey`, then `BROWSERBASE_API_KEY`, then
   * `BB_API_KEY`. The environment fallbacks mirror the ones used by
   * requireBrowserbaseCreds(), so this getter reports a key whenever that
   * guard would accept one.
   *
   * @returns The resolved API key, or undefined when none is configured.
   */
  public get browserbaseApiKey(): string | undefined {
    return (
      this.opts.apiKey ||
      (process.env.BROWSERBASE_API_KEY ?? process.env.BB_API_KEY)
    );
  }

  /**
   * Guard that resolves the Browserbase credentials or throws.
   *
   * Values given in the options win; otherwise the API key comes from
   * `BROWSERBASE_API_KEY` / `BB_API_KEY` and the project id from
   * `BROWSERBASE_PROJECT_ID` / `BB_PROJECT_ID`. Resolved values are written
   * back into the options.
   *
   * @returns The API key and, when available, the project id.
   * @throws MissingEnvironmentVariableError when no API key can be resolved.
   */
  private requireBrowserbaseCreds(): {
    apiKey: string;
    projectId?: string;
  } {
    const env = process.env;

    // Explicit options first, environment variables second.
    const apiKey =
      this.opts.apiKey || (env.BROWSERBASE_API_KEY ?? env.BB_API_KEY);
    const projectId =
      this.opts.projectId ||
      (env.BROWSERBASE_PROJECT_ID ?? env.BB_PROJECT_ID);

    if (!apiKey) {
      throw new MissingEnvironmentVariableError(
        "BROWSERBASE_API_KEY",
        "Browserbase",
      );
    }

    // Remember what was resolved; the project id is optional.
    this.opts.apiKey = apiKey;
    if (projectId) {
      this.opts.projectId = projectId;
    }

    this.logger({
      category: "init",
      message: "Using Browserbase credentials",
      level: 1,
    });

    return { apiKey, projectId };
  }

  /**
   * Logging entry point for this instance.
   *
   * Returns a function that forwards each log line to the per-instance
   * StagehandLogger, filling in level 1 when the line carries no level.
   */
  public get logger(): (logLine: LogLine) => void {
    const forward = (entry: LogLine): void => {
      const level = entry.level ?? 1;
      this.stagehandLogger.log({ ...entry, level });
    };
    return forward;
  }

  /**
   * Normalize a Playwright/Puppeteer page object into its top frame id,
   * so handlers can resolve it to a `Page` within our V3Context.
   *
   * A temporary CDP session is opened on the external page to issue
   * `Page.getFrameTree`. The session is detached again afterwards (best
   * effort), so repeated calls do not accumulate open CDP sessions.
   *
   * Note: isPlaywrightPage() and isPatchrightPage() perform the same runtime
   * check, so a Patchright page is handled by the first branch.
   *
   * @param page - A Playwright, Patchright or Puppeteer page.
   * @returns The id of the page's main frame.
   * @throws StagehandInvalidArgumentError when the object matches none of the
   *   supported page shapes.
   */
  private async resolveTopFrameId(
    page: PlaywrightPage | PuppeteerPage | PatchrightPage,
  ): Promise<string> {
    if (this.isPlaywrightPage(page)) {
      const cdp = await page.context().newCDPSession(page);
      try {
        const { frameTree } = await cdp.send("Page.getFrameTree");
        return frameTree.frame.id;
      } finally {
        try {
          await cdp.detach();
        } catch {
          // best-effort: the session may already be gone
        }
      }
    }

    if (this.isPatchrightPage(page)) {
      const cdp = await page.context().newCDPSession(page);
      try {
        const { frameTree } = await cdp.send("Page.getFrameTree");
        return frameTree.frame.id;
      } finally {
        try {
          await cdp.detach();
        } catch {
          // best-effort: the session may already be gone
        }
      }
    }

    if (this.isPuppeteerPage(page)) {
      const cdp = await page.createCDPSession();
      try {
        const { frameTree } = await cdp.send("Page.getFrameTree");
        this.logger({
          category: "v3",
          message: "Puppeteer frame id",
          level: 2,
          auxiliary: {
            frameId: { value: frameTree.frame.id, type: "string" },
          },
        });
        return frameTree.frame.id;
      } finally {
        try {
          await cdp.detach();
        } catch {
          // best-effort: the session may already be gone
        }
      }
    }

    throw new StagehandInvalidArgumentError(
      "Unsupported page object passed to V3.act()",
    );
  }

  /** Type guard: true for a non-null object that exposes a `context()` function. */
  private isPlaywrightPage(p: unknown): p is PlaywrightPage {
    if (p === null || typeof p !== "object") {
      return false;
    }
    return typeof (p as PlaywrightPage).context === "function";
  }

  /** Type guard: true for a non-null object that exposes a `context()` function. */
  private isPatchrightPage(p: unknown): p is PatchrightPage {
    if (p === null || typeof p !== "object") {
      return false;
    }
    return typeof (p as PatchrightPage).context === "function";
  }

  /** Type guard: true for a non-null object that exposes a `target()` function. */
  private isPuppeteerPage(p: unknown): p is PuppeteerPage {
    if (p === null || typeof p !== "object") {
      return false;
    }
    return typeof (p as PuppeteerPage).target === "function";
  }

  /**
   * Picks the page an operation should run against: the given page reference
   * converted to a V3 `Page`, or the context's active page when none is given.
   *
   * @throws StagehandNotInitializedError when no page is given and there is
   *   no context.
   */
  private async resolvePage(page?: AnyPage): Promise<Page> {
    if (!page) {
      const activeContext = this.ctx;
      if (!activeContext) {
        throw new StagehandNotInitializedError("resolvePage()");
      }
      return await activeContext.awaitActivePage();
    }
    return await this.normalizeToV3Page(page);
  }

  /**
   * Converts any supported page handle into the matching V3 `Page`.
   *
   * A V3 `Page` instance is returned unchanged. A Playwright, Patchright or
   * Puppeteer page is mapped through its main frame id to the `Page` tracked
   * by the current context.
   *
   * Note: isPlaywrightPage() and isPatchrightPage() perform the same runtime
   * check, so a Patchright page is matched by the Playwright branch.
   *
   * @param input - The page handle supplied by the caller.
   * @returns The V3 `Page` for that handle.
   * @throws StagehandNotInitializedError when an external page is given but
   *   there is no context to look it up in.
   * @throws StagehandInitError when the context has no page for the frame id.
   * @throws StagehandInvalidArgumentError when the object is not a supported
   *   page type.
   */
  private async normalizeToV3Page(input: AnyPage): Promise<Page> {
    if (input instanceof (await import("./understudy/page.js")).Page) {
      return input as Page;
    }

    // One lookup shared by every external driver; only the driver name in
    // the failure message differs.
    const resolveExternal = async (
      external: PlaywrightPage | PuppeteerPage | PatchrightPage,
      driver: string,
    ): Promise<Page> => {
      // Fail with a descriptive error (instead of a TypeError on null) and
      // before opening a CDP session on the external page.
      const ctx = this.ctx;
      if (!ctx) {
        throw new StagehandNotInitializedError("normalizeToV3Page()");
      }
      const frameId = await this.resolveTopFrameId(external);
      const page = ctx.resolvePageByMainFrameId(frameId);
      if (!page) {
        throw new StagehandInitError(
          `Failed to resolve V3 Page from ${driver} page.`,
        );
      }
      return page;
    };

    if (this.isPlaywrightPage(input)) {
      return await resolveExternal(input, "Playwright");
    }
    if (this.isPatchrightPage(input)) {
      return await resolveExternal(input, "Patchright");
    }
    if (this.isPuppeteerPage(input)) {
      return await resolveExternal(input, "Puppeteer");
    }
    throw new StagehandInvalidArgumentError("Unsupported page object.");
  }

  /**
   * Fetches the current Browserbase session and logs its status at level 0.
   * A "TIMED_OUT" status gets a dedicated message that includes the session
   * id. Does nothing outside a Browserbase session or when no status is
   * returned; lookup failures are ignored.
   */
  private async _logBrowserbaseSessionStatus(): Promise<void> {
    if (this.state.kind === "BROWSERBASE") {
      try {
        const info = (await this.state.bb.sessions.retrieve(
          this.state.sessionId,
        )) as { id?: string; status?: string };

        const status = info?.status;
        if (status) {
          const sessionId = info.id ?? this.state.sessionId;

          let message = `Browserbase session status: ${status}`;
          if (status === "TIMED_OUT") {
            message = `Browserbase session timed out (sessionId: ${sessionId})`;
          }

          this.logger({
            category: "v3",
            message,
            level: 0,
          });
        }
      } catch {
        // Ignore failures; nothing to log
      }
    }
  }

  /**
   * Prepares shared context for agent execution (both execute and stream).
   * Extracts duplicated setup logic into a single helper.
   *
   * Steps, in order: warn when no mode is set, resolve tools, pick the LLM
   * client, build the V3AgentHandler, normalize the execute options, reject
   * the `onSafetyConfirmation` callback, switch the active page if one was
   * passed, and prepare the agent cache context.
   *
   * @param options - Agent configuration given to agent(); may be undefined.
   * @param instructionOrOptions - Either the instruction string or a full
   *   execute/stream options object.
   * @param agentConfigSignature - Signature of the agent config, passed to
   *   the agent cache as `configSignature`.
   * @returns The handler, the normalized options, the trimmed instruction,
   *   the cache context (null when caching is not attempted) and the LLM
   *   client used for the agent.
   * @throws StagehandInvalidArgumentError when an `onSafetyConfirmation`
   *   callback is supplied.
   */
  private async prepareAgentExecution(
    options: AgentConfig | undefined,
    instructionOrOptions:
      | string
      | AgentExecuteOptions
      | AgentStreamExecuteOptions,
    agentConfigSignature: string,
  ): Promise<{
    handler: V3AgentHandler;
    resolvedOptions: AgentExecuteOptions | AgentStreamExecuteOptions;
    instruction: string;
    cacheContext: AgentCacheContext | null;
    llmClient: LLMClient;
  }> {
    // Note: experimental validation is done at the call site before this method
    // Warn if mode is not explicitly set (defaults to "dom")
    if (options?.mode === undefined) {
      this.logger({
        category: "agent",
        message:
          "Using agent in default DOM mode (legacy). Agent will default to 'hybrid' on an upcoming release for improved performance.\n  → https://docs.stagehand.dev/v3/basics/agent\n",
        level: 0,
      });
    }

    // With integrations, tools are resolved together with them; otherwise
    // the caller's tools (or an empty set) are used as-is.
    const tools = options?.integrations
      ? await resolveTools(options.integrations, options.tools)
      : (options?.tools ?? {});

    // A model override on the agent config gets its own client; otherwise
    // the instance-level client is reused.
    const agentLlmClient = options?.model
      ? this.resolveLlmClient(options.model)
      : this.llmClient;

    // The execution model falls back to the agent model when not set.
    const resolvedExecutionModel = options?.executionModel ?? options?.model;

    const handler = new V3AgentHandler(
      this,
      this.logger,
      agentLlmClient,
      resolvedExecutionModel,
      options?.systemPrompt,
      tools,
      options?.mode,
      this.isCaptchaAutoSolveEnabled,
    );

    // Normalize both call shapes into an options object and make sure
    // toolTimeout always has a value (default: DEFAULT_AGENT_TOOL_TIMEOUT_MS).
    const resolvedOptions: AgentExecuteOptions | AgentStreamExecuteOptions =
      typeof instructionOrOptions === "string"
        ? {
            instruction: instructionOrOptions,
            toolTimeout: DEFAULT_AGENT_TOOL_TIMEOUT_MS,
          }
        : {
            ...instructionOrOptions,
            toolTimeout:
              instructionOrOptions.toolTimeout ?? DEFAULT_AGENT_TOOL_TIMEOUT_MS,
          };

    // This path rejects the safety-confirmation callback outright; per the
    // error text it is only supported for mode: "cua" agents.
    const callbacksWithSafety = resolvedOptions.callbacks as
      | AgentExecuteCallbacks
      | undefined;
    if (callbacksWithSafety?.onSafetyConfirmation) {
      throw new StagehandInvalidArgumentError(
        'onSafetyConfirmation callback is only supported when using mode: "cua" agents.',
      );
    }

    // An explicitly passed page becomes the context's active page. This must
    // happen before the cache context below reads the active page.
    if (resolvedOptions.page) {
      const normalizedPage = await this.normalizeToV3Page(resolvedOptions.page);
      this.ctx!.setActivePage(normalizedPage);
    }

    const instruction = resolvedOptions.instruction.trim();
    const sanitizedOptions =
      this.agentCache.sanitizeExecuteOptions(resolvedOptions);

    const cacheVariables = flattenVariables(resolvedOptions.variables);

    // The cache context is only prepared when the agent cache says this
    // instruction should be attempted; otherwise it stays null.
    const cacheContext = this.agentCache.shouldAttemptCache(instruction)
      ? await this.agentCache.prepareContext({
          instruction,
          options: sanitizedOptions,
          configSignature: agentConfigSignature,
          page: await this.ctx!.awaitActivePage(),
          variables: cacheVariables,
        })
      : null;

    return {
      handler,
      resolvedOptions,
      instruction,
      cacheContext,
      llmClient: agentLlmClient,
    };
  }

  /**
   * Create an agent bound to this V3 instance and return an object exposing `execute()`.
   *
   * The execution path is chosen once, when `agent()` is called:
   * - CUA (computer-use) path: taken when `mode` is `"cua"`, or — only when `mode` is
   *   not set — when the deprecated `cua: true` flag is given. The resolved model must
   *   be reported as a CUA model by `resolveModel`, otherwise `CuaModelRequiredError`
   *   is thrown at creation time.
   * - Default path: the AISDK tools-based agent, which runs in streaming mode when
   *   `options.stream` is true and in non-streaming mode otherwise.
   *
   * In every path the returned `execute` is wrapped with
   * `FlowLogger.wrapWithLogging({ eventType: "AgentExecute" })` and runs inside
   * `withInstanceLogContext` for this instance id.
   *
   * @param options Agent configuration (mode, model, system prompt, tools, integrations, stream, ...).
   * @returns An object whose `execute(instructionOrOptions)` accepts either a plain
   *   instruction string or an execute-options object.
   * @throws CuaModelRequiredError when CUA mode is requested with a non-CUA model.
   *
   * @overload When stream: true, returns a streaming agent where execute() returns AgentStreamResult
   * @overload When stream is false/undefined, returns a non-streaming agent where execute() returns AgentResult
   */
  agent(options: AgentConfig & { stream: true }): {
    execute: (
      instructionOrOptions: string | AgentStreamExecuteOptions,
    ) => Promise<AgentStreamResult>;
  };
  agent(options?: AgentConfig & { stream?: false }): {
    execute: (
      instructionOrOptions: string | AgentExecuteOptions,
    ) => Promise<AgentResult>;
  };
  agent(options?: AgentConfig): {
    execute: (
      instructionOrOptions:
        | string
        | AgentExecuteOptions
        | AgentStreamExecuteOptions,
    ) => Promise<AgentResult | AgentStreamResult>;
  } {
    // Determine if CUA mode is enabled (via mode: "cua" or deprecated cua: true).
    // An explicit `mode` always wins; `cua` is consulted only when `mode` is undefined.
    const isCuaMode =
      options?.mode !== undefined
        ? options.mode === "cua"
        : options?.cua === true;

    // Emit deprecation warning for cua: true (through both the instance logger and console.warn)
    if (options?.cua === true) {
      this.logger({
        category: "agent",
        message:
          '[DEPRECATED] The "cua: true" option is deprecated. Use "mode: \'cua\'" instead. This option will be removed in a future version.',
        level: 0,
      });
      console.warn(
        '[Stagehand] DEPRECATED: The "cua: true" option is deprecated. Use "mode: \'cua\'" instead.',
      );
    }

    // Log the effective agent configuration; `integrations` is included only when provided.
    this.logger({
      category: "agent",
      message: "Creating v3 agent instance",
      level: 1,
      auxiliary: {
        cua: { value: isCuaMode ? "true" : "false", type: "boolean" },
        mode: { value: options?.mode ?? "dom", type: "string" },
        model: {
          value: extractModelName(options?.model) ?? this.llmClient.modelName,
          type: "string",
        },
        systemPrompt: { value: options?.systemPrompt ?? "", type: "string" },
        tools: { value: JSON.stringify(options?.tools ?? {}), type: "object" },
        ...(options?.integrations && {
          integrations: {
            value: JSON.stringify(options.integrations),
            type: "object",
          },
        }),
      },
    });

    // If CUA mode is enabled (via mode: "cua" or deprecated cua: true), use the computer-use agent path
    if (isCuaMode) {
      // Validate agent config at creation time (includes CUA+streaming conflict check)
      validateExperimentalFeatures({
        isExperimental: this.experimental,
        agentConfig: options,
      });

      // Fall back to the instance-level model and client options when the agent config has no model.
      const modelToUse = options?.model || {
        modelName: this.modelName,
        ...this.modelClientOptions,
      };

      const { modelName, isCua, clientOptions } = resolveModel(modelToUse);

      if (!isCua) {
        throw new CuaModelRequiredError(AVAILABLE_CUA_MODELS);
      }

      // Computed once per agent() call and reused as the cache config signature for every execute().
      const agentConfigSignature =
        this.agentCache.buildConfigSignature(options);
      const execute = async (
        instructionOrOptions: string | AgentExecuteOptions,
      ): Promise<AgentResult> =>
        withInstanceLogContext(
          this.instanceId,
          async (): Promise<AgentResult> => {
            // Re-validate per call, now including the execute options (null for a plain string instruction).
            validateExperimentalFeatures({
              isExperimental: this.experimental,
              agentConfig: options,
              executeOptions:
                typeof instructionOrOptions === "object"
                  ? instructionOrOptions
                  : null,
            });

            // With integrations configured, resolveTools receives both the integrations and the
            // user-supplied tools; otherwise the user tools (or an empty set) are used as-is.
            const tools = options?.integrations
              ? await resolveTools(options.integrations, options.tools)
              : (options?.tools ?? {});

            // A fresh handler is built for every execute() call. The system prompt falls back to a
            // built-in default, and the captcha note is appended when captcha auto-solve is enabled.
            const handler = new V3CuaAgentHandler(
              this,
              this.logger,
              {
                modelName,
                clientOptions,
                userProvidedInstructions:
                  (options.systemPrompt ??
                    `You are a helpful assistant that can use a web browser.\nDo not ask follow up questions, the user will trust your judgement.`) +
                  (this.isCaptchaAutoSolveEnabled
                    ? CAPTCHA_CUA_SYSTEM_PROMPT_NOTE
                    : ""),
              },
              tools,
            );

            // Normalize the argument into an options object, defaulting toolTimeout when not supplied.
            const resolvedOptions: AgentExecuteOptions =
              typeof instructionOrOptions === "string"
                ? {
                    instruction: instructionOrOptions,
                    toolTimeout: DEFAULT_AGENT_TOOL_TIMEOUT_MS,
                  }
                : {
                    ...instructionOrOptions,
                    toolTimeout:
                      instructionOrOptions.toolTimeout ??
                      DEFAULT_AGENT_TOOL_TIMEOUT_MS,
                  };
            // A caller-supplied page becomes the active page before anything else runs.
            if (resolvedOptions.page) {
              const normalizedPage = await this.normalizeToV3Page(
                resolvedOptions.page,
              );
              this.ctx!.setActivePage(normalizedPage);
            }
            const instruction = resolvedOptions.instruction.trim();
            const sanitizedOptions =
              this.agentCache.sanitizeExecuteOptions(resolvedOptions);

            const cacheVariables = flattenVariables(resolvedOptions.variables);

            // Cache lookup: when a context can be prepared and a replay succeeds,
            // return the replayed result and skip execution below.
            let cacheContext: AgentCacheContext | null = null;
            if (this.agentCache.shouldAttemptCache(instruction)) {
              const startPage = await this.ctx!.awaitActivePage();
              cacheContext = await this.agentCache.prepareContext({
                instruction,
                options: sanitizedOptions,
                configSignature: agentConfigSignature,
                page: startPage,
                variables: cacheVariables,
              });
              if (cacheContext) {
                const replayed = await this.agentCache.tryReplay(cacheContext);
                if (replayed) {
                  return replayed;
                }
              }
            }

            // Record replay steps locally only when caching is active and execution will go through
            // the local handler (this condition is the negation of the API-client branch below).
            let agentSteps: AgentReplayStep[] = [];
            const shouldRecordLocally =
              !!cacheContext && (!this.apiClient || this.experimental);
            if (shouldRecordLocally) {
              this.beginAgentReplayRecording();
            }

            let result: AgentResult;
            try {
              if (this.apiClient && !this.experimental) {
                // Delegate to the API client, passing the active page's main frame id and
                // whether caching is active for this call.
                const page = await this.ctx!.awaitActivePage();
                result = await this.apiClient.agentExecute(
                  options,
                  resolvedOptions,
                  page.mainFrameId(),
                  !!cacheContext,
                );
                if (cacheContext) {
                  // Hand the latest cache entry held by the API client over to the agent cache.
                  const transferredEntry =
                    this.apiClient.consumeLatestAgentCacheEntry();
                  await this.agentCache.storeTransferredEntry(transferredEntry);
                }
              } else {
                // NOTE(review): the handler receives the caller's original argument, not
                // `resolvedOptions`, so the defaulted toolTimeout is not passed here — confirm intended.
                result = await handler.execute(instructionOrOptions);
              }
              if (shouldRecordLocally) {
                agentSteps = this.endAgentReplayRecording();
              }

              // Persist only successful runs that actually recorded at least one step.
              if (
                shouldRecordLocally &&
                cacheContext &&
                result.success &&
                agentSteps.length > 0
              ) {
                await this.agentCache.store(cacheContext, agentSteps, result);
              }

              return result;
            } catch (err) {
              // NOTE(review): `finally` below performs the same discard, so this call is repeated on errors.
              if (shouldRecordLocally) this.discardAgentReplayRecording();
              throw err;
            } finally {
              // Runs on success as well, i.e. after endAgentReplayRecording() —
              // presumably a no-op at that point; confirm.
              if (shouldRecordLocally) {
                this.discardAgentReplayRecording();
              }
            }
          },
        );
      return {
        execute: FlowLogger.wrapWithLogging({
          eventType: "AgentExecute",
          context: this.flowLoggerContext,
        })(execute),
      };
    }

    // Default: AISDK tools-based agent
    const agentConfigSignature = this.agentCache.buildConfigSignature(options);
    const isStreaming = options?.stream ?? false;
    const execute = async (
      instructionOrOptions:
        | string
        | AgentExecuteOptions
        | AgentStreamExecuteOptions,
    ): Promise<AgentResult | AgentStreamResult> =>
      withInstanceLogContext(
        this.instanceId,
        async (): Promise<AgentResult | AgentStreamResult> => {
          // Validate per call, including the execute options (null for a plain string) and the streaming flag.
          validateExperimentalFeatures({
            isExperimental: this.experimental,
            agentConfig: options,
            executeOptions:
              typeof instructionOrOptions === "object"
                ? instructionOrOptions
                : null,
            isStreaming,
          });

          // Streaming mode
          if (isStreaming) {
            const { handler, resolvedOptions, cacheContext, llmClient } =
              await this.prepareAgentExecution(
                options,
                instructionOrOptions,
                agentConfigSignature,
              );

            // Cache hit: return the replayed stream and skip the live stream below.
            if (cacheContext) {
              const replayed = await this.agentCache.tryReplayAsStream(
                cacheContext,
                llmClient,
              );
              if (replayed) {
                return replayed;
              }
            }

            const streamResult = await handler.stream(
              resolvedOptions as AgentStreamExecuteOptions,
            );

            // With caching active, the stream is wrapped and the begin/end/discard recording
            // callbacks are handed to the cache rather than being invoked here.
            if (cacheContext) {
              const wrappedStream = this.agentCache.wrapStreamForCaching(
                cacheContext,
                streamResult,
                () => this.beginAgentReplayRecording(),
                () => this.endAgentReplayRecording(),
                () => this.discardAgentReplayRecording(),
              );
              return wrappedStream;
            }

            return streamResult;
          }

          // Non-streaming mode (default)
          const { handler, resolvedOptions, cacheContext, llmClient } =
            await this.prepareAgentExecution(
              options,
              instructionOrOptions,
              agentConfigSignature,
            );

          // Cache hit: return the replayed result and skip execution below.
          if (cacheContext) {
            const replayed = await this.agentCache.tryReplay(
              cacheContext,
              llmClient,
            );
            if (replayed) {
              return replayed;
            }
          }

          // Record replay steps locally only when caching is active and execution will go through
          // the local handler (this condition is the negation of the API-client branch below).
          let agentSteps: AgentReplayStep[] = [];
          const shouldRecordLocally =
            !!cacheContext && (!this.apiClient || this.experimental);
          if (shouldRecordLocally) {
            this.beginAgentReplayRecording();
          }
          let result: AgentResult;

          try {
            if (this.apiClient && !this.experimental) {
              // Delegate to the API client, passing the active page's main frame id and
              // whether caching is active for this call.
              const page = await this.ctx!.awaitActivePage();
              result = await this.apiClient.agentExecute(
                options ?? {},
                resolvedOptions as AgentExecuteOptions,
                page.mainFrameId(),
                !!cacheContext,
              );
              if (cacheContext) {
                // Hand the latest cache entry held by the API client over to the agent cache.
                const transferredEntry =
                  this.apiClient.consumeLatestAgentCacheEntry();
                await this.agentCache.storeTransferredEntry(transferredEntry);
              }
            } else {
              result = await handler.execute(
                resolvedOptions as AgentExecuteOptions,
              );
            }
            if (shouldRecordLocally) {
              agentSteps = this.endAgentReplayRecording();
            }

            // Persist only successful runs that actually recorded at least one step.
            if (
              shouldRecordLocally &&
              cacheContext &&
              result.success &&
              agentSteps.length > 0
            ) {
              await this.agentCache.store(cacheContext, agentSteps, result);
            }

            return result;
          } catch (err) {
            // NOTE(review): `finally` below performs the same discard, so this call is repeated on errors.
            if (shouldRecordLocally) this.discardAgentReplayRecording();
            throw err;
          } finally {
            // Runs on success as well, i.e. after endAgentReplayRecording() —
            // presumably a no-op at that point; confirm.
            if (shouldRecordLocally) {
              this.discardAgentReplayRecording();
            }
          }
        },
      );
    return {
      execute: FlowLogger.wrapWithLogging({
        eventType: "AgentExecute",
        context: this.flowLoggerContext,
      })(execute),
    };
  }
}

/**
 * Type guard: reports whether `v` is a non-null object that has a `selector`
 * property (own or inherited). Only the presence of the key is checked, not
 * its value or any other field of `Action`.
 */
function isObserveResult(v: unknown): v is Action {
  if (!v || typeof v !== "object") {
    return false;
  }
  return "selector" in v;
}


================================================
FILE: packages/core/lib/v3/zodCompat.ts
================================================
import { z } from "zod";
import type {
  ZodObject as Zod4Object,
  ZodRawShape as Zod4RawShape,
  ZodTypeAny as Zod4TypeAny,
} from "zod";
import zodToJsonSchema from "zod-to-json-schema";
import type * as z3 from "zod/v3";
/** Any Zod schema accepted here: a schema typed by the main `zod` entry point or by `zod/v3`. */
export type StagehandZodSchema = Zod4TypeAny | z3.ZodTypeAny;

/** An object schema typed by either the main `zod` entry point or `zod/v3`. */
export type StagehandZodObject =
  | Zod4Object<Zod4RawShape>
  | z3.ZodObject<z3.ZodRawShape>;

/**
 * Infers the output type of a schema, whichever Zod typing it matches.
 * The `zod/v3` branch is tested first; schemas matching neither branch resolve to `never`.
 */
export type InferStagehandSchema<T extends StagehandZodSchema> =
  T extends z3.ZodTypeAny
    ? z3.infer<T>
    : T extends Zod4TypeAny
      ? z.infer<T>
      : never;

/**
 * Type guard for Zod v4 schemas: a schema counts as v4 when its `_zod`
 * property is anything other than `undefined`.
 */
export const isZod4Schema = (
  schema: StagehandZodSchema,
): schema is Zod4TypeAny & { _zod: unknown } => {
  const candidate = schema as { _zod?: unknown };
  return candidate._zod !== undefined;
};

/**
 * Type guard for Zod v3 schemas, defined purely as the complement of
 * `isZod4Schema`: anything not recognised as v4 is treated as v3.
 */
export const isZod3Schema = (
  schema: StagehandZodSchema,
): schema is z3.ZodTypeAny => {
  const looksLikeV4 = isZod4Schema(schema);
  return !looksLikeV4;
};

/** A JSON Schema document as a plain object; this is the return type of `toJsonSchema`. */
export type JsonSchemaDocument = Record<string, unknown>;

/**
 * Convert a Zod schema (v3 or v4) into a JSON Schema document.
 *
 * - Schemas recognised by `isZod4Schema` go through `z.toJSONSchema()`.
 * - Everything else goes through the `zod-to-json-schema` package.
 *
 * @param schema The Zod schema to convert.
 * @returns The JSON Schema representation of `schema`.
 * @throws Error when a v4 schema is given but the imported `z` has no `toJSONSchema`.
 */
export function toJsonSchema(schema: StagehandZodSchema): JsonSchemaDocument {
  if (isZod4Schema(schema)) {
    // `toJSONSchema` is typed as optional so its absence can be detected at runtime.
    const zodV4 = z as typeof z & {
      toJSONSchema?: (schema: Zod4TypeAny) => JsonSchemaDocument;
    };

    if (!zodV4.toJSONSchema) {
      // This should never happen with Zod v4.1+
      throw new Error("Zod v4 toJSONSchema method not found");
    }

    return zodV4.toJSONSchema(schema as Zod4TypeAny);
  }

  return zodToJsonSchema(schema);
}


================================================
FILE: packages/core/lib/v3Evaluator.ts
================================================
/**
 * V3Evaluator mirrors Evaluator but operates on a V3 instance instead of Stagehand.
 * It uses the V3 page/screenshot APIs and constructs an LLM client to run
 * structured evaluations (YES/NO with reasoning) on screenshots and/or text.
 */

import { z } from "zod";
import type { AvailableModel, ClientOptions } from "./v3/types/public/model.js";
import type {
  EvaluateOptions,
  BatchAskOptions,
  EvaluationResult,
} from "./v3/types/private/evaluator.js";
import { LLMParsedResponse } from "./inference.js";
import { LLMResponse, LLMClient } from "./v3/llm/LLMClient.js";
import { LogLine } from "./v3/types/public/logs.js";
import { V3 } from "./v3/v3.js";
import { LLMProvider } from "./v3/llm/LLMProvider.js";
import { StagehandInvalidArgumentError } from "./v3/types/public/sdkErrors.js";

// Structured response requested from the LLM for a single evaluation:
// a YES/NO verdict plus free-text reasoning.
const EvaluationSchema = z.object({
  evaluation: z.enum(["YES", "NO"]),
  reasoning: z.string(),
});

// Structured response for batch evaluation: an array of single-evaluation objects.
const BatchEvaluationSchema = z.array(EvaluationSchema);

/**
 * Runs YES/NO evaluations against a V3 instance by sending a question
 * (optionally with screenshots, a text answer and/or the agent's reasoning)
 * to an LLM and reading back a structured `{ evaluation, reasoning }` result.
 */
export class V3Evaluator {
  private v3: V3;
  private modelName: AvailableModel;
  private modelClientOptions: ClientOptions | { apiKey: string };
  private silentLogger: (message: LogLine) => void = () => {};

  /**
   * @param v3 The V3 instance whose active page is screenshotted and whose logger is used.
   * @param modelName Model used for evaluation; defaults to "google/gemini-2.5-flash".
   * @param modelClientOptions Client options for the model; when omitted, an API key is
   *   read from GEMINI_API_KEY, then GOOGLE_GENERATIVE_AI_API_KEY, falling back to "".
   */
  constructor(
    v3: V3,
    modelName?: AvailableModel,
    modelClientOptions?: ClientOptions,
  ) {
    this.v3 = v3;
    this.modelName = modelName
      ? modelName
      : ("google/gemini-2.5-flash" as AvailableModel);

    if (modelClientOptions) {
      this.modelClientOptions = modelClientOptions;
    } else {
      const envApiKey =
        process.env.GEMINI_API_KEY ||
        process.env.GOOGLE_GENERATIVE_AI_API_KEY ||
        "";
      this.modelClientOptions = { apiKey: envApiKey };
    }
  }

  /** Builds an LLM client for the evaluator's own model via a dedicated provider. */
  private getClient(): LLMClient {
    // Prefer a dedicated provider so we can override model per-evaluation
    return new LLMProvider(this.v3.logger).getClient(
      this.modelName,
      this.modelClientOptions,
    );
  }

  /** Wraps a screenshot buffer as an `image_url` message part (base64 data URL). */
  private static imagePart(image: Buffer): {
    type: "image_url";
    image_url: { url: string };
  } {
    return {
      type: "image_url",
      image_url: { url: `data:image/jpeg;base64,${image.toString("base64")}` },
    };
  }

  /** Builds the INVALID result returned when the structured response cannot be read. */
  private static invalidResult(error: unknown): EvaluationResult {
    const errorMessage = error instanceof Error ? error.message : String(error);
    return {
      evaluation: "INVALID",
      reasoning: `Failed to get structured response: ${errorMessage}`,
    };
  }

  /** Reads a single evaluation out of an LLM response, mapping any failure to INVALID. */
  private static readEvaluation(response: { data: unknown }): EvaluationResult {
    try {
      const parsed = response.data as z.infer<typeof EvaluationSchema>;
      return { evaluation: parsed.evaluation, reasoning: parsed.reasoning };
    } catch (error) {
      return V3Evaluator.invalidResult(error);
    }
  }

  /**
   * Waits `delayMs`, then — only when `capture` is true — takes a viewport
   * (non-full-page) screenshot of the active page.
   */
  private async waitThenCapture(
    delayMs: number,
    capture: boolean,
  ): Promise<Buffer | undefined> {
    await new Promise((resolve) => setTimeout(resolve, delayMs));
    if (!capture) {
      return undefined;
    }
    const activePage = await this.v3.context.awaitActivePage();
    return activePage.screenshot({ fullPage: false });
  }

  /**
   * Ask a single YES/NO question.
   *
   * When `screenshot` is an array of buffers, evaluation is delegated to the
   * multi-screenshot path. Otherwise a screenshot of the active page is taken
   * (unless `screenshot` is false) after `screenshotDelayMs`.
   *
   * @throws StagehandInvalidArgumentError when `question` is empty, or when
   *   neither `answer` nor `screenshot` is provided.
   */
  async ask(options: EvaluateOptions): Promise<EvaluationResult> {
    const {
      question,
      answer,
      screenshot = true,
      systemPrompt,
      screenshotDelayMs = 250,
      agentReasoning,
    } = options;

    if (!question) {
      throw new StagehandInvalidArgumentError(
        "Question cannot be an empty string",
      );
    }
    if (!answer && !screenshot) {
      throw new StagehandInvalidArgumentError(
        "Either answer (text) or screenshot must be provided",
      );
    }

    if (Array.isArray(screenshot)) {
      return this._evaluateWithMultipleScreenshots({
        question,
        screenshots: screenshot,
        systemPrompt,
        agentReasoning,
      });
    }

    const evidenceSource = screenshot
      ? "a screenshot"
      : "the agents reasoning and actions throughout the task";
    const defaultSystemPrompt = `You are an expert evaluator that confidently returns YES or NO based on if the original goal was achieved. You have access to  ${evidenceSource} that you can use to evaluate the tasks completion. Provide detailed reasoning for your answer.\n          Today's date is ${new Date().toLocaleDateString()}`;

    const imageBuffer = await this.waitThenCapture(
      screenshotDelayMs,
      Boolean(screenshot),
    );

    const llmClient = this.getClient();

    const questionText = agentReasoning
      ? `Question: ${question}\n\nAgent's reasoning and actions taken:\n${agentReasoning}`
      : question;
    const imageParts =
      screenshot && imageBuffer ? [V3Evaluator.imagePart(imageBuffer)] : [];
    const answerParts = answer
      ? [{ type: "text" as const, text: `the answer is ${answer}` }]
      : [];

    const response = await llmClient.createChatCompletion<
      LLMParsedResponse<LLMResponse>
    >({
      logger: this.silentLogger,
      options: {
        messages: [
          { role: "system", content: systemPrompt || defaultSystemPrompt },
          {
            role: "user",
            content: [
              { type: "text", text: questionText },
              ...imageParts,
              ...answerParts,
            ],
          },
        ],
        response_model: { name: "EvaluationResult", schema: EvaluationSchema },
      },
    });

    return V3Evaluator.readEvaluation(response);
  }

  /**
   * Ask several YES/NO questions in one LLM call, optionally with one
   * screenshot of the active page shared by all questions.
   *
   * @returns One result per item of the LLM's response array; if the response
   *   cannot be read, one INVALID result per input question.
   * @throws StagehandInvalidArgumentError when `questions` is missing or empty.
   */
  async batchAsk(options: BatchAskOptions): Promise<EvaluationResult[]> {
    const {
      questions,
      screenshot = true,
      systemPrompt = "You are an expert evaluator that returns YES or NO with a concise reasoning.",
      screenshotDelayMs = 250,
    } = options;

    if (!questions?.length) {
      throw new StagehandInvalidArgumentError(
        "Questions array cannot be empty",
      );
    }

    const imageBuffer = await this.waitThenCapture(
      screenshotDelayMs,
      Boolean(screenshot),
    );

    const llmClient = this.getClient();

    // Numbered list of questions, each optionally followed by its answer.
    const numbered = questions.map((item, index) => {
      const answerLine = item.answer ? `\n   Answer: ${item.answer}` : "";
      return `${index + 1}. ${item.question}${answerLine}`;
    });
    const formatted = numbered.join("\n\n");

    const screenshotNote = screenshot ? " with a screenshot" : "";
    const answersNote = questions.some((q) => q.answer)
      ? "Some questions include answers to evaluate."
      : "";
    const systemContent = `${systemPrompt}\n\nYou will be given multiple questions${screenshotNote}. ${answersNote} Answer each question by returning an object in the specified JSON format. Return a single JSON array containing one object for each question in the order they were asked.`;
    const imageParts =
      screenshot && imageBuffer ? [V3Evaluator.imagePart(imageBuffer)] : [];

    const response = await llmClient.createChatCompletion<
      LLMParsedResponse<LLMResponse>
    >({
      logger: this.silentLogger,
      options: {
        messages: [
          { role: "system", content: systemContent },
          {
            role: "user",
            content: [{ type: "text", text: formatted }, ...imageParts],
          },
        ],
        response_model: {
          name: "BatchEvaluationResult",
          schema: BatchEvaluationSchema,
        },
      },
    });

    try {
      const parsed = response.data as unknown as z.infer<
        typeof BatchEvaluationSchema
      >;
      return parsed.map(({ evaluation, reasoning }) => ({
        evaluation,
        reasoning,
      }));
    } catch (error) {
      const failure = V3Evaluator.invalidResult(error);
      return questions.map(() => ({ ...failure }));
    }
  }

  /**
   * Evaluate one question against a caller-supplied sequence of screenshots
   * (no screenshot is taken here), optionally with the agent's reasoning.
   *
   * @throws StagehandInvalidArgumentError when `question` is empty or no
   *   screenshots are supplied.
   */
  private async _evaluateWithMultipleScreenshots(options: {
    question: string;
    screenshots: Buffer[];
    systemPrompt?: string;
    agentReasoning?: string;
  }): Promise<EvaluationResult> {
    const {
      question,
      screenshots,
      agentReasoning,
      systemPrompt = `You are an expert evaluator that confidently returns YES or NO given a question and multiple screenshots showing the progression of a task.
        ${agentReasoning ? "You also have access to the agent's detailed reasoning and thought process throughout the task." : ""}
        Analyze ALL screenshots to understand the complete journey. Look for evidence of task completion across all screenshots, not just the last one.
        Success criteria may appear at different points in the sequence (confirmation messages, intermediate states, etc).
        ${agentReasoning ? "The agent's reasoning provides crucial context about what actions were attempted, what was observed, and the decision-making process. Use this alongside the visual evidence to make a comprehensive evaluation." : ""}
        Today's date is ${new Date().toLocaleDateString()}`,
    } = options;

    if (!question) {
      throw new StagehandInvalidArgumentError(
        "Question cannot be an empty string",
      );
    }
    if (!screenshots || screenshots.length === 0) {
      throw new StagehandInvalidArgumentError(
        "At least one screenshot must be provided",
      );
    }

    const llmClient = this.getClient();

    const imageContents = screenshots.map((shot) =>
      V3Evaluator.imagePart(shot),
    );

    const userText = agentReasoning
      ? `Question: ${question}\n\nAgent's reasoning and actions throughout the task:\n${agentReasoning}\n\nI'm providing ${screenshots.length} screenshots showing the progression of the task. Please analyze both the agent's reasoning and all screenshots to determine if the task was completed successfully.`
      : `${question}\n\nI'm providing ${screenshots.length} screenshots showing the progression of the task. Please analyze all of them to determine if the task was completed successfully.`;

    const response = await llmClient.createChatCompletion<
      LLMParsedResponse<LLMResponse>
    >({
      logger: this.silentLogger,
      options: {
        messages: [
          { role: "system", content: systemPrompt },
          {
            role: "user",
            content: [{ type: "text", text: userText }, ...imageContents],
          },
        ],
        response_model: { name: "EvaluationResult", schema: EvaluationSchema },
      },
    });

    return V3Evaluator.readEvaluation(response);
  }
}


================================================
FILE: packages/core/package.json
================================================
{
  "name": "@browserbasehq/stagehand",
  "version": "3.2.0",
  "description": "An AI web browsing framework focused on simplicity and extensibility.",
  "type": "module",
  "main": "./dist/cjs/index.js",
  "module": "./dist/esm/index.js",
  "types": "./dist/esm/index.d.ts",
  "exports": {
    ".": {
      "types": "./dist/esm/index.d.ts",
      "import": "./dist/esm/index.js",
      "require": "./dist/cjs/index.js"
    },
    "./cli": {
      "types": "./dist/esm/lib/v3/cli.d.ts",
      "import": "./dist/esm/lib/v3/cli.js",
      "require": "./dist/cjs/cli.js"
    },
    "./*.js": {
      "types": "./dist/esm/*.d.ts",
      "import": "./dist/esm/*.js"
    },
    "./*": {
      "types": "./dist/esm/*.d.ts",
      "import": "./dist/esm/*.js"
    },
    "./package.json": "./package.json"
  },
  "engines": {
    "node": "^20.19.0 || >=22.12.0"
  },
  "scripts": {
    "gen-version": "tsx scripts/gen-version.ts",
    "build-dom-scripts": "pnpm run --parallel \"/^build-dom-scripts:(dom|locator|screenshot|a11y)$/\"",
    "build-dom-scripts:dom": "tsx lib/v3/dom/genDomScripts.ts",
    "build-dom-scripts:locator": "tsx lib/v3/dom/genLocatorScripts.ts",
    "build-dom-scripts:screenshot": "tsx lib/v3/dom/genScreenshotScripts.ts",
    "build-dom-scripts:a11y": "tsx lib/v3/dom/genA11yScripts.ts",
    "build:cjs": "tsx scripts/build-cjs.ts",
    "build:esm": "tsx scripts/build-esm.ts",
    "build": "pnpm --filter @browserbasehq/stagehand run --parallel \"/^build:(esm|cjs)$/\"",
    "example": "node --import tsx -e \"const args=process.argv.slice(1).filter(a=>a!=='--'); const [p]=args; const n=(p||'example').replace(/^\\.\\//,'').replace(/\\.ts$/i,''); import('node:path').then(path=>import(new URL(path.resolve('examples', n + '.ts'), 'file:')));\" --",
    "test": "pnpm -w --dir ../.. exec turbo run test:core test:e2e --filter=@browserbasehq/stagehand --",
    "test:core": "tsx scripts/test-core.ts",
    "test:e2e": "tsx scripts/test-e2e.ts",
    "format": "prettier --write .",
    "typecheck": "pnpm -w --dir ../.. exec tsc -p packages/core/tsconfig.json --noEmit",
    "eslint": "eslint .",
    "lint": "cd ../.. && prettier --check packages/core && cd packages/core && pnpm run eslint && pnpm run typecheck"
  },
  "files": [
    "dist/esm",
    "dist/cjs"
  ],
  "keywords": [
    "ai",
    "browser",
    "automation",
    "web-scraping",
    "testing"
  ],
  "author": "Browserbase",
  "license": "MIT",
  "peerDependencies": {
    "deepmerge": "^4.3.1",
    "zod": "^3.25.76 || ^4.2.0"
  },
  "dependencies": {
    "@ai-sdk/provider": "^2.0.0",
    "@anthropic-ai/sdk": "0.39.0",
    "@browserbasehq/sdk": "^2.7.0",
    "@google/genai": "^1.22.0",
    "@langchain/openai": "^0.4.4",
    "@modelcontextprotocol/sdk": "^1.17.2",
    "ai": "^5.0.133",
    "devtools-protocol": "^0.0.1464554",
    "fetch-cookie": "^3.1.0",
    "openai": "^4.87.1",
    "pino": "^9.6.0",
    "pino-pretty": "^13.0.0",
    "uuid": "^11.1.0",
    "ws": "^8.18.0",
    "zod-to-json-schema": "^3.25.0"
  },
  "optionalDependencies": {
    "@ai-sdk/amazon-bedrock": "^3.0.73",
    "@ai-sdk/anthropic": "^2.0.34",
    "@ai-sdk/azure": "^2.0.54",
    "@ai-sdk/cerebras": "^1.0.25",
    "@ai-sdk/deepseek": "^1.0.23",
    "@ai-sdk/google": "^2.0.53",
    "@ai-sdk/google-vertex": "^3.0.70",
    "@ai-sdk/groq": "^2.0.24",
    "@ai-sdk/mistral": "^2.0.19",
    "@ai-sdk/openai": "^2.0.53",
    "@ai-sdk/perplexity": "^2.0.13",
    "@ai-sdk/togetherai": "^1.0.23",
    "@ai-sdk/xai": "^2.0.26",
    "@langchain/core": "^0.3.80",
    "bufferutil": "^4.0.9",
    "chrome-launcher": "^1.2.0",
    "ollama-ai-provider-v2": "^1.5.0",
    "patchright-core": "^1.55.2",
    "playwright": "^1.52.0",
    "playwright-core": "^1.54.1",
    "puppeteer-core": "^22.8.0"
  },
  "devDependencies": {
    "@playwright/test": "^1.42.1",
    "@types/adm-zip": "^0.5.7",
    "@types/jsdom": "^27.0.0",
    "@types/node": "^20.11.30",
    "@types/ws": "^8.5.13",
    "@vitest/coverage-v8": "^4.0.8",
    "adm-zip": "^0.5.16",
    "chalk": "^5.4.1",
    "eslint": "10.0.2",
    "jsdom": "^24.0.0",
    "playwright": "^1.52.0",
    "playwright-core": "^1.54.1",
    "prettier": "^3.2.5",
    "tsx": "*",
    "vitest": "^4.0.8",
    "zod": "^3.25.76 || ^4.2.0"
  },
  "repository": {
    "type": "git",
    "url": "git+https://github.com/browserbase/stagehand.git",
    "directory": "packages/core"
  },
  "bugs": {
    "url": "https://github.com/browserbase/stagehand/issues"
  },
  "homepage": "https://stagehand.dev"
}


================================================
FILE: packages/core/scripts/build-cjs.ts
================================================
/**
 * Build canonical dist/ (CJS) output for the core package (including tests).
 *
 * Prereqs: pnpm install; run gen-version + build-dom-scripts first (turbo handles).
 * Args: none.
 * Env: none.
 * Example: pnpm run build:cjs
 */
import fs from "node:fs";
import { spawnSync } from "node:child_process";
import { getRepoRootDir } from "../lib/v3/runtimePaths.js";

const repoRoot = getRepoRootDir();

/**
 * Run a Node script synchronously with the current Node binary, from the repo
 * root, with stdio inherited. Exits this process with code 1 if the child
 * could not be spawned, or with the child's exit status (1 when the status is
 * null) if it finished with a non-zero status.
 */
const runNodeScript = (scriptPath: string, args: string[]) => {
  const { error, status } = spawnSync(process.execPath, [scriptPath, ...args], {
    cwd: repoRoot,
    stdio: "inherit",
  });

  if (error) {
    console.error(`Failed to run node ${scriptPath} ${args.join(" ")}`);
    console.error(error);
    process.exit(1);
  }

  if (status !== 0) {
    process.exit(status ?? 1);
  }
};

const coreDir = `${repoRoot}/packages/core`;
const cjsOutDir = `${coreDir}/dist/cjs`;

// Start from an empty dist/cjs directory.
fs.rmSync(cjsOutDir, { recursive: true, force: true });
fs.mkdirSync(cjsOutDir, { recursive: true });

// Emit CommonJS output plus declarations into dist/cjs.
runNodeScript(`${repoRoot}/node_modules/typescript/bin/tsc`, [
  "-p",
  "packages/core/tsconfig.json",
  "--module",
  "commonjs",
  "--declaration",
  "--outDir",
  "packages/core/dist/cjs",
]);

// Hand-written entry points and the package.json marker, written in this order.
const cjsGeneratedFiles: Array<[string, string]> = [
  [
    "index.js",
    ['"use strict";', 'module.exports = require("./lib/v3/index.js");', ""].join(
      "\n",
    ),
  ],
  [
    "cli.js",
    [
      "#!/usr/bin/env node",
      '"use strict";',
      'require("./lib/v3/cli.js");',
      "",
    ].join("\n"),
  ],
  [
    "index.d.ts",
    [
      'export * from "./lib/v3/index";',
      'export { default } from "./lib/v3/index";',
      "",
    ].join("\n"),
  ],
  ["package.json", '{\n  "type": "commonjs"\n}\n'],
];
for (const [fileName, contents] of cjsGeneratedFiles) {
  fs.writeFileSync(`${cjsOutDir}/${fileName}`, contents);
}

// Copy the .js files from lib/v3/dom/build (when that directory exists) next to the compiled output.
const domBuildSource = `${coreDir}/lib/v3/dom/build`;
const domBuildTarget = `${cjsOutDir}/lib/v3/dom/build`;
fs.mkdirSync(domBuildTarget, { recursive: true });
if (fs.existsSync(domBuildSource)) {
  fs.readdirSync(domBuildSource)
    .filter((file) => file.endsWith(".js"))
    .forEach((file) => {
      fs.copyFileSync(`${domBuildSource}/${file}`, `${domBuildTarget}/${file}`);
    });
}


================================================
FILE: packages/core/scripts/build-esm.ts
================================================
/**
 * Build canonical dist/esm output for the core package (including tests).
 *
 * Prereqs: pnpm install; run gen-version + build-dom-scripts first (turbo handles).
 * Args: none.
 * Env: none.
 * Example: pnpm run build:esm
 */
import fs from "node:fs";
import { spawnSync } from "node:child_process";
import { getRepoRootDir } from "../lib/v3/runtimePaths.js";

const repoRoot = getRepoRootDir();

/**
 * Run a Node script synchronously with the current Node binary, from the repo
 * root, with stdio inherited. Exits this process with code 1 if the child
 * could not be spawned, or with the child's exit status (1 when the status is
 * null) if it finished with a non-zero status.
 */
const runNodeScript = (scriptPath: string, args: string[]) => {
  const { error, status } = spawnSync(process.execPath, [scriptPath, ...args], {
    cwd: repoRoot,
    stdio: "inherit",
  });

  if (error) {
    console.error(`Failed to run node ${scriptPath} ${args.join(" ")}`);
    console.error(error);
    process.exit(1);
  }

  if (status !== 0) {
    process.exit(status ?? 1);
  }
};

const coreDir = `${repoRoot}/packages/core`;
const esmOutDir = `${coreDir}/dist/esm`;

// Remove any previous dist/esm output before compiling.
fs.rmSync(esmOutDir, { recursive: true, force: true });

// Core ESM emit includes generated lib/version.ts from gen-version (run in core build).
runNodeScript(`${repoRoot}/node_modules/typescript/bin/tsc`, [
  "-p",
  "packages/core/tsconfig.json",
  "--declaration",
]);

fs.mkdirSync(esmOutDir, { recursive: true });

// Package marker and root entry points, written in this order.
const esmReExports = [
  'export * from "./lib/v3/index.js";',
  'export { default } from "./lib/v3/index.js";',
  "",
].join("\n");
const esmGeneratedFiles: Array<[string, string]> = [
  ["package.json", '{\n  "type": "module"\n}\n'],
  ["index.js", esmReExports],
  ["index.d.ts", esmReExports],
];
for (const [fileName, contents] of esmGeneratedFiles) {
  fs.writeFileSync(`${esmOutDir}/${fileName}`, contents);
}

// DOM script bundles are generated artifacts (not TS emit); copy into dist/esm for runtime.
const domBuildSource = `${coreDir}/lib/v3/dom/build`;
const domBuildTarget = `${esmOutDir}/lib/v3/dom/build`;
fs.mkdirSync(domBuildTarget, { recursive: true });
if (fs.existsSync(domBuildSource)) {
  fs.readdirSync(domBuildSource)
    .filter((file) => file.endsWith(".js"))
    .forEach((file) => {
      fs.copyFileSync(`${domBuildSource}/${file}`, `${domBuildTarget}/${file}`);
    });
}

// Note: evals + server test outputs are built by their respective packages.


================================================
FILE: packages/core/scripts/coverage.ts
================================================
/**
 * Coverage merge (V8 -> Istanbul).
 *
 * Prereqs: V8 coverage JSON files in `coverage/**` (from test scripts).
 * Args: `merge` only.
 * Env: none required.
 * Example: pnpm run coverage:merge
 */
import fs from "node:fs";
import { spawn, type ChildProcess } from "node:child_process";
import normalizeV8Coverage from "./normalize-v8-coverage.js";
import { getRepoRootDir } from "../lib/v3/runtimePaths.js";

// Repository root; every coverage path below is built from it.
const repoRoot = getRepoRootDir();
// First CLI argument; only "merge" is accepted (validated further down).
const command = process.argv[2];
// Signals that trigger handleTermination.
const terminationSignals: NodeJS.Signals[] = ["SIGINT", "SIGTERM"];
// Prefixed console logger for this script.
const log = (message: string) => console.log(`[coverage:merge] ${message}`);

// Child process currently running (set by runC8Report), so a termination
// signal can be forwarded to it.
let activeChild: ChildProcess | null = null;
// Set once a termination signal has been received; checked by
// assertNotCancelling and by the final error handler.
let isCancelling = false;

/**
 * Exit code used when terminating because of `signal`:
 * 130 for SIGINT, 143 for anything else.
 */
const exitCodeForSignal = (signal: NodeJS.Signals): number => {
  if (signal === "SIGINT") {
    return 130;
  }
  return 143;
};

/**
 * Signal handler: flags the run as cancelled, forwards the signal to the
 * active child process (if one is running and not already killed), then exits
 * with the code matching the signal.
 */
const handleTermination = (signal: NodeJS.Signals) => {
  isCancelling = true;
  log(`received ${signal}, exiting`);

  const child = activeChild;
  if (child?.pid && !child.killed) {
    child.kill(signal);
  }

  process.exit(exitCodeForSignal(signal));
};

// Install a one-shot handler for each termination signal.
for (const signal of terminationSignals) {
  process.once(signal, () => handleTermination(signal));
}

/**
 * Cooperative cancellation check.
 *
 * @throws Error when a termination signal has already been received.
 */
const assertNotCancelling = () => {
  if (!isCancelling) return;
  throw new Error("Coverage merge cancelled");
};

// "merge" is the only supported command; a missing argument is rejected too.
if (command !== "merge") {
  console.error("Usage: coverage merge");
  process.exit(1);
}

// Default the scan limit to 2000 for this run when it is unset or empty.
if (!process.env.V8_COVERAGE_SCAN_LIMIT) {
  process.env.V8_COVERAGE_SCAN_LIMIT = "2000";
}
// Remove output and scratch directories left over from a previous merge.
fs.rmSync(`${repoRoot}/coverage/merged`, { recursive: true, force: true });
fs.rmSync(`${repoRoot}/coverage/.v8-tmp`, { recursive: true, force: true });
log(`normalizing v8 coverage in ${repoRoot}/coverage`);
log(`using V8_COVERAGE_SCAN_LIMIT=${process.env.V8_COVERAGE_SCAN_LIMIT}`);
// Run the normalizer over the coverage directory and report how long it took.
const normalizeStart = Date.now();
await normalizeV8Coverage(`${repoRoot}/coverage`);
log(`normalize completed in ${Date.now() - normalizeStart}ms`);
/**
 * Recursively gather the `.json` files under `dir` that parse as JSON with a
 * truthy top-level `result` property.
 *
 * Directories named `.v8-tmp` or `merged` are not descended into. Empty,
 * unreadable or malformed JSON files are skipped silently.
 *
 * @param dir Directory to scan; a missing directory yields an empty list.
 * @returns Matching file paths in traversal order.
 * @throws Error (via assertNotCancelling) if cancellation was requested mid-walk.
 */
const collectV8CoverageFiles = (dir: string): string[] => {
  const found: string[] = [];
  if (!fs.existsSync(dir)) return found;

  // True when the file holds non-blank JSON exposing a truthy `result`.
  const isV8CoverageJson = (filePath: string): boolean => {
    try {
      const text = fs.readFileSync(filePath, "utf8");
      if (!text.trim()) return false;
      const payload = JSON.parse(text) as { result?: unknown };
      return Boolean(payload?.result);
    } catch {
      // ignore invalid JSON in coverage dir
      return false;
    }
  };

  const visit = (folder: string) => {
    assertNotCancelling();
    for (const entry of fs.readdirSync(folder, { withFileTypes: true })) {
      assertNotCancelling();
      const entryPath = `${folder}/${entry.name}`;
      if (entry.isDirectory()) {
        const isScratchDir =
          entry.name === ".v8-tmp" || entry.name === "merged";
        if (!isScratchDir) visit(entryPath);
      } else if (
        entry.isFile() &&
        entry.name.endsWith(".json") &&
        isV8CoverageJson(entryPath)
      ) {
        found.push(entryPath);
      }
    }
  };

  visit(dir);
  return found;
};

// Find the V8 coverage files; with none there is nothing to merge, which is
// treated as success (exit 0).
const v8CoverageFiles = collectV8CoverageFiles(`${repoRoot}/coverage`);
if (v8CoverageFiles.length === 0) {
  console.log("No V8 coverage files found.");
  process.exit(0);
}
log(`found ${v8CoverageFiles.length} v8 coverage files`);

// Recreate the output and scratch directories, then copy every coverage file
// into the flat scratch directory under a unique coverage-<index>.json name.
fs.mkdirSync(`${repoRoot}/coverage/merged`, { recursive: true });
fs.rmSync(`${repoRoot}/coverage/.v8-tmp`, { recursive: true, force: true });
fs.mkdirSync(`${repoRoot}/coverage/.v8-tmp`, { recursive: true });
v8CoverageFiles.forEach((file, index) => {
  assertNotCancelling();
  fs.copyFileSync(file, `${repoRoot}/coverage/.v8-tmp/coverage-${index}.json`);
});
log(`copied files to ${repoRoot}/coverage/.v8-tmp`);

/**
 * Run `pnpm exec c8 report` over the staged files in coverage/.v8-tmp and
 * write the reports to coverage/merged.
 *
 * The child's stdout is echoed and also captured; when non-empty it is saved
 * to coverage/merged/coverage-summary.txt. The child's stderr is echoed only.
 *
 * @returns The child's exit code, or 1 when the child closed without one.
 * @throws Error if cancellation was already requested, or if the child
 *         process emits an "error" event (the promise rejects).
 */
const runC8Report = async () => {
  assertNotCancelling();
  log("running c8 report merge");
  const args = [
    "exec",
    "c8",
    "report",
    "--temp-directory",
    `${repoRoot}/coverage/.v8-tmp`,
    "--merge-async",
    "--reporter=html",
    "--reporter=lcov",
    "--reporter=json",
    "--reporter=text-summary",
    "--reports-dir",
    `${repoRoot}/coverage/merged`,
    "--cwd",
    repoRoot,
    "--include",
    "packages/**",
    "--exclude",
    "**/node_modules/**",
    "--exclude",
    "**/dist/**",
    "--exclude",
    "**/examples/**",
    "--exclude",
    "**/scripts/**",
    "--exclude",
    "packages/**/test/**",
    "--exclude",
    "packages/**/tests/**",
    "--exclude",
    "packages/**/examples/**",
    "--exclude",
    "packages/**/lib/**/tests/**",
    "--exclude",
    "packages/**/scripts/**",
    "--exclude-after-remap",
    "--exclude",
    "**/*.d.ts",
  ];
  // Accumulates everything the child prints on stdout.
  let stdout = "";

  const status = await new Promise<number>((resolve, reject) => {
    const child = spawn("pnpm", args, {
      cwd: repoRoot,
      stdio: ["ignore", "pipe", "pipe"],
    });
    // Expose the child so handleTermination can forward signals to it.
    activeChild = child;

    child.stdout?.on("data", (chunk) => {
      const text = String(chunk);
      stdout += text;
      process.stdout.write(text);
    });
    child.stderr?.on("data", (chunk) => {
      process.stderr.write(String(chunk));
    });

    child.once("error", (error) => {
      activeChild = null;
      reject(error);
    });
    child.once("close", (code) => {
      activeChild = null;
      // A null code is reported as failure (1).
      resolve(code ?? 1);
    });
  });

  // Persist the captured console output alongside the generated reports.
  if (stdout) {
    fs.writeFileSync(
      `${repoRoot}/coverage/merged/coverage-summary.txt`,
      stdout,
    );
  }
  log(`c8 report completed with status ${status}`);
  return status;
};

// Run the merge and exit with c8's status. Failures exit with 1, and the
// error message is suppressed when the failure was caused by cancellation.
try {
  process.exit(await runC8Report());
} catch (error) {
  if (!isCancelling) {
    const message = error instanceof Error ? error.message : String(error);
    console.error(`Failed to run c8 coverage report: ${message}`);
  }
  process.exit(1);
}


================================================
FILE: packages/core/scripts/gen-version.ts
================================================
import { readFileSync, writeFileSync } from "node:fs";
import { getPackageRootDir } from "../lib/v3/runtimePaths.js";

type PackageJson = { version: string };

// Read the package manifest that sits at the package root.
const packageRoot = getPackageRootDir();
const pkgPath = `${packageRoot}/package.json`;
const pkg = JSON.parse(
  readFileSync(pkgPath, "utf8"),
) as Partial<PackageJson> | null;

// JSON.parse output is untrusted: refuse to generate a version module from a
// manifest without a usable version instead of emitting "undefined".
const fullVersion = pkg?.version;
if (typeof fullVersion !== "string" || fullVersion.length === 0) {
  throw new Error(`Missing or invalid "version" field in ${pkgPath}`);
}

// JSON.stringify yields a double-quoted, correctly escaped string literal, so
// unusual characters in the version cannot break the generated source.
const banner = `/**
 * AUTO-GENERATED — DO NOT EDIT BY HAND
 *  Run \`pnpm run gen-version\` to refresh.
 */
export const STAGEHAND_VERSION = ${JSON.stringify(fullVersion)} as const;
`;

// Overwrite lib/version.ts with the generated module.
writeFileSync(`${packageRoot}/lib/version.ts`, banner);


================================================
FILE: packages/core/scripts/normalize-v8-coverage.ts
================================================
/**
 * Normalize V8 coverage ranges using sourcemaps to avoid offset/1x floor issues.
 *
 * Prereqs: V8 coverage JSON files plus JS files with inline or external sourcemaps.
 * Args: --coverage-dir <dir> (or NODE_V8_COVERAGE).
 * Env: NODE_V8_COVERAGE, V8_COVERAGE_SCAN_LIMIT.
 * Example: tsx packages/core/scripts/normalize-v8-coverage.ts --coverage-dir coverage/e2e-local
 */
import fs from "node:fs";
import path from "node:path";
import { fileURLToPath } from "node:url";
import {
  SourceMapConsumer,
  type RawIndexMap,
  type RawSourceMap,
} from "source-map";
import { getRepoRootDir, isMainModule } from "../lib/v3/runtimePaths.js";

/**
 * One coverage range. The offsets are converted to line/column positions
 * using the script file named by the owning entry's `url` (see
 * normalizeRange); `count` is presumably the execution count reported by V8.
 */
type CoverageRange = {
  startOffset: number;
  endOffset: number;
  count: number;
};

/** Coverage for one script: its URL (or path) and the ranges per function. */
type CoverageEntry = {
  url?: string;
  functions?: Array<{
    ranges?: CoverageRange[];
  }>;
};

/** Shape of a coverage JSON file as far as this script reads it. */
type CoverageFile = {
  result?: CoverageEntry[];
};

/**
 * Convert a coverage entry URL into a local file path.
 *
 * @param urlOrPath A `file:` URL or a filesystem path.
 * @returns The file path, or null for empty input, `node:` specifiers,
 *          `file:` URLs that cannot be converted, and non-absolute paths.
 */
const toFilePath = (urlOrPath: string): string | null => {
  if (!urlOrPath || urlOrPath.startsWith("node:")) return null;

  if (!urlOrPath.startsWith("file:")) {
    return path.isAbsolute(urlOrPath) ? urlOrPath : null;
  }

  try {
    return fileURLToPath(urlOrPath);
  } catch {
    return null;
  }
};

/** Parsed source map JSON: either a regular map or an index map. */
type SourceMapPayload = RawSourceMap | RawIndexMap;

/**
 * Load the source map referenced by a JS file's `sourceMappingURL` comment.
 *
 * Inline base64 `data:application/json` URIs are decoded directly, with or
 * without a `charset` parameter (e.g. `;charset=utf-8;base64,`). Any other
 * reference is treated as a path relative to the JS file.
 *
 * @param jsPath Path of the JS file.
 * @returns The parsed map, or null when the JS file is missing, has no
 *          `sourceMappingURL`, uses an unsupported `data:` URI, or points at
 *          a map file that does not exist.
 * @throws SyntaxError if the map content is not valid JSON.
 */
const readSourceMap = (jsPath: string): SourceMapPayload | null => {
  if (!fs.existsSync(jsPath)) return null;
  const source = fs.readFileSync(jsPath, "utf8");

  // The optional group accepts the `charset=utf-8;` (or `charset:utf-8;`)
  // parameter some tools insert before `base64,`.
  const inlineMatch = source.match(
    /sourceMappingURL=data:application\/json;(?:charset[=:][^;,\s]+;)?base64,([A-Za-z0-9+/=]+)/,
  );
  if (inlineMatch) {
    return JSON.parse(
      Buffer.from(inlineMatch[1], "base64").toString("utf8"),
    ) as SourceMapPayload;
  }

  const mapMatch = source.match(/sourceMappingURL=([^\s]+)/);
  if (!mapMatch) return null;
  const mapFile = mapMatch[1].trim();
  // Any remaining data: URI is a form this script cannot decode.
  if (mapFile.startsWith("data:")) return null;

  const mapPath = path.resolve(path.dirname(jsPath), mapFile);
  if (!fs.existsSync(mapPath)) return null;
  return JSON.parse(fs.readFileSync(mapPath, "utf8")) as SourceMapPayload;
};

/**
 * Compute the offset at which every line of `source` begins.
 *
 * @returns An ascending list that always starts with 0 and gains one entry
 *          (the index just past the newline) for each "\n" in the text.
 */
const buildLineStarts = (source: string) => {
  const starts: number[] = [0];
  let newlineAt = source.indexOf("\n");
  while (newlineAt !== -1) {
    starts.push(newlineAt + 1);
    newlineAt = source.indexOf("\n", newlineAt + 1);
  }
  return starts;
};

/**
 * Translate a character offset into a 1-based line and 0-based column by
 * binary-searching the line start table.
 *
 * @param lineStarts Ascending line start offsets (see buildLineStarts).
 * @param offset Character offset to locate.
 * @returns The position, or `{ line: 1, column: 0 }` when no line contains
 *          the offset (e.g. a negative offset or an empty table).
 */
const offsetToLineCol = (lineStarts: number[], offset: number) => {
  let lo = 0;
  let hi = lineStarts.length - 1;

  while (lo <= hi) {
    const probe = Math.floor((lo + hi) / 2);
    const lineStart = lineStarts[probe];

    if (lineStart > offset) {
      // The offset lies on an earlier line.
      hi = probe - 1;
      continue;
    }

    // The last line has no successor, so it extends indefinitely.
    const nextLineStart =
      probe + 1 < lineStarts.length ? lineStarts[probe + 1] : Infinity;
    if (lineStart <= offset && offset < nextLineStart) {
      return { line: probe + 1, column: offset - lineStart };
    }

    lo = probe + 1;
  }

  return { line: 1, column: 0 };
};

/**
 * Translate a 1-based line and 0-based column back into a character offset.
 *
 * The column is clamped to the line: it never goes below 0 nor past the
 * line's last position (just before the next line start, or `sourceLength`
 * for the final line). A line past the table falls back to start offset 0.
 *
 * @param lineStarts Ascending line start offsets (see buildLineStarts).
 * @param line 1-based line number; values below 1 are treated as line 1.
 * @param column 0-based column.
 * @param sourceLength Total length of the source text.
 */
const lineColToOffset = (
  lineStarts: number[],
  line: number,
  column: number,
  sourceLength: number,
) => {
  const index = Math.max(line - 1, 0);
  const begin = lineStarts[index] ?? 0;
  const hasNextLine = index + 1 < lineStarts.length;
  const end = hasNextLine ? lineStarts[index + 1] - 1 : sourceLength;
  const boundedColumn = Math.min(column, end - begin);
  return begin + Math.max(0, boundedColumn);
};
/** Settings for a normalization run. */
type NormalizerOptions = {
  // Directory that is scanned for coverage JSON files.
  coverageDir: string;
  // Upper bound on how many offsets are probed when looking for a mapped position.
  maxScan: number;
};

/** Per-script lookup data, cached by file path in normalizeCoverageDir. */
type SourceContext = {
  // Line start offsets of the script text (see buildLineStarts).
  lineStarts: number[];
  // Length of the script text.
  sourceLength: number;
  // Consumer built from the script's source map.
  consumer: SourceMapConsumer;
};

/** A position in an original source file, as returned by the source map. */
type MappedPosition = {
  source: string;
  line: number;
  column: number;
};

/** A mapped original position plus the script offset it was resolved from. */
type OffsetMapping = {
  mapped: MappedPosition;
  offset: number;
};

/**
 * Thin wrapper around `consumer.originalPositionFor` that takes the position
 * and bias as separate arguments.
 *
 * @param consumer Source map consumer to query.
 * @param line Line passed through to the consumer.
 * @param column Column passed through to the consumer.
 * @param bias Bias passed through to the consumer.
 * @returns Whatever the consumer reports for that position.
 */
const mapOriginalPosition = (
  consumer: SourceMapConsumer,
  line: number,
  column: number,
  bias: number,
) => {
  const query = { line, column, bias };
  return consumer.originalPositionFor(query);
};

/**
 * Find the first offset at or after `startOffset` that the source map can
 * resolve to an original source position.
 *
 * `startOffset` itself is always tried. If it is unmapped, later offsets are
 * probed one by one, up to `endOffset` and at most `options.maxScan` offsets
 * (also capped by the range length).
 *
 * @returns The resolved position and the offset it came from, or null when
 *          nothing in the scanned window is mapped.
 */
const findMappedStart = (
  ctx: SourceContext,
  startOffset: number,
  endOffset: number,
  options: NormalizerOptions,
): OffsetMapping | null => {
  // Resolve one offset: LEAST_UPPER_BOUND first, GREATEST_LOWER_BOUND as fallback.
  const resolveAt = (offset: number): OffsetMapping | null => {
    const { line, column } = offsetToLineCol(ctx.lineStarts, offset);
    let original = mapOriginalPosition(
      ctx.consumer,
      line,
      column,
      SourceMapConsumer.LEAST_UPPER_BOUND,
    );
    if (!original.source) {
      original = mapOriginalPosition(
        ctx.consumer,
        line,
        column,
        SourceMapConsumer.GREATEST_LOWER_BOUND,
      );
    }
    if (!original.source) return null;
    return {
      mapped: {
        source: original.source,
        line: original.line ?? 1,
        column: original.column ?? 0,
      },
      offset,
    };
  };

  const direct = resolveAt(startOffset);
  if (direct) return direct;

  const scanBudget = Math.min(
    options.maxScan,
    Math.max(0, endOffset - startOffset),
  );
  const lastOffset = Math.min(endOffset, startOffset + scanBudget);
  for (
    let candidate = startOffset + 1;
    candidate <= lastOffset;
    candidate += 1
  ) {
    const hit = resolveAt(candidate);
    if (hit) return hit;
  }

  return null;
};

/**
 * Find the last offset at or before `endOffset` that the source map can
 * resolve to an original source position.
 *
 * When `targetSource` is provided, only positions in that source file are
 * accepted. `endOffset` itself is always tried. If it does not qualify,
 * earlier offsets are probed one by one, down to `startOffset` and at most
 * `options.maxScan` offsets (also capped by the range length).
 *
 * @returns The resolved position and the offset it came from, or null when
 *          nothing in the scanned window qualifies.
 */
const findMappedEnd = (
  ctx: SourceContext,
  startOffset: number,
  endOffset: number,
  options: NormalizerOptions,
  targetSource?: string,
): OffsetMapping | null => {
  // A source qualifies when it is set and matches the target (if one is given).
  const isAcceptable = (source: string | null | undefined): source is string =>
    Boolean(source) && (!targetSource || source === targetSource);

  // Resolve one offset: GREATEST_LOWER_BOUND first, LEAST_UPPER_BOUND as fallback.
  const resolveAt = (offset: number): OffsetMapping | null => {
    const { line, column } = offsetToLineCol(ctx.lineStarts, offset);
    let original = mapOriginalPosition(
      ctx.consumer,
      line,
      column,
      SourceMapConsumer.GREATEST_LOWER_BOUND,
    );
    if (!isAcceptable(original.source)) {
      original = mapOriginalPosition(
        ctx.consumer,
        line,
        column,
        SourceMapConsumer.LEAST_UPPER_BOUND,
      );
    }
    if (!isAcceptable(original.source)) return null;
    return {
      mapped: {
        source: original.source,
        line: original.line ?? 1,
        column: original.column ?? 0,
      },
      offset,
    };
  };

  const direct = resolveAt(endOffset);
  if (direct) return direct;

  const scanBudget = Math.min(
    options.maxScan,
    Math.max(0, endOffset - startOffset),
  );
  const firstOffset = Math.max(startOffset, endOffset - scanBudget);
  for (
    let candidate = endOffset - 1;
    candidate >= firstOffset;
    candidate -= 1
  ) {
    const hit = resolveAt(candidate);
    if (hit) return hit;
  }

  return null;
};

/**
 * Snap a coverage range to offsets that the source map can resolve, mutating
 * `range` in place.
 *
 * @param range Range to adjust; empty or inverted ranges are left untouched.
 * @param ctx Line table and source map consumer of the script owning the range.
 * @param options Normalizer settings (scan limit).
 * @returns true when the range offsets were changed, false otherwise
 *          (including when no mapped start or end could be found).
 */
const normalizeRange = (
  range: CoverageRange,
  ctx: SourceContext,
  options: NormalizerOptions,
) => {
  if (range.endOffset <= range.startOffset) return false;
  const startMapping = findMappedStart(
    ctx,
    range.startOffset,
    range.endOffset,
    options,
  );
  if (!startMapping) return false;
  // The end must resolve to the same original source file as the start.
  const endMapping = findMappedEnd(
    ctx,
    range.startOffset,
    range.endOffset,
    options,
    startMapping.mapped.source,
  );
  if (!endMapping) return false;

  let startOffset = startMapping.offset;
  let endOffset = endMapping.offset;

  // Ranges with count 0 are widened: map the original start line (column 0)
  // and the original end line (largest column) back to the script, and grow
  // the range to include those positions. Presumably this makes uncovered
  // ranges span whole original lines — TODO confirm intent.
  if (range.count === 0) {
    const genStart = ctx.consumer.generatedPositionFor({
      source: startMapping.mapped.source,
      line: startMapping.mapped.line,
      column: 0,
      bias: SourceMapConsumer.LEAST_UPPER_BOUND,
    });
    const genEnd = ctx.consumer.generatedPositionFor({
      source: startMapping.mapped.source,
      line: endMapping.mapped.line ?? startMapping.mapped.line,
      column: Number.MAX_SAFE_INTEGER,
      bias: SourceMapConsumer.GREATEST_LOWER_BOUND,
    });
    // Only widen when both lookups produced a line.
    if (genStart.line && genEnd.line) {
      const expandedStart = lineColToOffset(
        ctx.lineStarts,
        genStart.line,
        genStart.column ?? 0,
        ctx.sourceLength,
      );
      const expandedEnd = lineColToOffset(
        ctx.lineStarts,
        genEnd.line,
        genEnd.column ?? 0,
        ctx.sourceLength,
      );
      // Widening may only grow the range, never shrink it.
      startOffset = Math.min(startOffset, expandedStart);
      endOffset = Math.max(endOffset, expandedEnd);
    }
  }

  // Never write back an empty or inverted range.
  if (endOffset <= startOffset) return false;
  if (startOffset !== range.startOffset || endOffset !== range.endOffset) {
    range.startOffset = startOffset;
    range.endOffset = endOffset;
    return true;
  }
  return false;
};

/**
 * Normalize every coverage JSON file under `options.coverageDir` in place.
 *
 * Each `.json` file (outside `.v8-tmp` and `merged` directories) is parsed;
 * for every entry whose script has a readable source map, all ranges are run
 * through normalizeRange. A file is rewritten only if a range changed.
 *
 * Does nothing when the directory is missing or holds no JSON files.
 * A JSON file that fails to parse makes the whole call reject.
 */
const normalizeCoverageDir = async (options: NormalizerOptions) => {
  if (!fs.existsSync(options.coverageDir)) return;
  const jsonFiles: string[] = [];
  // Recursively collect .json files, skipping the merge script's own directories.
  const walk = (dir: string) => {
    for (const entry of fs.readdirSync(dir, { withFileTypes: true })) {
      const full = `${dir}/${entry.name}`;
      if (entry.isDirectory()) {
        if (entry.name === ".v8-tmp" || entry.name === "merged") {
          continue;
        }
        walk(full);
      } else if (entry.isFile() && entry.name.endsWith(".json")) {
        jsonFiles.push(full);
      }
    }
  };
  walk(options.coverageDir);
  if (jsonFiles.length === 0) return;

  // Script path -> lookup context. null records "no usable source map" so the
  // script is not re-read for later entries.
  const sourceCache = new Map<string, SourceContext | null>();
  try {
    for (const file of jsonFiles) {
      const data = JSON.parse(fs.readFileSync(file, "utf8")) as CoverageFile;
      if (!Array.isArray(data.result)) continue;
      let updated = false;

      for (const entry of data.result) {
        const jsPath = entry.url ? toFilePath(entry.url) : null;
        if (!jsPath) continue;
        let ctx = sourceCache.get(jsPath);
        // undefined means "not looked up yet" (null is a cached miss).
        if (ctx === undefined) {
          const map = readSourceMap(jsPath);
          if (!map) {
            sourceCache.set(jsPath, null);
            continue;
          }
          const source = fs.readFileSync(jsPath, "utf8");
          ctx = {
            lineStarts: buildLineStarts(source),
            sourceLength: source.length,
            consumer: await new SourceMapConsumer(map),
          };
          sourceCache.set(jsPath, ctx);
        }
        if (!ctx) continue;
        if (!entry?.functions) continue;
        for (const block of entry.functions) {
          if (!block?.ranges) continue;
          for (const range of block.ranges) {
            if (normalizeRange(range, ctx, options)) {
              updated = true;
            }
          }
        }
      }

      // Avoid rewriting files whose ranges were all left as they were.
      if (updated) {
        fs.writeFileSync(file, JSON.stringify(data));
      }
    }
  } finally {
    // Always release the consumers, even when a file failed to process.
    for (const ctx of sourceCache.values()) {
      ctx?.consumer.destroy();
    }
  }
};

/**
 * Normalize the V8 coverage files under `coverageDir`.
 *
 * The scan limit comes from the `V8_COVERAGE_SCAN_LIMIT` environment
 * variable. An unset, blank, non-numeric, non-finite or negative value falls
 * back to 20000 rather than silently disabling the scan.
 *
 * @param coverageDir Absolute path, or a path relative to the repository root.
 */
export const normalizeV8Coverage = async (coverageDir: string) => {
  const repoRoot = getRepoRootDir();
  const resolvedDir = path.isAbsolute(coverageDir)
    ? coverageDir
    : path.resolve(repoRoot, coverageDir);

  const defaultMaxScan = 20000;
  const rawLimit = process.env.V8_COVERAGE_SCAN_LIMIT?.trim();
  const parsedLimit = rawLimit ? Number(rawLimit) : Number.NaN;
  const maxScan =
    Number.isFinite(parsedLimit) && parsedLimit >= 0
      ? parsedLimit
      : defaultMaxScan;

  await normalizeCoverageDir({ coverageDir: resolvedDir, maxScan });
};

export default normalizeV8Coverage;

/**
 * CLI entry point: takes the coverage directory from `--coverage-dir <dir>`,
 * falling back to NODE_V8_COVERAGE, and normalizes it. Exits with code 1
 * when neither provides a directory.
 */
const main = async () => {
  const cliArgs = process.argv.slice(2);
  const flagIndex = cliArgs.indexOf("--coverage-dir");
  const fromFlag = flagIndex >= 0 ? cliArgs[flagIndex + 1] : undefined;
  const coverageDir = fromFlag ?? process.env.NODE_V8_COVERAGE;

  if (!coverageDir) {
    console.error(
      "Missing coverage dir (use --coverage-dir or NODE_V8_COVERAGE).",
    );
    process.exit(1);
  }

  await normalizeV8Coverage(coverageDir);
};

// Run the CLI only when isMainModule() reports true (presumably when this
// file is executed directly rather than imported). Any failure is printed
// and turned into exit code 1.
if (isMainModule()) {
  main().catch((error) => {
    console.error(error);
    process.exit(1);
  });
}


================================================
FILE: packages/core/scripts/prepare.js
================================================
import { spawnSync } from "node:child_process";

// The build is skipped when CI is "true" or "1", or when SKIP_PREPARE is "1".
const isCi =
  process.env.CI === "true" ||
  process.env.CI === "1" ||
  process.env.SKIP_PREPARE === "1";

if (isCi) {
  console.log("Skipping prepare script in CI.");
  process.exit(0);
}

// Run the package build; a shell is only used on Windows.
const result = spawnSync("pnpm", ["run", "build"], {
  stdio: "inherit",
  shell: process.platform === "win32",
});

// When the command cannot be launched at all (e.g. pnpm is not on PATH),
// spawnSync reports it through `error` and leaves `status` null. Print it so
// the exit code 1 below is not silent.
if (result.error) {
  console.error("Failed to run pnpm run build");
  console.error(result.error);
}

process.exit(result.status ?? 1);


================================================
FILE: packages/core/scripts/test-core.ts
================================================
/**
 * Core unit tests (Vitest) on dist/esm tests.
 *
 * Prereqs: pnpm run build:esm (packages/core/dist/esm/tests/unit present).
 * Args: [test paths...] -- [vitest args...] | --list (prints JSON matrix)
 * Env: NODE_V8_COVERAGE, NODE_OPTIONS, VITEST_CONSOLE_REPORTER;
 *      writes CTRF to ctrf/vitest-core.xml by default.
 * Example: pnpm run test:core -- packages/core/dist/esm/tests/unit/foo.test.js -- --reporter=junit
 */
import fs from "node:fs";
import path from "node:path";
import { spawnSync } from "node:child_process";
import {
  ensureParentDir,
  parseListFlag,
  splitArgs,
  collectFiles,
  toSafeName,
  normalizeVitestArgs,
  findJunitPath,
  hasReporterName,
  writeCtrfFromJunit,
} from "./test-utils.js";
import { getRepoRootDir } from "../lib/v3/runtimePaths.js";

// Repository root; all paths below are built from it.
const repoRoot = getRepoRootDir();

// Unit test sources (used by --list) and their built counterparts in dist/esm.
const sourceTestsDir = `${repoRoot}/packages/core/tests/unit`;
const testsDir = `${repoRoot}/packages/core/dist/esm/tests/unit`;
// Vitest config passed when the caller does not supply one.
const defaultConfigPath = `${repoRoot}/packages/core/vitest.esm.config.mjs`;

/** Return absolute paths unchanged; resolve anything else against the repo root. */
const resolveRepoRelative = (value: string) => {
  if (path.isAbsolute(value)) return value;
  return path.resolve(repoRoot, value);
};

/**
 * Report whether the argument list already selects a Vitest config file.
 *
 * Both the long flag (`--config <path>`, `--config=<path>`) and Vitest's
 * short alias (`-c <path>`, `-c=<path>`) are recognised, so the script does
 * not add its default `--config` on top of a user-supplied one. A bare flag
 * without a following value does not count.
 *
 * @param argsList Extra arguments destined for Vitest.
 */
const hasConfigArg = (argsList: string[]) =>
  argsList.some((arg, i) => {
    if (arg.startsWith("--config=") || arg.startsWith("-c=")) return true;
    return (arg === "--config" || arg === "-c") && Boolean(argsList[i + 1]);
  });

/**
 * Derive a test name from a test file path: the path relative to the built
 * unit test directory (forward slashes), or just the file name when the path
 * lies outside it, with the trailing `.test.ts` / `.test.js` removed.
 */
const toTestName = (testPath: string) => {
  const absolute = resolveRepoRelative(testPath);
  const relative = path.relative(testsDir, absolute).replaceAll("\\", "/");
  const label = relative.startsWith("..") ? path.basename(absolute) : relative;
  return label.replace(/\.test\.(ts|js)$/i, "");
};

// Pull out --list first, then split what remains into test paths and extra
// arguments for Vitest.
const listFlag = parseListFlag(process.argv.slice(2));
const { paths, extra } = splitArgs(listFlag.args);

// --list mode: print one JSON entry per source test file (*.test.ts) and exit
// without running anything. Each entry carries the repo-relative path of the
// built .test.js file, the test name, and a name with path separators
// replaced (toSafeName).
if (listFlag.list) {
  const tests = collectFiles(sourceTestsDir, ".test.ts");
  const entries = tests.map((file) => {
    const relSource = path.relative(sourceTestsDir, file).replaceAll("\\", "/");
    const rel = relSource.replace(/\.test\.ts$/, "");
    const distPath = `${testsDir}/${relSource.replace(/\.test\.ts$/, ".test.js")}`;
    return {
      path: path.relative(repoRoot, distPath).replaceAll("\\", "/"),
      name: rel,
      safe_name: toSafeName(rel),
    };
  });
  console.log(JSON.stringify(entries));
  process.exit(0);
}

// The tests run from the build output, so it has to exist.
if (!fs.existsSync(testsDir)) {
  console.error(
    "Missing packages/core/dist/esm/tests/unit. Run pnpm run build:esm first.",
  );
  process.exit(1);
}

const runtimePaths = paths.map(resolveRepoRelative);
const hasUserConfig = hasConfigArg(extra);

// Append --enable-source-maps to whatever NODE_OPTIONS the caller already set.
const baseNodeOptions = "--enable-source-maps";
const nodeOptions = [process.env.NODE_OPTIONS, baseNodeOptions]
  .filter(Boolean)
  .join(" ");

// Only a single-test run gets its own name (used for per-test output paths).
const relTestName = paths.length === 1 ? toTestName(paths[0]) : null;

// Coverage goes to NODE_V8_COVERAGE when set, otherwise to coverage/core-unit
// (with a per-test subdirectory for single-test runs).
const coverageDir = resolveRepoRelative(
  process.env.NODE_V8_COVERAGE ??
    (relTestName
      ? `${repoRoot}/coverage/core-unit/${relTestName}`
      : `${repoRoot}/coverage/core-unit`),
);
fs.mkdirSync(coverageDir, { recursive: true });

const normalizedExtra = normalizeVitestArgs(repoRoot, extra);
const defaultJunitPath = (() => {
  if (!relTestName) {
    return `${repoRoot}/ctrf/core-unit/all.xml`;
  }
  return `${repoRoot}/ctrf/core-unit/${relTestName}.xml`;
})();
// True when the caller already supplied a JUnit output file.
const hasOutput = Boolean(findJunitPath(normalizedExtra));
const vitestArgs = [...normalizedExtra];
// Make sure both a console reporter and the junit reporter are active, and
// that the junit reporter has an output file.
const consoleReporter = process.env.VITEST_CONSOLE_REPORTER ?? "default";
if (!hasReporterName(vitestArgs, consoleReporter)) {
  vitestArgs.push(`--reporter=${consoleReporter}`);
}
if (!hasReporterName(vitestArgs, "junit")) {
  vitestArgs.push("--reporter=junit");
}
if (!hasOutput) {
  ensureParentDir(defaultJunitPath);
  vitestArgs.push(`--outputFile.junit=${defaultJunitPath}`);
}
const junitPath = findJunitPath(vitestArgs) ?? defaultJunitPath;

// Environment for the Vitest child process.
const env = {
  ...process.env,
  NODE_OPTIONS: nodeOptions,
  NODE_V8_COVERAGE: coverageDir,
};

// Run Vitest through pnpm inside the @browserbasehq/stagehand package. The
// default config is only passed when the caller did not provide one.
const result = spawnSync(
  "pnpm",
  [
    "--filter",
    "@browserbasehq/stagehand",
    "exec",
    "vitest",
    "run",
    ...(hasUserConfig ? [] : ["--config", defaultConfigPath]),
    ...vitestArgs,
    ...runtimePaths,
  ],
  { stdio: "inherit", env },
);

// When pnpm cannot be launched at all (e.g. it is not on PATH), spawnSync
// reports it through `error` and leaves `status` null. Print it so the
// exit code 1 below is not silent.
if (result.error) {
  console.error("Failed to run vitest via pnpm");
  console.error(result.error);
}

// Convert the JUnit report regardless of the test outcome.
writeCtrfFromJunit(junitPath, "vitest");

process.exit(result.status ?? 1);


================================================
FILE: packages/core/scripts/test-e2e.ts
================================================
/**
 * E2E tests (Playwright) on dist/esm tests.
 *
 * Prereqs: pnpm run build:esm (packages/core/dist/esm/tests/integration present).
 * Args: [test paths...] -- [playwright args...] | --list (prints JSON matrix).
 * Env: STAGEHAND_BROWSER_TARGET=local|browserbase, CHROME_PATH (local),
 *      NODE_V8_COVERAGE, PLAYWRIGHT_CONSOLE_REPORTER;
 *      writes CTRF to ctrf/playwright-*.xml by default.
 * Example: STAGEHAND_BROWSER_TARGET=browserbase pnpm run test:e2e -- packages/core/dist/esm/tests/integration/foo.spec.js
 */
import fs from "node:fs";
import path from "node:path";
import { spawnSync } from "node:child_process";
import {
  ensureParentDir,
  parseListFlag,
  splitArgs,
  collectFiles,
  toSafeName,
  writeCtrfFromJunit,
} from "./test-utils.js";
import {
  createRequireFromCaller,
  getRepoRootDir,
} from "../lib/v3/runtimePaths.js";

// Repository root; all paths below are built from it.
const repoRoot = getRepoRootDir();

// Integration test sources (used by --list) and their built counterparts.
const sourceTestsDir = `${repoRoot}/packages/core/tests/integration`;
const testsDir = `${repoRoot}/packages/core/dist/esm/tests/integration`;
// Playwright config passed when the caller does not supply one.
const defaultConfigPath = `${repoRoot}/packages/core/dist/esm/tests/integration/v3.playwright.config.js`;

/** Return absolute paths unchanged; resolve anything else against the repo root. */
const resolveRepoRelative = (value: string) => {
  if (path.isAbsolute(value)) return value;
  return path.resolve(repoRoot, value);
};
// Build a require function and use it to locate the Playwright CLI script,
// which is later run directly with the current Node binary.
const require = createRequireFromCaller();
const playwrightCliPath = require.resolve("@playwright/test/cli");

/**
 * Report whether the argument list already selects a Playwright config file.
 *
 * Both the long flag (`--config <file>`, `--config=<file>`) and Playwright's
 * short alias (`-c <file>`, `-c=<file>`) are recognised. A user config given
 * with `-c` therefore skips the default config and the check that the
 * default config exists. A bare flag without a following value does not count.
 *
 * @param argsList Extra arguments destined for Playwright.
 */
const hasConfigArg = (argsList: string[]) =>
  argsList.some((arg, i) => {
    if (arg.startsWith("--config=") || arg.startsWith("-c=")) return true;
    return (arg === "--config" || arg === "-c") && Boolean(argsList[i + 1]);
  });

/**
 * Remove every reporter option from an argument list.
 *
 * Handles `--reporter` / `-r` (together with the value that follows, when
 * there is one) and the inline `--reporter=<v>` / `-r=<v>` forms.
 *
 * @param argsList Arguments to filter.
 * @returns `filtered`: the remaining arguments in their original order;
 *          `removed`: whether at least one reporter option was dropped.
 */
const stripReporterArgs = (argsList: string[]) => {
  const filtered: string[] = [];
  let removed = false;

  let index = 0;
  while (index < argsList.length) {
    const arg = argsList[index];
    const isBareFlag = arg === "--reporter" || arg === "-r";
    const isInlineFlag =
      arg.startsWith("--reporter=") || arg.startsWith("-r=");

    if (!isBareFlag && !isInlineFlag) {
      filtered.push(arg);
      index += 1;
      continue;
    }

    removed = true;
    // A bare flag also swallows its value when one follows.
    index += isBareFlag && argsList[index + 1] ? 2 : 1;
  }

  return { filtered, removed };
};

/**
 * Derive a test name from a spec file path: the path relative to the built
 * integration test directory (forward slashes), or just the file name when
 * the path lies outside it, with the trailing `.spec.ts` / `.spec.js` removed.
 */
const toTestName = (testPath: string) => {
  const absolute = resolveRepoRelative(testPath);
  const relative = path.relative(testsDir, absolute).replaceAll("\\", "/");
  const label = relative.startsWith("..") ? path.basename(absolute) : relative;
  return label.replace(/\.spec\.(ts|js)$/i, "");
};

/**
 * Turn a test path into the value passed to Playwright: the path relative to
 * the built integration test directory (forward slashes), or the absolute
 * path when it lies outside it. A trailing `.ts` / `.js` after `.spec` or
 * `.test` is dropped, keeping the `.spec` / `.test` part.
 */
const toPlaywrightPath = (testPath: string) => {
  const absolute = resolveRepoRelative(testPath);
  const relative = path.relative(testsDir, absolute).replaceAll("\\", "/");
  const isOutsideTestsDir = relative.startsWith("..");
  const selected = isOutsideTestsDir ? absolute : relative;
  return selected.replace(/(\.spec|\.test)\.(ts|js)$/i, "$1");
};

// Pull out --list first, then split what remains into test paths and extra
// arguments for Playwright.
const listFlag = parseListFlag(process.argv.slice(2));
const { paths, extra } = splitArgs(listFlag.args);

// --list mode: print one JSON entry per source spec file (*.spec.ts) and exit
// without running anything. Each entry carries the repo-relative path of the
// built .spec.js file, the test name, and a name with path separators
// replaced (toSafeName).
if (listFlag.list) {
  const tests = collectFiles(sourceTestsDir, ".spec.ts");
  const entries = tests.map((file) => {
    const relSource = path.relative(sourceTestsDir, file).replaceAll("\\", "/");
    const rel = relSource.replace(/\.spec\.ts$/, "");
    const distPath = `${testsDir}/${relSource.replace(/\.spec\.ts$/, ".spec.js")}`;
    return {
      path: path.relative(repoRoot, distPath).replaceAll("\\", "/"),
      name: rel,
      safe_name: toSafeName(rel),
    };
  });
  console.log(JSON.stringify(entries));
  process.exit(0);
}

// The tests run from the build output, so it has to exist.
if (!fs.existsSync(testsDir)) {
  console.error(
    "Missing packages/core/dist/esm/tests/integration. Run pnpm run build:esm first.",
  );
  process.exit(1);
}

// Reporter options from the caller are dropped (with a warning) before the
// arguments are handed to Playwright.
const { filtered: extraArgs, removed: removedReporterOverride } =
  stripReporterArgs(extra);
if (removedReporterOverride) {
  console.warn(
    "Ignoring Playwright --reporter override to preserve console + JUnit output.",
  );
}

// Without a user-supplied config, the default built config must be present.
const hasUserConfig = hasConfigArg(extraArgs);
if (!hasUserConfig && !fs.existsSync(defaultConfigPath)) {
  console.error(`Missing Playwright config at ${defaultConfigPath}.`);
  process.exit(1);
}

const playwrightPaths = paths.map(toPlaywrightPath);

// Browser target: "browserbase" (case-insensitive) selects the e2e-bb output
// directories; anything else, including the default "local", uses e2e-local.
const target = (process.env.STAGEHAND_BROWSER_TARGET ?? "local").toLowerCase();
const useBrowserbase = target === "browserbase";
// Only a single-test run gets its own name (used for per-test output paths).
const relTestName = paths.length === 1 ? toTestName(paths[0]) : null;

// Coverage goes to NODE_V8_COVERAGE when set, otherwise to a target-specific
// directory under coverage/ (with a per-test subdirectory for single-test runs).
const coverageDir = resolveRepoRelative(
  process.env.NODE_V8_COVERAGE ??
    (relTestName
      ? `${repoRoot}/coverage/${useBrowserbase ? "e2e-bb" : "e2e-local"}/${relTestName}`
      : `${repoRoot}/coverage/${useBrowserbase ? "e2e-bb" : "e2e-local"}`),
);
fs.mkdirSync(coverageDir, { recursive: true });

// JUnit output path: CTRF_JUNIT_PATH when set, otherwise a target-specific
// file under ctrf/.
const defaultJunitPath = relTestName
  ? `${repoRoot}/ctrf/${useBrowserbase ? "e2e-bb" : "e2e-local"}/${relTestName}.xml`
  : `${repoRoot}/ctrf/${useBrowserbase ? "e2e-bb" : "e2e-local"}/all.xml`;
const ctrfPath = process.env.CTRF_JUNIT_PATH
  ? resolveRepoRelative(process.env.CTRF_JUNIT_PATH)
  : defaultJunitPath;
ensureParentDir(ctrfPath);

// Append --enable-source-maps to whatever NODE_OPTIONS the caller already set.
const baseNodeOptions = "--enable-source-maps";
const nodeOptions = [process.env.NODE_OPTIONS, baseNodeOptions]
  .filter(Boolean)
  .join(" ");

// Environment for the Playwright child process.
const env = {
  ...process.env,
  NODE_OPTIONS: nodeOptions,
  NODE_V8_COVERAGE: coverageDir,
  CTRF_JUNIT_PATH: ctrfPath,
};

// Run the Playwright CLI with the current Node binary from the repo root.
// The default config is only passed when the caller did not provide one.
const result = spawnSync(
  process.execPath,
  [
    playwrightCliPath,
    "test",
    ...(hasUserConfig ? [] : ["--config", defaultConfigPath]),
    ...extraArgs,
    ...playwrightPaths,
  ],
  { stdio: "inherit", env, cwd: repoRoot },
);

// Convert the JUnit report regardless of the test outcome.
writeCtrfFromJunit(ctrfPath, "playwright");

// Propagate Playwright's exit code; a missing status counts as failure.
process.exit(result.status ?? 1);


================================================
FILE: packages/core/scripts/test-utils.ts
================================================
/**
 * Shared helpers for scripts (not a runnable script).
 *
 * Prereqs: none.
 * Args: n/a.
 * Env: n/a.
 */
import fs from "node:fs";
import path from "node:path";
import { spawnSync } from "node:child_process";
import { getRepoRootDir } from "../lib/v3/runtimePaths.js";

// Repository root as reported by getRepoRootDir().
const workspaceRoot = getRepoRootDir();

/**
 * Create the directory that will contain `filePath`, including any missing
 * ancestors. The file itself is not created.
 */
export const ensureParentDir = (filePath: string) => {
  const parentDir = path.dirname(filePath);
  fs.mkdirSync(parentDir, { recursive: true });
};

/**
 * Split CLI arguments into test paths and extra (runner) arguments.
 *
 * Layout understood: `[--] [leading options...] [--] paths... [-- extra...]`.
 * Leading options are tokens starting with "-". An option without "=" also
 * takes the next token as its value when that token does not start with "-".
 * A "--" ends the leading options.
 *
 * @param args Raw arguments (not mutated).
 * @returns `paths`: tokens before the first remaining "--";
 *          `extra`: the leading options followed by everything after that "--".
 */
export const splitArgs = (args: string[]) => {
  let cursor = 0;
  const skipSeparators = () => {
    while (args[cursor] === "--") cursor += 1;
  };

  skipSeparators();

  const leadingExtra: string[] = [];
  while (cursor < args.length && args[cursor].startsWith("-")) {
    const option = args[cursor];
    cursor += 1;
    if (option === "--") break;
    leadingExtra.push(option);

    if (option.includes("=")) continue;
    const candidate = args[cursor];
    if (candidate && candidate !== "--" && !candidate.startsWith("-")) {
      leadingExtra.push(candidate);
      cursor += 1;
    }
  }

  skipSeparators();

  const rest = args.slice(cursor);
  const separatorAt = rest.indexOf("--");
  if (separatorAt === -1) {
    return { paths: rest, extra: [...leadingExtra] };
  }
  return {
    paths: rest.slice(0, separatorAt),
    extra: [...leadingExtra, ...rest.slice(separatorAt + 1)],
  };
};

/**
 * Extract the `--list` option from an argument list.
 *
 * Accepts `--list`, `--list <value>` (the next token is used as the value
 * unless it is empty or starts with "--") and `--list=<value>`. When the
 * option appears more than once, the last occurrence wins.
 *
 * @param args Raw arguments (not mutated).
 * @returns `list`: whether the option was present; `value`: its value
 *          ("" when absent or given without one); `args`: all other tokens.
 */
export const parseListFlag = (args: string[]) => {
  const inlinePrefix = "--list=";
  const remaining: string[] = [];
  let listValue: string | null = null;

  let index = 0;
  while (index < args.length) {
    const current = args[index];
    index += 1;

    if (current === "--list") {
      const following = args[index];
      if (following && !following.startsWith("--")) {
        listValue = following;
        index += 1;
      } else {
        listValue = "";
      }
    } else if (current.startsWith(inlinePrefix)) {
      listValue = current.slice(inlinePrefix.length);
    } else {
      remaining.push(current);
    }
  }

  return { list: listValue !== null, value: listValue ?? "", args: remaining };
};

/** Replace every "/" and "\" in `name` with "-". */
export const toSafeName = (name: string) => name.split(/[\\/]/).join("-");

/**
 * Recursively lists regular files under `dir` whose names end with `suffix`.
 *
 * Returned paths are built as `<parent>/<name>` (always a forward slash) and
 * sorted with the default string ordering.
 *
 * @param dir Directory to scan.
 * @param suffix Required file-name ending, e.g. `".test.ts"`.
 * @returns Sorted matching paths; empty when `dir` does not exist.
 */
export const collectFiles = (dir: string, suffix: string) => {
  const matches: string[] = [];
  if (!fs.existsSync(dir)) return matches;

  // Explicit stack instead of recursion; the final sort makes the traversal
  // order irrelevant to the result.
  const pending: string[] = [dir];
  while (pending.length > 0) {
    const folder = pending.pop() as string;
    const entries = fs.readdirSync(folder, { withFileTypes: true });
    for (const entry of entries) {
      const entryPath = `${folder}/${entry.name}`;
      if (entry.isDirectory()) {
        pending.push(entryPath);
        continue;
      }
      if (entry.isFile() && entry.name.endsWith(suffix)) {
        matches.push(entryPath);
      }
    }
  }
  return matches.sort();
};

/**
 * Returns a copy of `argsList` in which every `--outputFile.junit` target
 * (both the `--outputFile.junit=<path>` and `--outputFile.junit <path>`
 * forms) is an absolute path. Relative targets are resolved against
 * `repoRoot`, and the parent directory of each target is created.
 *
 * @param repoRoot Base directory for resolving relative junit paths.
 * @param argsList Argument list to normalize (not modified).
 * @returns The normalized copy.
 */
export const normalizeVitestArgs = (repoRoot: string, argsList: string[]) => {
  const inlinePrefix = "--outputFile.junit=";

  // Resolve one junit target and make sure its directory exists.
  const toAbsolute = (target: string) => {
    const absolute = path.isAbsolute(target)
      ? target
      : path.resolve(repoRoot, target);
    ensureParentDir(absolute);
    return absolute;
  };

  const result = [...argsList];
  let index = 0;
  while (index < result.length) {
    const current = result[index];
    if (current.startsWith(inlinePrefix)) {
      const target = current.slice(inlinePrefix.length);
      result[index] = `${inlinePrefix}${toAbsolute(target)}`;
    } else if (current === "--outputFile.junit" && result[index + 1]) {
      result[index + 1] = toAbsolute(result[index + 1]);
      // The value token has been handled; step over it.
      index += 1;
    }
    index += 1;
  }
  return result;
};

/**
 * Finds the first junit output path in an argument list.
 *
 * Recognizes `--outputFile.junit=<path>` and `--outputFile.junit <path>`.
 * The separated form is ignored when no non-empty token follows the flag.
 *
 * @param argsList Argument list to inspect.
 * @returns The path exactly as written in the arguments, or `null`.
 */
export const findJunitPath = (argsList: string[]) => {
  const inlinePrefix = "--outputFile.junit=";
  for (const [index, current] of argsList.entries()) {
    if (current.startsWith(inlinePrefix)) {
      return current.slice(inlinePrefix.length);
    }
    const following = argsList[index + 1];
    if (current === "--outputFile.junit" && following) {
      return following;
    }
  }
  return null;
};

/**
 * Collects reporter names from `--reporter=<names>` and `--reporter <names>`
 * arguments. Each value may hold several comma-separated names; names are
 * trimmed and empty ones dropped. Order of appearance is preserved.
 */
const parseReporters = (argsList: string[]) => {
  const rawValues: string[] = [];
  let index = 0;
  while (index < argsList.length) {
    const current = argsList[index];
    if (current.startsWith("--reporter=")) {
      rawValues.push(current.slice("--reporter=".length));
    } else if (current === "--reporter" && argsList[index + 1]) {
      rawValues.push(argsList[index + 1]);
      // Step over the value token that was just consumed.
      index += 1;
    }
    index += 1;
  }

  const names: string[] = [];
  for (const raw of rawValues) {
    for (const piece of raw.split(",")) {
      const name = piece.trim();
      if (name) names.push(name);
    }
  }
  return names;
};

/**
 * Reports whether `reporter` is among the reporter names requested in
 * `argsList` (exact, case-sensitive match).
 */
export const hasReporterName = (argsList: string[], reporter: string) => {
  const requested = parseReporters(argsList);
  return requested.includes(reporter);
};

/**
 * Converts a junit XML report to CTRF JSON by running
 * `pnpm exec junit-to-ctrf` from the workspace root.
 *
 * Does nothing when `junitPath` is missing or empty. The output path is
 * `junitPath` with a trailing `.xml` (any case) replaced by `.json`, or
 * `junitPath + ".json"` when there is no such suffix. A non-zero exit only
 * logs a warning; nothing is thrown for it.
 *
 * @param junitPath Path to the junit XML report.
 * @param tool Tool name passed to the converter via `-t`.
 */
export const writeCtrfFromJunit = (junitPath: string, tool: string) => {
  const hasContent =
    fs.existsSync(junitPath) && fs.statSync(junitPath).size !== 0;
  if (!hasContent) return;

  const xmlSuffix = /\.xml$/i;
  let ctrfPath: string;
  if (xmlSuffix.test(junitPath)) {
    ctrfPath = junitPath.replace(xmlSuffix, ".json");
  } else {
    ctrfPath = `${junitPath}.json`;
  }

  const converterArgs = [
    "exec",
    "junit-to-ctrf",
    junitPath,
    "-o",
    ctrfPath,
    "-t",
    tool,
  ];
  const { status } = spawnSync("pnpm", converterArgs, {
    stdio: "inherit",
    cwd: workspaceRoot,
  });
  if (status === 0) return;
  console.warn(`CTRF conversion failed for ${junitPath}.`);
};


================================================
FILE: packages/core/tests/cache-variables.test.ts
================================================
import { describe, expect, it, vi } from "vitest";
import { ActCache } from "../lib/v3/cache/ActCache";
import type { CacheStorage } from "../lib/v3/cache/CacheStorage";
import type { ActHandler } from "../lib/v3/handlers/actHandler";
import type { LLMClient } from "../lib/v3/llm/LLMClient";
import type { Page } from "../lib/v3/understudy/page";
import type { ActCacheContext, CachedActEntry } from "../lib/v3/types/private";
import type { Action } from "../lib/v3/types/public";

/**
 * Builds a stub CacheStorage whose `readJson` always resolves to
 * `{ value: entry }` and whose `writeJson` resolves to `{}`.
 */
function createFakeStorage<T>(entry: T): CacheStorage {
  const readJson = vi.fn().mockResolvedValue({ value: entry });
  const writeJson = vi.fn().mockResolvedValue({});
  const stub = {
    enabled: true,
    readJson,
    writeJson,
    directory: "/tmp/cache",
  };
  return stub as unknown as CacheStorage;
}

/**
 * Tests for how ActCache handles `variables`, using stubbed storage, handler
 * and page objects (no browser or LLM involved):
 * - prepareContext(): the cache key varies with variable names, not values.
 * - tryReplay(): caller-supplied variables are forwarded to the handler, and
 *   replay is skipped (null) when variable keys mismatch or values are
 *   missing.
 */
describe("ActCache variable handling", () => {
  it("cache key includes variable keys but not values", async () => {
    // readJson is left without a resolved value; this test only calls
    // prepareContext().
    const storage = {
      enabled: true,
      readJson: vi.fn(),
      writeJson: vi.fn().mockResolvedValue({}),
      directory: "/tmp/cache",
    } as unknown as CacheStorage;

    const cache = new ActCache({
      storage,
      logger: vi.fn(),
      getActHandler: () => null as unknown as ActHandler,
      getDefaultLlmClient: () => ({}) as LLMClient,
      domSettleTimeoutMs: undefined,
    });

    // Minimal page stub: only url() is provided.
    const fakePage = {
      url: vi.fn().mockResolvedValue("https://example.com"),
    } as unknown as Page;

    // First context with username="user1@example.com"
    const context1 = await cache.prepareContext(
      "type %username% into the email field",
      fakePage,
      { username: "user1@example.com" },
    );

    // Second context with username="user2@example.com"
    const context2 = await cache.prepareContext(
      "type %username% into the email field",
      fakePage,
      { username: "user2@example.com" },
    );

    // Third context with different variable key name
    const context3 = await cache.prepareContext(
      "type %email% into the email field",
      fakePage,
      { email: "user3@example.com" },
    );

    // Same instruction + same variable keys = same cache key
    expect(context1?.cacheKey).toBe(context2?.cacheKey);

    // Different variable keys = different cache key
    expect(context1?.cacheKey).not.toBe(context3?.cacheKey);

    // Verify variable keys are sorted and stored
    expect(context1?.variableKeys).toEqual(["username"]);
    expect(context2?.variableKeys).toEqual(["username"]);
    expect(context3?.variableKeys).toEqual(["email"]);

    // Verify variable values are preserved in context
    expect(context1?.variables).toEqual({ username: "user1@example.com" });
    expect(context2?.variables).toEqual({ username: "user2@example.com" });
  });

  it("replays cached actions with variable substitution", async () => {
    // Cached action contains variable placeholder %username%
    const action: Action = {
      selector: "xpath=/html/body/input[@type='email']",
      description: "type username into email field",
      method: "type",
      arguments: ["%username%"], // Variable placeholder
    };

    const entry: CachedActEntry = {
      version: 1,
      instruction: "type %username% into the email field",
      url: "https://example.com",
      variableKeys: ["username"],
      actions: [action],
      actionDescription: "type username",
      message: "done",
    };

    const storage = createFakeStorage(entry);

    // Track what variables are passed to takeDeterministicAction
    const capturedVariables: Record<string, string>[] = [];
    const handler = {
      takeDeterministicAction: vi
        .fn()
        .mockImplementation(
          // The stub records its sixth argument (the variables).
          async (_action, _page, _timeout, _client, _ensure, variables) => {
            capturedVariables.push(variables || {});
            return {
              success: true,
              message: "ok",
              actionDescription: "type username",
              actions: [action],
            };
          },
        ),
    } as unknown as ActHandler;

    const defaultClient = {} as LLMClient;

    const cache = new ActCache({
      storage,
      logger: vi.fn(),
      getActHandler: () => handler,
      getDefaultLlmClient: () => defaultClient,
      domSettleTimeoutMs: undefined,
    });

    // First replay with username="user1@example.com"
    const context1: ActCacheContext = {
      instruction: "type %username% into the email field",
      cacheKey: "test-key",
      pageUrl: "https://example.com",
      variableKeys: ["username"],
      variables: { username: "user1@example.com" },
    };

    const result1 = await cache.tryReplay(context1, {} as Page);

    expect(result1?.success).toBe(true);
    expect(handler.takeDeterministicAction).toHaveBeenCalledTimes(1);
    expect(capturedVariables[0]).toEqual({ username: "user1@example.com" });

    // Reset
    // Clear recorded calls so the second replay is counted from zero.
    vi.clearAllMocks();
    capturedVariables.length = 0;

    // Second replay with username="user2@example.com"
    const context2: ActCacheContext = {
      instruction: "type %username% into the email field",
      cacheKey: "test-key", // Same cache key!
      pageUrl: "https://example.com",
      variableKeys: ["username"],
      variables: { username: "user2@example.com" },
    };

    const result2 = await cache.tryReplay(context2, {} as Page);

    expect(result2?.success).toBe(true);
    expect(handler.takeDeterministicAction).toHaveBeenCalledTimes(1);
    expect(capturedVariables[0]).toEqual({ username: "user2@example.com" });
  });

  it("cache miss when variable keys don't match", async () => {
    const action: Action = {
      selector: "xpath=/html/body/input",
      description: "type username",
      method: "type",
      arguments: ["%username%"],
    };

    // Cached entry expects "username" variable
    const entry: CachedActEntry = {
      version: 1,
      instruction: "type %username% into the field",
      url: "https://example.com",
      variableKeys: ["username"],
      actions: [action],
    };

    const storage = createFakeStorage(entry);
    const cache = new ActCache({
      storage,
      logger: vi.fn(),
      getActHandler: () => null as unknown as ActHandler,
      getDefaultLlmClient: () => ({}) as LLMClient,
      domSettleTimeoutMs: undefined,
    });

    // Context has different variable key "email"
    const context: ActCacheContext = {
      instruction: "type %email% into the field",
      cacheKey: "test-key",
      pageUrl: "https://example.com",
      variableKeys: ["email"],
      variables: { email: "test@example.com" },
    };

    const result = await cache.tryReplay(context, {} as Page);

    // Should return null (cache miss) due to variable key mismatch
    expect(result).toBeNull();
  });

  it("cache miss when required variables are missing", async () => {
    const action: Action = {
      selector: "xpath=/html/body/input",
      description: "type username",
      method: "type",
      arguments: ["%username%"],
    };

    const entry: CachedActEntry = {
      version: 1,
      instruction: "type %username% into the field",
      url: "https://example.com",
      variableKeys: ["username"],
      actions: [action],
    };

    const storage = createFakeStorage(entry);
    // Keep a handle on the logger so the miss message can be asserted below.
    const logger = vi.fn();
    const cache = new ActCache({
      storage,
      logger,
      getActHandler: () => null as unknown as ActHandler,
      getDefaultLlmClient: () => ({}) as LLMClient,
      domSettleTimeoutMs: undefined,
    });

    // Context missing the username variable value
    const context: ActCacheContext = {
      instruction: "type %username% into the field",
      cacheKey: "test-key",
      pageUrl: "https://example.com",
      variableKeys: ["username"],
      variables: {}, // Missing username value!
    };

    const result = await cache.tryReplay(context, {} as Page);

    // Should return null (cache miss)
    expect(result).toBeNull();

    // Should log the miss reason
    expect(logger).toHaveBeenCalledWith(
      expect.objectContaining({
        category: "cache",
        message: "act cache miss: missing variables for replay",
        level: 2,
      }),
    );
  });

  it("handles multiple variables correctly", async () => {
    const storage = {
      enabled: true,
      readJson: vi.fn(),
      writeJson: vi.fn().mockResolvedValue({}),
      directory: "/tmp/cache",
    } as unknown as CacheStorage;

    const cache = new ActCache({
      storage,
      logger: vi.fn(),
      getActHandler: () => null as unknown as ActHandler,
      getDefaultLlmClient: () => ({}) as LLMClient,
      domSettleTimeoutMs: undefined,
    });

    const fakePage = {
      url: vi.fn().mockResolvedValue("https://example.com"),
    } as unknown as Page;

    // Context with multiple variables
    const context1 = await cache.prepareContext(
      "fill %username% and %password%",
      fakePage,
      { username: "user1", password: "pass1" },
    );

    const context2 = await cache.prepareContext(
      "fill %username% and %password%",
      fakePage,
      { username: "user2", password: "pass2" },
    );

    // Same cache key despite different values
    expect(context1?.cacheKey).toBe(context2?.cacheKey);

    // Variable keys should be sorted
    expect(context1?.variableKeys).toEqual(["password", "username"]);
    expect(context2?.variableKeys).toEqual(["password", "username"]);
  });
});


================================================
FILE: packages/core/tests/integration/agent-abort-signal.spec.ts
================================================
import { test, expect } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import { v3TestConfig } from "./v3.config.js";
import { AgentAbortError } from "../../lib/v3/types/public/sdkErrors.js";

/**
 * Integration tests for passing an AbortSignal to agent.execute(), in both
 * non-streaming and streaming modes. Each test gets a fresh V3 instance
 * created with `experimental: true` and navigates to https://example.com
 * before running the agent.
 */
test.describe("Stagehand agent abort signal", () => {
  let v3: V3;

  test.beforeEach(async () => {
    v3 = new V3({
      ...v3TestConfig,
      experimental: true,
    });
    await v3.init();
  });

  test.afterEach(async () => {
    // Best-effort cleanup: errors from close() are deliberately ignored.
    await v3?.close?.().catch(() => {});
  });

  test("non-streaming: abort signal stops execution and throws AgentAbortError", async () => {
    test.setTimeout(60000);

    const agent = v3.agent({
      model: "anthropic/claude-haiku-4-5-20251001",
    });

    const page = v3.context.pages()[0];
    await page.goto("https://example.com");

    const controller = new AbortController();

    // Abort after 500ms - should be enough for the LLM to start but not finish
    setTimeout(() => controller.abort(), 500);

    await expect(
      agent.execute({
        instruction:
          "Describe every visual element on this page in extreme detail. Describe at least 100 different elements.",
        maxSteps: 50,
        signal: controller.signal,
      }),
    ).rejects.toThrow(AgentAbortError);
  });

  test("streaming: abort signal stops stream and rejects result with AgentAbortError", async () => {
    test.setTimeout(60000);

    const agent = v3.agent({
      stream: true,
      model: "anthropic/claude-haiku-4-5-20251001",
    });

    const page = v3.context.pages()[0];
    await page.goto("https://example.com");

    const controller = new AbortController();

    // Abort after 500ms
    setTimeout(() => controller.abort(), 500);

    const streamResult = await agent.execute({
      instruction:
        "Describe every visual element on this page in extreme detail. Describe at least 100 different elements.",
      maxSteps: 50,
      signal: controller.signal,
    });

    // Handle both stream consumption and result promise together
    // The result promise will reject with AgentAbortError when aborted
    const consumeStream = async () => {
      // eslint-disable-next-line @typescript-eslint/no-unused-vars
      for await (const _ of streamResult.textStream) {
        // Just consume chunks until stream ends
      }
    };

    // Both should complete - stream ends and result rejects
    // allSettled never rejects, so the outcome of `result` can be inspected
    // regardless of how stream consumption ended.
    const [, resultError] = await Promise.allSettled([
      consumeStream(),
      streamResult.result,
    ]);

    // The result should have rejected with AgentAbortError
    expect(resultError.status).toBe("rejected");
    expect((resultError as PromiseRejectedResult).reason).toBeInstanceOf(
      AgentAbortError,
    );
  });

  test("non-streaming: already aborted signal throws AgentAbortError immediately", async () => {
    test.setTimeout(20000);

    const agent = v3.agent({
      model: "anthropic/claude-haiku-4-5-20251001",
    });

    const page = v3.context.pages()[0];
    await page.goto("https://example.com");

    // Create an already aborted controller
    const controller = new AbortController();
    controller.abort();

    await expect(
      agent.execute({
        instruction: "This should not run.",
        maxSteps: 3,
        signal: controller.signal,
      }),
    ).rejects.toThrow(AgentAbortError);
  });

  test("non-streaming: execution completes normally without abort signal", async () => {
    test.setTimeout(60000);

    const agent = v3.agent({
      model: "anthropic/claude-haiku-4-5-20251001",
    });

    const page = v3.context.pages()[0];
    await page.goto("https://example.com");

    // No signal provided - should complete normally
    const result = await agent.execute({
      instruction: "Describe this page briefly.",
      maxSteps: 3,
    });

    expect(result.success).toBe(true);
    expect(result.completed).toBe(true);
  });

  test("streaming: execution completes normally without abort signal", async () => {
    test.setTimeout(60000);

    const agent = v3.agent({
      stream: true,
      model: "anthropic/claude-haiku-4-5-20251001",
    });

    const page = v3.context.pages()[0];
    await page.goto("https://example.com");

    // No signal provided - should complete normally
    const streamResult = await agent.execute({
      instruction: "Describe this page briefly.",
      maxSteps: 3,
    });

    // Consume the stream first
    // eslint-disable-next-line @typescript-eslint/no-unused-vars
    for await (const _ of streamResult.textStream) {
      // Just consume
    }

    // Now get the final result
    const result = await streamResult.result;

    expect(result.success).toBe(true);
    expect(result.completed).toBe(true);
  });
});


================================================
FILE: packages/core/tests/integration/agent-cache-self-heal.spec.ts
================================================
import { test, expect } from "@playwright/test";
import fs from "fs/promises";
import path from "path";
import { V3 } from "../../lib/v3/v3.js";
import { v3TestConfig } from "./v3.config.js";
import type {
  AgentReplayActStep,
  AgentReplayFillFormStep,
  CachedAgentEntry,
} from "../../lib/v3/types/private/cache.js";

/**
 * End-to-end test: runs an agent once to populate the on-disk agent cache,
 * corrupts the first cached selector, runs the same instruction again, and
 * checks that the cache file ends up holding the original selector again.
 */
test.describe("Agent cache self-heal (e2e)", () => {
  let v3: V3;
  let cacheDir: string;

  // eslint-disable-next-line no-empty-pattern
  test.beforeEach(async ({}, testInfo) => {
    // Each test gets its own temporary cache directory under the test's
    // output directory.
    await fs.mkdir(testInfo.outputDir, { recursive: true });
    cacheDir = await fs.mkdtemp(path.join(testInfo.outputDir, "agent-cache-"));
    v3 = new V3({
      ...v3TestConfig,
      cacheDir,
      selfHeal: true,
    });
    await v3.init();
  });

  test.afterEach(async () => {
    // Best-effort cleanup: errors from close() are deliberately ignored.
    await v3?.close?.().catch(() => {});
  });

  test("replays heal corrupted selectors", async () => {
    test.setTimeout(120_000);

    const agent = v3.agent({
      model: "anthropic/claude-haiku-4-5-20251001",
    });
    const page = v3.context.pages()[0];
    const url =
      "https://browserbase.github.io/stagehand-eval-sites/sites/shadow-dom/";
    const instruction = "click the button";

    // First run: execute the instruction and let the cache entry be written.
    await page.goto(url, { waitUntil: "networkidle" });
    const firstResult = await agent.execute({ instruction, maxSteps: 20 });
    expect(firstResult.success).toBe(true);

    const cachePath = await locateAgentCacheFile(cacheDir);
    const originalEntry = await readCacheEntry(cachePath);
    const originalActionStep = findFirstActionStep(originalEntry);
    expect(originalActionStep).toBeDefined();
    // Capture the selector before the entry object is mutated below.
    const originalSelector = originalActionStep?.actions?.[0]?.selector;
    expect(typeof originalSelector).toBe("string");

    // Corrupt the cached selector so the replay needs to self-heal.
    if (originalActionStep?.actions?.[0]) {
      originalActionStep.actions[0].selector = "xpath=/yeee";
    }
    await fs.writeFile(
      cachePath,
      JSON.stringify(originalEntry, null, 2),
      "utf8",
    );

    // Second run should replay from cache, self-heal, and update the file.
    await page.goto(url, { waitUntil: "networkidle" });
    const replayResult = await agent.execute({ instruction, maxSteps: 20 });
    expect(replayResult.success).toBe(true);

    const healedEntry = await readCacheEntry(cachePath);
    const healedActionStep = findFirstActionStep(healedEntry);
    expect(healedActionStep?.actions?.[0]?.selector).toBe(originalSelector);
    expect(healedActionStep?.actions?.[0]?.selector).not.toBe("xpath=/yeee");
    // A changed timestamp shows the cache file was rewritten by the replay.
    expect(healedEntry.timestamp).not.toBe(originalEntry.timestamp);
  });
});

/**
 * Polls `cacheDir` every 200 ms, for up to 10 seconds, until it contains a
 * file whose name starts with `agent-`.
 *
 * @returns Path of the first matching entry in directory-listing order.
 * @throws Error when no matching file appears before the deadline.
 */
async function locateAgentCacheFile(cacheDir: string): Promise<string> {
  const giveUpAt = Date.now() + 10_000;
  const pause = (ms: number) =>
    new Promise((resolve) => setTimeout(resolve, ms));

  while (Date.now() < giveUpAt) {
    const names = await fs.readdir(cacheDir);
    const firstAgentFile = names.find((name) => name.startsWith("agent-"));
    if (firstAgentFile !== undefined) {
      return path.join(cacheDir, firstAgentFile);
    }
    await pause(200);
  }
  throw new Error("Timed out waiting for agent cache entry to be written");
}

/**
 * Reads the file at `cachePath` as UTF-8 and parses it as JSON.
 * The parsed value is cast to CachedAgentEntry without validation.
 */
async function readCacheEntry(cachePath: string): Promise<CachedAgentEntry> {
  const contents = await fs.readFile(cachePath, "utf8");
  const parsed: unknown = JSON.parse(contents);
  return parsed as CachedAgentEntry;
}

// Replay step types whose `actions` array is read by findFirstActionStep.
type StepWithActions = AgentReplayActStep | AgentReplayFillFormStep;

/**
 * Returns the first step in `entry.steps` that has a non-empty `actions`
 * array, or `undefined` when no step does.
 */
function findFirstActionStep(
  entry: CachedAgentEntry,
): StepWithActions | undefined {
  for (const step of entry.steps) {
    const candidate = step as StepWithActions;
    const { actions } = candidate;
    if (Array.isArray(actions) && actions.length > 0) {
      return candidate;
    }
  }
  return undefined;
}


================================================
FILE: packages/core/tests/integration/agent-callbacks.spec.ts
================================================
import { test, expect } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import { v3TestConfig } from "./v3.config.js";
import type { StepResult, ToolSet } from "ai";
import { StreamingCallbacksInNonStreamingModeError } from "../../lib/v3/types/public/sdkErrors.js";

/**
 * Integration tests for the `callbacks` option of agent.execute():
 * - callbacks usable without streaming (onStepFinish, prepareStep),
 * - callbacks in streaming mode (adds onChunk and onFinish),
 * - rejection of streaming-only callbacks when the agent is not streaming,
 * - several callbacks combined in one call.
 * Each test gets a fresh V3 instance and navigates to https://example.com.
 */
test.describe("Stagehand agent callbacks behavior", () => {
  let v3: V3;

  test.beforeEach(async () => {
    v3 = new V3({
      ...v3TestConfig,
      experimental: true, // Required for callbacks and streaming
    });
    await v3.init();
  });

  test.afterEach(async () => {
    // Best-effort cleanup: errors from close() are deliberately ignored.
    await v3?.close?.().catch(() => {});
  });

  // Agents in this group are created without `stream: true`.
  test.describe("Non-streaming callbacks (stream: false)", () => {
    test("onStepFinish callback is called for each step", async () => {
      test.setTimeout(60000);

      const stepFinishEvents: StepResult<ToolSet>[] = [];

      const agent = v3.agent({
        model: "anthropic/claude-haiku-4-5-20251001",
      });

      const page = v3.context.pages()[0];
      await page.goto("https://example.com");

      await agent.execute({
        instruction:
          "What is the title of this page? Mark the task as complete after answering.",
        maxSteps: 5,
        callbacks: {
          onStepFinish: async (event) => {
            stepFinishEvents.push(event);
          },
        },
      });

      // Should have at least one step finish event
      expect(stepFinishEvents.length).toBeGreaterThan(0);

      // Each event should have expected properties
      for (const event of stepFinishEvents) {
        expect(event).toHaveProperty("finishReason");
        expect(event).toHaveProperty("text");
      }
    });

    test("prepareStep callback is called before each step", async () => {
      test.setTimeout(60000);

      let prepareStepCallCount = 0;

      const agent = v3.agent({
        model: "anthropic/claude-haiku-4-5-20251001",
      });

      const page = v3.context.pages()[0];
      await page.goto("https://example.com");

      await agent.execute({
        instruction: "Simply describe the page briefly.",
        maxSteps: 3,
        callbacks: {
          // Returns the step context unchanged; the test only counts calls.
          prepareStep: async (stepContext) => {
            prepareStepCallCount++;
            return stepContext;
          },
        },
      });

      // prepareStep should have been called at least once
      expect(prepareStepCallCount).toBeGreaterThan(0);
    });

    test("callbacks receive tool call information", async () => {
      test.setTimeout(60000);

      const toolCalls: Array<{ toolName: string; input: unknown }> = [];

      const agent = v3.agent({
        model: "anthropic/claude-haiku-4-5-20251001",
      });

      const page = v3.context.pages()[0];
      await page.goto("https://example.com");

      await agent.execute({
        instruction:
          "Take a screenshot and describe what you see briefly. Then mark the task as complete.",
        maxSteps: 3,
        callbacks: {
          onStepFinish: async (event) => {
            if (event.toolCalls) {
              for (const tc of event.toolCalls) {
                toolCalls.push({
                  toolName: tc.toolName,
                  input: tc.input,
                });
              }
            }
          },
        },
      });

      // Should have captured at least one tool call (e.g. screenshot)
      expect(toolCalls.length).toBeGreaterThan(0);
      expect(
        toolCalls.some(
          (tc) => tc.toolName === "screenshot" || tc.toolName === "ariaTree",
        ),
      ).toBe(true);
    });
  });

  // Agents in this group are created with `stream: true`; every test drains
  // textStream and awaits `result` before asserting.
  test.describe("Streaming callbacks (stream: true)", () => {
    test("onStepFinish callback is called for each step in stream mode", async () => {
      test.setTimeout(60000);

      const stepFinishEvents: StepResult<ToolSet>[] = [];

      const agent = v3.agent({
        stream: true,
        model: "anthropic/claude-haiku-4-5-20251001",
      });

      const page = v3.context.pages()[0];
      await page.goto("https://example.com");

      const streamResult = await agent.execute({
        instruction: "What is this page? Describe it briefly.",
        maxSteps: 5,
        callbacks: {
          onStepFinish: async (event) => {
            stepFinishEvents.push(event);
          },
        },
      });

      // Consume the stream
      // eslint-disable-next-line @typescript-eslint/no-unused-vars
      for await (const _ of streamResult.textStream) {
        // Just consume
      }

      // Wait for result to complete
      await streamResult.result;

      // Should have at least one step finish event
      expect(stepFinishEvents.length).toBeGreaterThan(0);
    });

    test("onChunk callback is called for each chunk", async () => {
      test.setTimeout(60000);

      let chunkCount = 0;

      const agent = v3.agent({
        stream: true,
        model: "anthropic/claude-haiku-4-5-20251001",
      });

      const page = v3.context.pages()[0];
      await page.goto("https://example.com");

      const streamResult = await agent.execute({
        instruction: "Say hello briefly and describe the page.",
        maxSteps: 3,
        callbacks: {
          onChunk: async () => {
            chunkCount++;
          },
        },
      });

      // Consume the stream
      // eslint-disable-next-line @typescript-eslint/no-unused-vars
      for await (const _ of streamResult.textStream) {
        // Just consume
      }

      await streamResult.result;

      // Should have received chunks
      expect(chunkCount).toBeGreaterThan(0);
    });

    test("onFinish callback is called when stream completes", async () => {
      test.setTimeout(60000);

      let finishCalled = false;
      let finishEvent: unknown = null;

      const agent = v3.agent({
        stream: true,
        model: "anthropic/claude-haiku-4-5-20251001",
      });

      const page = v3.context.pages()[0];
      await page.goto("https://example.com");

      const streamResult = await agent.execute({
        instruction: "Simply describe the page briefly.",
        maxSteps: 3,
        callbacks: {
          onFinish: (event) => {
            finishCalled = true;
            finishEvent = event;
          },
        },
      });

      // Consume the stream
      // eslint-disable-next-line @typescript-eslint/no-unused-vars
      for await (const _ of streamResult.textStream) {
        // Just consume
      }

      await streamResult.result;

      // onFinish should have been called
      expect(finishCalled).toBe(true);
      expect(finishEvent).not.toBeNull();
    });

    test("prepareStep callback works in stream mode", async () => {
      test.setTimeout(60000);

      let prepareStepCallCount = 0;

      const agent = v3.agent({
        stream: true,
        model: "anthropic/claude-haiku-4-5-20251001",
      });

      const page = v3.context.pages()[0];
      await page.goto("https://example.com");

      const streamResult = await agent.execute({
        instruction: "Simply describe the page briefly.",
        maxSteps: 3,
        callbacks: {
          prepareStep: async (stepContext) => {
            prepareStepCallCount++;
            return stepContext;
          },
        },
      });

      // Consume the stream
      // eslint-disable-next-line @typescript-eslint/no-unused-vars
      for await (const _ of streamResult.textStream) {
        // Just consume
      }

      await streamResult.result;

      // prepareStep should have been called at least once
      expect(prepareStepCallCount).toBeGreaterThan(0);
    });
  });

  // Each test passes a streaming-only callback (cast to `never` to get past
  // the type checker) to a non-streaming agent. If execute() does not throw,
  // the sentinel Error thrown inside the `try` lands in the `catch` and fails
  // the instanceof assertion.
  test.describe("Streaming-only callbacks runtime validation", () => {
    test("throws StreamingCallbacksInNonStreamingModeError when onChunk is used", async () => {
      const agent = v3.agent({
        model: "anthropic/claude-haiku-4-5-20251001",
      });

      const page = v3.context.pages()[0];
      await page.goto("https://example.com");

      try {
        await agent.execute({
          instruction: "test",
          callbacks: {
            onChunk: (() => {}) as never,
          },
        });
        throw new Error("Expected error to be thrown");
      } catch (error) {
        expect(error).toBeInstanceOf(StreamingCallbacksInNonStreamingModeError);
        expect(
          (error as StreamingCallbacksInNonStreamingModeError).invalidCallbacks,
        ).toEqual(["onChunk"]);
      }
    });

    test("throws StreamingCallbacksInNonStreamingModeError when onFinish is used", async () => {
      const agent = v3.agent({
        model: "anthropic/claude-haiku-4-5-20251001",
      });

      const page = v3.context.pages()[0];
      await page.goto("https://example.com");

      try {
        await agent.execute({
          instruction: "test",
          callbacks: {
            onFinish: (() => {}) as never,
          },
        });
        throw new Error("Expected error to be thrown");
      } catch (error) {
        expect(error).toBeInstanceOf(StreamingCallbacksInNonStreamingModeError);
        expect(
          (error as StreamingCallbacksInNonStreamingModeError).invalidCallbacks,
        ).toEqual(["onFinish"]);
      }
    });

    test("throws StreamingCallbacksInNonStreamingModeError when onError is used", async () => {
      const agent = v3.agent({
        model: "anthropic/claude-haiku-4-5-20251001",
      });

      const page = v3.context.pages()[0];
      await page.goto("https://example.com");

      try {
        await agent.execute({
          instruction: "test",
          callbacks: {
            onError: (() => {}) as never,
          },
        });
        throw new Error("Expected error to be thrown");
      } catch (error) {
        expect(error).toBeInstanceOf(StreamingCallbacksInNonStreamingModeError);
        expect(
          (error as StreamingCallbacksInNonStreamingModeError).invalidCallbacks,
        ).toEqual(["onError"]);
      }
    });

    test("throws StreamingCallbacksInNonStreamingModeError when onAbort is used", async () => {
      const agent = v3.agent({
        model: "anthropic/claude-haiku-4-5-20251001",
      });

      const page = v3.context.pages()[0];
      await page.goto("https://example.com");

      try {
        await agent.execute({
          instruction: "test",
          callbacks: {
            onAbort: (() => {}) as never,
          },
        });
        throw new Error("Expected error to be thrown");
      } catch (error) {
        expect(error).toBeInstanceOf(StreamingCallbacksInNonStreamingModeError);
        expect(
          (error as StreamingCallbacksInNonStreamingModeError).invalidCallbacks,
        ).toEqual(["onAbort"]);
      }
    });

    test("error includes all invalid callbacks when multiple are used", async () => {
      const agent = v3.agent({
        model: "anthropic/claude-haiku-4-5-20251001",
      });

      const page = v3.context.pages()[0];
      await page.goto("https://example.com");

      try {
        await agent.execute({
          instruction: "test",
          callbacks: {
            onChunk: (() => {}) as never,
            onFinish: (() => {}) as never,
          },
        });
        throw new Error("Expected error to be thrown");
      } catch (error) {
        expect(error).toBeInstanceOf(StreamingCallbacksInNonStreamingModeError);
        expect(
          (error as StreamingCallbacksInNonStreamingModeError).invalidCallbacks,
        ).toEqual(["onChunk", "onFinish"]);
      }
    });
  });

  // Several callbacks supplied in a single execute() call.
  test.describe("Combined callbacks", () => {
    test("multiple callbacks can be used together", async () => {
      test.setTimeout(60000);

      let prepareStepCount = 0;
      let stepFinishCount = 0;

      const agent = v3.agent({
        model: "anthropic/claude-haiku-4-5-20251001",
      });

      const page = v3.context.pages()[0];
      await page.goto("https://example.com");

      await agent.execute({
        instruction: "Simply describe the page briefly.",
        maxSteps: 3,
        callbacks: {
          prepareStep: async (stepContext) => {
            prepareStepCount++;
            return stepContext;
          },
          onStepFinish: async () => {
            stepFinishCount++;
          },
        },
      });

      // Both callbacks should have been called
      expect(prepareStepCount).toBeGreaterThan(0);
      expect(stepFinishCount).toBeGreaterThan(0);
    });

    test("streaming with multiple callbacks", async () => {
      test.setTimeout(60000);

      let prepareStepCount = 0;
      let stepFinishCount = 0;
      let chunkCount = 0;
      let finishCalled = false;

      const agent = v3.agent({
        stream: true,
        model: "anthropic/claude-haiku-4-5-20251001",
      });

      const page = v3.context.pages()[0];
      await page.goto("https://example.com");

      const streamResult = await agent.execute({
        instruction: "Say hello briefly and describe the page.",
        maxSteps: 3,
        callbacks: {
          prepareStep: async (stepContext) => {
            prepareStepCount++;
            return stepContext;
          },
          onStepFinish: async () => {
            stepFinishCount++;
          },
          onChunk: async () => {
            chunkCount++;
          },
          onFinish: () => {
            finishCalled = true;
          },
        },
      });

      // Consume the stream
      // eslint-disable-next-line @typescript-eslint/no-unused-vars
      for await (const _ of streamResult.textStream) {
        // Just consume
      }

      await streamResult.result;

      // All callbacks should have been called
      expect(prepareStepCount).toBeGreaterThan(0);
      expect(stepFinishCount).toBeGreaterThan(0);
      expect(chunkCount).toBeGreaterThan(0);
      expect(finishCalled).toBe(true);
    });
  });
});


================================================
FILE: packages/core/tests/integration/agent-captcha-autosolve.spec.ts
================================================
import { test, expect } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import { getV3TestConfig } from "./v3.config.js";
import type { LogLine } from "../../lib/v3/types/public/logs.js";

// True when STAGEHAND_BROWSER_TARGET (compared case-insensitively) is
// "browserbase"; an unset variable is treated as "local".
const browserTarget = process.env.STAGEHAND_BROWSER_TARGET ?? "local";
const isBrowserbase = browserTarget.toLowerCase() === "browserbase";

// Browserbase-only suite: the session is created with `solveCaptchas: true`
// and the agent is then asked to submit Google's reCAPTCHA v2 demo form.
test.describe("Agent captcha auto-solve on Browserbase", () => {
  test.skip(!isBrowserbase, "Requires Browserbase environment");

  let v3: V3;
  let logs: LogLine[];

  test.beforeEach(async () => {
    logs = [];

    // Record every log line and echo it to stdout.
    const recordAndEcho = (line: LogLine) => {
      logs.push(line);
      console.log(`[${line.category}] ${line.message}`);
    };

    const config = getV3TestConfig({
      env: "BROWSERBASE",
      verbose: 2,
      logger: recordAndEcho,
      browserbaseSessionCreateParams: {
        browserSettings: { solveCaptchas: true },
      },
    });

    v3 = new V3(config);
    await v3.init();
    console.log("BB session URL:", v3.browserbaseSessionURL);
  });

  // Best-effort teardown; a rejected close() is swallowed.
  test.afterEach(async () => {
    await v3?.close?.().catch(() => {});
  });

  test("reCAPTCHA v2 auto-solve (Google demo)", async () => {
    test.setTimeout(180_000);

    // Google's official reCAPTCHA v2 demo — same URL the stealth team tests.
    // Wait only for domcontentloaded since BB's route interception can delay
    // the full load event.
    const demoPage = v3.context.pages()[0];
    await demoPage.goto("https://www.google.com/recaptcha/api2/demo", {
      waitUntil: "domcontentloaded",
    });

    // Fixed pause giving BB time to intercept the anchor request and solve
    // the captcha before the agent starts.
    const solveGraceMs = 30_000;
    await new Promise((resolve) => setTimeout(resolve, solveGraceMs));

    const domAgent = v3.agent({
      mode: "dom",
      model: "anthropic/claude-haiku-4-5-20251001",
    });

    const outcome = await domAgent.execute({
      instruction:
        'Click the "Submit" button and report the exact text shown on the result page.',
      maxSteps: 15,
    });

    console.log("reCAPTCHA v2 result:", outcome.message);

    // The run must finish and its message must mention "success".
    expect(outcome.completed).toBe(true);
    expect(outcome.message.toLowerCase()).toContain("success");
  });
});


================================================
FILE: packages/core/tests/integration/agent-experimental-validation.spec.ts
================================================
import { test, expect } from "@playwright/test";
import { z } from "zod";
import { tool } from "ai";
import { V3 } from "../../lib/v3/v3.js";
import { v3TestConfig } from "./v3.config.js";
import {
  ExperimentalNotConfiguredError,
  StagehandInvalidArgumentError,
} from "../../lib/v3/types/public/sdkErrors.js";

// Define a mock custom tool for testing
// Custom tool fixture: takes a single string `input` and returns it prefixed
// with "Processed: ".
const mockCustomTool = tool({
  description: "A mock tool for testing",
  inputSchema: z.object({
    input: z.string().describe("The input string"),
  }),
  execute: async (args) => `Processed: ${args.input}`,
});

test.describe("Stagehand agent experimental feature validation", () => {
  // Option combinations that are rejected with StagehandInvalidArgumentError.
  // The second test shows the rejection also happens with `experimental: true`.
  test.describe("Invalid argument errors", () => {
    let v3: V3;

    // Fresh non-experimental instance for every test.
    test.beforeEach(async () => {
      v3 = new V3({
        ...v3TestConfig,
        experimental: false,
      });
      await v3.init();
    });

    // Best-effort teardown: a rejected (or repeated) close() is swallowed so
    // it cannot fail the test.
    test.afterEach(async () => {
      await v3?.close?.().catch(() => {});
    });

    test("throws StagehandInvalidArgumentError when CUA and streaming are both enabled", async () => {
      try {
        v3.agent({
          cua: true,
          stream: true,
          model: "anthropic/claude-sonnet-4-20250514",
        });
        // Only reached when agent() accepted the options. The sentinel is
        // caught below and fails the instance check.
        throw new Error("Expected error to be thrown");
      } catch (error) {
        expect(error).toBeInstanceOf(StagehandInvalidArgumentError);
        expect((error as Error).message).toContain("streaming");
        expect((error as Error).message).toContain("not supported with CUA");
      }
    });

    test("throws StagehandInvalidArgumentError for CUA + streaming even with experimental: true", async () => {
      // Close the non-experimental instance
      await v3.close();

      // Create an experimental instance
      const v3Experimental = new V3({
        ...v3TestConfig,
        experimental: true,
      });

      try {
        // init() runs inside the try so the instance is still closed when
        // startup itself fails.
        await v3Experimental.init();

        try {
          v3Experimental.agent({
            cua: true,
            stream: true,
            model: "anthropic/claude-sonnet-4-20250514",
          });
          throw new Error("Expected error to be thrown");
        } catch (error) {
          expect(error).toBeInstanceOf(StagehandInvalidArgumentError);
          expect((error as Error).message).toContain("streaming");
          expect((error as Error).message).toContain("not supported with CUA");
        }
      } finally {
        // Swallow close() failures, as afterEach does, so a teardown error
        // cannot replace the error that actually failed the test.
        await v3Experimental.close().catch(() => {});
      }
    });
  });

  // With `experimental: false`, each gated feature must be rejected with an
  // ExperimentalNotConfiguredError whose message names the feature.
  test.describe("Experimental feature errors without experimental: true", () => {
    let v3: V3;

    /**
     * Runs `action` and resolves with whatever it throws or rejects with.
     * When `action` completes normally, resolves with a sentinel Error so the
     * caller's instance check fails.
     */
    const captureFailure = async (
      action: () => Promise<unknown>,
    ): Promise<unknown> => {
      try {
        await action();
      } catch (error) {
        return error;
      }
      return new Error("Expected error to be thrown");
    };

    test.beforeEach(async () => {
      v3 = new V3({ ...v3TestConfig, experimental: false });
      await v3.init();
    });

    // Best-effort teardown; a rejected close() is swallowed.
    test.afterEach(async () => {
      await v3?.close?.().catch(() => {});
    });

    test("throws ExperimentalNotConfiguredError for MCP integrations", async () => {
      const mcpAgent = v3.agent({
        model: "anthropic/claude-sonnet-4-20250514",
        integrations: ["https://mcp.example.com"],
      });

      const failure = await captureFailure(() => mcpAgent.execute("test"));

      expect(failure).toBeInstanceOf(ExperimentalNotConfiguredError);
      expect((failure as Error).message).toContain(
        "MCP integrations and custom tools",
      );
    });

    test("throws ExperimentalNotConfiguredError for custom tools", async () => {
      const toolAgent = v3.agent({
        model: "anthropic/claude-sonnet-4-20250514",
        tools: {
          mockCustomTool,
        },
      });

      const failure = await captureFailure(() => toolAgent.execute("test"));

      expect(failure).toBeInstanceOf(ExperimentalNotConfiguredError);
      expect((failure as Error).message).toContain(
        "MCP integrations and custom tools",
      );
    });

    test("throws ExperimentalNotConfiguredError for streaming mode", async () => {
      // Agent creation is part of the guarded action here, so an error from
      // either agent() or execute() is captured.
      const failure = await captureFailure(async () => {
        const streamingAgent = v3.agent({
          stream: true,
          model: "anthropic/claude-sonnet-4-20250514",
        });
        await streamingAgent.execute("test instruction");
      });

      expect(failure).toBeInstanceOf(ExperimentalNotConfiguredError);
      expect((failure as Error).message).toContain("streaming");
    });

    test("throws ExperimentalNotConfiguredError for callbacks", async () => {
      const plainAgent = v3.agent({
        model: "anthropic/claude-sonnet-4-20250514",
      });

      const failure = await captureFailure(() =>
        plainAgent.execute({
          instruction: "test",
          callbacks: {
            onStepFinish: async () => {},
          },
        }),
      );

      expect(failure).toBeInstanceOf(ExperimentalNotConfiguredError);
      expect((failure as Error).message).toContain("callbacks");
    });

    test("throws ExperimentalNotConfiguredError for abort signal", async () => {
      const plainAgent = v3.agent({
        model: "anthropic/claude-sonnet-4-20250514",
      });
      const abort = new AbortController();

      const failure = await captureFailure(() =>
        plainAgent.execute({
          instruction: "test",
          signal: abort.signal,
        }),
      );

      expect(failure).toBeInstanceOf(ExperimentalNotConfiguredError);
      expect((failure as Error).message).toContain("abort signal");
    });

    test("throws ExperimentalNotConfiguredError for message continuation", async () => {
      const plainAgent = v3.agent({
        model: "anthropic/claude-sonnet-4-20250514",
      });

      const failure = await captureFailure(() =>
        plainAgent.execute({
          instruction: "test",
          messages: [{ role: "user", content: "previous message" }],
        }),
      );

      expect(failure).toBeInstanceOf(ExperimentalNotConfiguredError);
      expect((failure as Error).message).toContain("message continuation");
    });

    test("throws ExperimentalNotConfiguredError listing multiple features", async () => {
      const plainAgent = v3.agent({
        model: "anthropic/claude-sonnet-4-20250514",
      });
      const abort = new AbortController();

      const failure = await captureFailure(() =>
        plainAgent.execute({
          instruction: "test",
          callbacks: { onStepFinish: async () => {} },
          signal: abort.signal,
          messages: [{ role: "user", content: "previous" }],
        }),
      );

      expect(failure).toBeInstanceOf(ExperimentalNotConfiguredError);

      // One error message is expected to name all three gated features.
      const text = (failure as Error).message;
      for (const feature of [
        "callbacks",
        "abort signal",
        "message continuation",
      ]) {
        expect(text).toContain(feature);
      }
    });
  });

  // CUA agents: MCP integrations are still gated behind the experimental
  // flag, while abort signals and message continuation are rejected as
  // invalid arguments, also when `experimental: true`.
  test.describe("CUA agent unsupported features", () => {
    let v3: V3;

    // Fresh non-experimental instance for every test.
    test.beforeEach(async () => {
      v3 = new V3({
        ...v3TestConfig,
        experimental: false,
      });
      await v3.init();
    });

    // Best-effort teardown: a rejected (or repeated) close() is swallowed so
    // it cannot fail the test.
    test.afterEach(async () => {
      await v3?.close?.().catch(() => {});
    });

    test("throws ExperimentalNotConfiguredError for CUA with integrations", async () => {
      // MCP integrations are still an experimental feature check (not unsupported)
      try {
        v3.agent({
          cua: true,
          model: "anthropic/claude-sonnet-4-20250514",
          integrations: ["https://mcp.example.com"],
        });
        // Only reached when agent() accepted the options. The sentinel is
        // caught below and fails the instance check.
        throw new Error("Expected error to be thrown");
      } catch (error) {
        expect(error).toBeInstanceOf(ExperimentalNotConfiguredError);
        expect((error as Error).message).toContain(
          "MCP integrations and custom tools",
        );
      }
    });

    test("throws StagehandInvalidArgumentError for CUA with abort signal (not supported)", async () => {
      const agent = v3.agent({
        cua: true,
        model: "anthropic/claude-sonnet-4-20250514",
      });

      const controller = new AbortController();
      try {
        await agent.execute({
          instruction: "test",
          signal: controller.signal,
        });
        throw new Error("Expected error to be thrown");
      } catch (error) {
        expect(error).toBeInstanceOf(StagehandInvalidArgumentError);
        expect((error as Error).message).toContain("abort signal");
        expect((error as Error).message).toContain("not supported with CUA");
      }
    });

    test("throws StagehandInvalidArgumentError for CUA with message continuation (not supported)", async () => {
      const agent = v3.agent({
        cua: true,
        model: "anthropic/claude-sonnet-4-20250514",
      });

      try {
        await agent.execute({
          instruction: "test",
          messages: [{ role: "user", content: "previous message" }],
        });
        throw new Error("Expected error to be thrown");
      } catch (error) {
        expect(error).toBeInstanceOf(StagehandInvalidArgumentError);
        expect((error as Error).message).toContain("message continuation");
        expect((error as Error).message).toContain("not supported with CUA");
      }
    });

    test("throws StagehandInvalidArgumentError for CUA with multiple unsupported features", async () => {
      const agent = v3.agent({
        cua: true,
        model: "anthropic/claude-sonnet-4-20250514",
      });

      const controller = new AbortController();
      try {
        await agent.execute({
          instruction: "test",
          signal: controller.signal,
          messages: [{ role: "user", content: "previous message" }],
        });
        throw new Error("Expected error to be thrown");
      } catch (error) {
        expect(error).toBeInstanceOf(StagehandInvalidArgumentError);
        // A single message is expected to list both features.
        const message = (error as Error).message;
        expect(message).toContain("abort signal");
        expect(message).toContain("message continuation");
        expect(message).toContain("are not supported with CUA");
      }
    });

    test("throws StagehandInvalidArgumentError for CUA unsupported features even with experimental: true", async () => {
      // Close the non-experimental instance
      await v3.close();

      // Create an experimental instance
      const v3Experimental = new V3({
        ...v3TestConfig,
        experimental: true,
      });

      try {
        // init() runs inside the try so the instance is still closed when
        // startup itself fails.
        await v3Experimental.init();

        const agent = v3Experimental.agent({
          cua: true,
          model: "anthropic/claude-sonnet-4-20250514",
        });

        const controller = new AbortController();
        try {
          await agent.execute({
            instruction: "test",
            signal: controller.signal,
          });
          throw new Error("Expected error to be thrown");
        } catch (error) {
          expect(error).toBeInstanceOf(StagehandInvalidArgumentError);
          expect((error as Error).message).toContain("not supported with CUA");
        }
      } finally {
        // Swallow close() failures, as afterEach does, so a teardown error
        // cannot replace the error that actually failed the test.
        await v3Experimental.close().catch(() => {});
      }
    });
  });

  // Agent configurations that must be accepted: agent() is expected not to
  // throw for any of them.
  test.describe("Valid configurations with experimental: true", () => {
    let v3: V3;

    // Fresh experimental instance for every test.
    test.beforeEach(async () => {
      v3 = new V3({
        ...v3TestConfig,
        experimental: true,
      });
      await v3.init();
    });

    // Best-effort teardown; a rejected close() is swallowed.
    test.afterEach(async () => {
      await v3?.close?.().catch(() => {});
    });

    test("allows CUA without streaming", () => {
      expect(() =>
        v3.agent({
          cua: true,
          model: "anthropic/claude-sonnet-4-20250514",
        }),
      ).not.toThrow();
    });

    test("allows streaming mode", () => {
      expect(() =>
        v3.agent({
          stream: true,
          model: "anthropic/claude-sonnet-4-20250514",
        }),
      ).not.toThrow();
    });

    test("allows basic agent without experimental features", async () => {
      // Uses its own non-experimental instance next to the suite-level one.
      const v3NonExperimental = new V3({
        ...v3TestConfig,
        experimental: false,
      });

      try {
        // init() runs inside the try so the instance is still closed when
        // startup itself fails.
        await v3NonExperimental.init();

        // This should work - just creating a basic agent with no experimental features
        expect(() =>
          v3NonExperimental.agent({
            model: "anthropic/claude-sonnet-4-20250514",
          }),
        ).not.toThrow();
      } finally {
        // Swallow close() failures, as afterEach does, so a teardown error
        // cannot replace the error that actually failed the test.
        await v3NonExperimental.close().catch(() => {});
      }
    });
  });
});


================================================
FILE: packages/core/tests/integration/agent-hybrid-mode.spec.ts
================================================
import { test, expect } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import { v3TestConfig } from "./v3.config.js";
import { createAgentTools } from "../../lib/v3/agent/tools/index.js";
import { buildAgentSystemPrompt } from "../../lib/v3/agent/prompts/agentSystemPrompt.js";
import type { StepResult, ToolSet } from "ai";

test.describe("Stagehand agent hybrid mode", () => {
  // Instance shared by the tests in this suite; reassigned before each test.
  let v3: V3;

  // Start a fresh V3 with `experimental: true` for every test.
  test.beforeEach(async () => {
    v3 = new V3({
      ...v3TestConfig,
      experimental: true,
    });
    await v3.init();
  });

  // Best-effort teardown: optional chaining tolerates a missing instance and
  // the empty catch swallows a rejected close() so it cannot fail the test.
  test.afterEach(async () => {
    await v3?.close?.().catch(() => {});
  });

  // Checks which tool names createAgentTools() exposes for each mode.
  test.describe("Tool filtering by mode", () => {
    test("DOM mode includes DOM-based tools and excludes coordinate-based tools", () => {
      const domTools = createAgentTools(v3, { mode: "dom" });

      // Tools expected in DOM mode
      const present = [
        "act",
        "fillForm",
        "ariaTree",
        "screenshot",
        "extract",
        "goto",
        "scroll",
        "wait",
        "navback",
        "keys",
        "think",
      ];
      for (const name of present) {
        expect(domTools).toHaveProperty(name);
      }

      // Coordinate-based tools must be absent in DOM mode
      const absent = [
        "click",
        "type",
        "dragAndDrop",
        "clickAndHold",
        "fillFormVision",
      ];
      for (const name of absent) {
        expect(domTools).not.toHaveProperty(name);
      }
    });

    test("Hybrid mode includes coordinate-based tools and excludes DOM fillForm", () => {
      const hybridTools = createAgentTools(v3, { mode: "hybrid" });

      // Coordinate-based tools expected in hybrid mode
      const coordinateTools = [
        "click",
        "type",
        "dragAndDrop",
        "clickAndHold",
        "fillFormVision",
      ];
      // Tools shared with DOM mode
      const commonTools = [
        "act",
        "ariaTree",
        "screenshot",
        "extract",
        "goto",
        "scroll",
        "wait",
        "navback",
        "keys",
        "think",
      ];
      for (const name of [...coordinateTools, ...commonTools]) {
        expect(hybridTools).toHaveProperty(name);
      }

      // The DOM-based fillForm must be absent in hybrid mode
      expect(hybridTools).not.toHaveProperty("fillForm");
    });

    test("Default mode is DOM when not specified", () => {
      const defaultTools = createAgentTools(v3, {});

      // With no mode given, the tool set should look like DOM mode
      expect(defaultTools).toHaveProperty("fillForm");
      for (const name of ["click", "type"]) {
        expect(defaultTools).not.toHaveProperty(name);
      }
    });
  });

  // Checks the text buildAgentSystemPrompt() produces for each mode and for
  // the optional custom-instruction and captcha settings.
  test.describe("System prompt generation", () => {
    // Arguments shared by every prompt built in this suite.
    const pageContext = {
      url: "https://example.com",
      executionInstruction: "Test instruction",
    };

    test("DOM mode system prompt emphasizes ariaTree and act tool", () => {
      const domPrompt = buildAgentSystemPrompt({ ...pageContext, mode: "dom" });

      // Tool names first, then the DOM-specific strategy lines
      const fragments = [
        "ariaTree",
        "act",
        "fillForm",
        "Use act tool for all clicking and typing",
        "Always check ariaTree first",
      ];
      for (const fragment of fragments) {
        expect(domPrompt).toContain(fragment);
      }
    });

    test("Hybrid mode system prompt emphasizes screenshot and coordinate tools", () => {
      const hybridPrompt = buildAgentSystemPrompt({
        ...pageContext,
        mode: "hybrid",
      });

      // Coordinate-based tool names first, then the hybrid-specific strategy lines
      const fragments = [
        "click",
        "type",
        "fillFormVision",
        "dragAndDrop",
        "Use specific tools (click, type) when elements are visible",
        "Always use screenshot",
      ];
      for (const fragment of fragments) {
        expect(hybridPrompt).toContain(fragment);
      }
    });

    test("System prompt includes custom instructions when provided", () => {
      const customInstructions = "Always be polite and thorough";
      const prompt = buildAgentSystemPrompt({
        ...pageContext,
        mode: "dom",
        systemInstructions: customInstructions,
      });

      // Both the literal marker and the supplied text must appear
      expect(prompt).toContain("customInstructions");
      expect(prompt).toContain(customInstructions);
    });

    test("System prompt includes captcha instructions when captchasAutoSolve is true", () => {
      const prompt = buildAgentSystemPrompt({
        ...pageContext,
        mode: "dom",
        captchasAutoSolve: true,
      });

      for (const fragment of ["captcha", "automatically detected and solved"]) {
        expect(prompt).toContain(fragment);
      }
    });

    test("System prompt does not include captcha instructions when captchasAutoSolve is false", () => {
      const prompt = buildAgentSystemPrompt({
        ...pageContext,
        mode: "dom",
        captchasAutoSolve: false,
      });

      expect(prompt).not.toContain("automatically detected and solved");
    });
  });

  // v3.agent() must return an object exposing `execute` for every mode
  // setting exercised here.
  test.describe("Agent creation with mode", () => {
    // Model used by every agent created in this suite.
    const model = "anthropic/claude-haiku-4-5-20251001";

    test("agent({ mode: 'dom' }) creates DOM-mode agent", () => {
      const domAgent = v3.agent({ mode: "dom", model });

      expect(domAgent).toHaveProperty("execute");
    });

    test("agent({ mode: 'hybrid' }) creates hybrid-mode agent", () => {
      const hybridAgent = v3.agent({ mode: "hybrid", model });

      expect(hybridAgent).toHaveProperty("execute");
    });

    test("agent without mode defaults to DOM mode", () => {
      const defaultAgent = v3.agent({ model });

      expect(defaultAgent).toHaveProperty("execute");
    });

    test("hybrid mode can be combined with streaming", () => {
      const streamingHybridAgent = v3.agent({
        mode: "hybrid",
        stream: true,
        model,
      });

      expect(streamingHybridAgent).toHaveProperty("execute");
    });
  });

  // Live agent runs: records the tool calls reported through onStepFinish and
  // checks that the tool named in the instruction was used.
  test.describe("Hybrid mode execution", () => {
    test("hybrid mode agent uses coordinate-based tools when available", async () => {
      test.setTimeout(90000);

      const recorded: Array<{ toolName: string; input: unknown }> = [];

      const hybridAgent = v3.agent({
        mode: "hybrid",
        model: "anthropic/claude-haiku-4-5-20251001",
      });

      const firstPage = v3.context.pages()[0];
      await firstPage.goto("https://example.com");

      await hybridAgent.execute({
        instruction:
          "Take a screenshot to see the page, then describe what you see briefly and mark the task as complete.",
        maxSteps: 5,
        callbacks: {
          // Collect name and input of every tool call in the finished step.
          onStepFinish: async (event: StepResult<ToolSet>) => {
            for (const call of event.toolCalls ?? []) {
              recorded.push({ toolName: call.toolName, input: call.input });
            }
          },
        },
      });

      // At least one tool call must have been captured
      expect(recorded.length).toBeGreaterThan(0);

      // Screenshot must be among the tools used
      const usedNames = recorded.map((call) => call.toolName);
      expect(usedNames).toContain("screenshot");
    });

    test("DOM mode agent uses DOM-based tools", async () => {
      test.setTimeout(90000);

      const recorded: Array<{ toolName: string; input: unknown }> = [];

      const domAgent = v3.agent({
        mode: "dom",
        model: "anthropic/claude-haiku-4-5-20251001",
      });

      const firstPage = v3.context.pages()[0];
      await firstPage.goto("https://example.com");

      await domAgent.execute({
        instruction:
          "Use the ariaTree to understand the page, then provide the final requested output or a summary of the page.",
        maxSteps: 5,
        callbacks: {
          // Collect name and input of every tool call in the finished step.
          onStepFinish: async (event: StepResult<ToolSet>) => {
            for (const call of event.toolCalls ?? []) {
              recorded.push({ toolName: call.toolName, input: call.input });
            }
          },
        },
      });

      // At least one tool call must have been captured
      expect(recorded.length).toBeGreaterThan(0);

      // ariaTree must be among the tools used
      const usedNames = recorded.map((call) => call.toolName);
      expect(usedNames).toContain("ariaTree");
    });
  });

  // Both modes must expose a `scroll` entry whose value is an object.
  test.describe("Scroll tool variants by mode", () => {
    test("DOM mode uses simple scroll tool without coordinates", () => {
      const domTools = createAgentTools(v3, { mode: "dom" });

      expect(domTools).toHaveProperty("scroll");
      // Only existence and typeof are checked for the DOM scroll tool
      const scrollKind = typeof domTools.scroll;
      expect(scrollKind).toBe("object");
    });

    test("Hybrid mode uses vision scroll tool with optional coordinates", () => {
      const hybridTools = createAgentTools(v3, { mode: "hybrid" });

      expect(hybridTools).toHaveProperty("scroll");
      // Only existence and typeof are checked for the hybrid scroll tool
      const scrollKind = typeof hybridTools.scroll;
      expect(scrollKind).toBe("object");
    });
  });

  // The `keys` tool must be present regardless of mode.
  test.describe("Keys tool availability in both modes", () => {
    test("Keys tool is available in DOM mode", () => {
      const domTools = createAgentTools(v3, { mode: "dom" });

      expect(domTools).toHaveProperty("keys");
    });

    test("Keys tool is available in hybrid mode", () => {
      const hybridTools = createAgentTools(v3, { mode: "hybrid" });

      expect(hybridTools).toHaveProperty("keys");
    });
  });

  // The `think` tool must be present regardless of mode.
  test.describe("Think tool availability", () => {
    test("Think tool is available in DOM mode", () => {
      const domTools = createAgentTools(v3, { mode: "dom" });

      expect(domTools).toHaveProperty("think");
    });

    test("Think tool is available in hybrid mode", () => {
      const hybridTools = createAgentTools(v3, { mode: "hybrid" });

      expect(hybridTools).toHaveProperty("think");
    });
  });
});


================================================
FILE: packages/core/tests/integration/agent-message-continuation.spec.ts
================================================
import { test, expect } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import { v3TestConfig } from "./v3.config.js";
import type { ModelMessage } from "ai";

// Covers the `messages` transcript on agent results: it is returned, can be
// passed into a later execute() call, contains tool calls and tool results,
// and is also present on streaming results.
test.describe("Stagehand agent message continuation", () => {
  let v3: V3;

  test.beforeEach(async () => {
    v3 = new V3({ ...v3TestConfig, experimental: true });
    await v3.init();
  });

  // Best-effort teardown; a rejected close() is swallowed.
  test.afterEach(async () => {
    await v3?.close?.().catch(() => {});
  });

  test("execute returns messages in the result", async () => {
    test.setTimeout(60000);

    const agent = v3.agent({
      model: "anthropic/claude-haiku-4-5-20251001",
    });

    const firstPage = v3.context.pages()[0];
    await firstPage.goto("https://example.com");

    const outcome = await agent.execute({
      instruction: "What is the title of this page? Describe it briefly.",
      maxSteps: 5,
    });

    // The transcript must be a non-empty array
    const transcript = outcome.messages;
    expect(transcript).toBeDefined();
    expect(Array.isArray(transcript)).toBe(true);
    expect(transcript!.length).toBeGreaterThan(0);

    // It must open with the user's instruction
    expect(transcript![0].role).toBe("user");
  });

  test("can continue conversation with previous messages", async () => {
    test.setTimeout(120000);

    const agent = v3.agent({
      model: "anthropic/claude-haiku-4-5-20251001",
    });

    const firstPage = v3.context.pages()[0];
    await firstPage.goto("https://example.com");

    // Initial run
    const firstRun = await agent.execute({
      instruction: "What is the title of this page? Describe it briefly.",
      maxSteps: 5,
    });

    const firstTranscript = firstRun.messages;
    expect(firstTranscript).toBeDefined();
    expect(firstTranscript!.length).toBeGreaterThan(0);

    // Follow-up run seeded with the first run's transcript
    const secondRun = await agent.execute({
      instruction:
        "Based on what you just told me, is this a simple or complex website? Answer briefly.",
      maxSteps: 5,
      messages: firstTranscript,
    });

    const secondTranscript = secondRun.messages;
    expect(secondTranscript).toBeDefined();
    // The follow-up transcript includes the first conversation, so it must be longer
    expect(secondTranscript!.length).toBeGreaterThan(firstTranscript!.length);
  });

  test("messages include tool calls and results", async () => {
    test.setTimeout(60000);

    const agent = v3.agent({
      model: "anthropic/claude-haiku-4-5-20251001",
    });

    const firstPage = v3.context.pages()[0];
    await firstPage.goto("https://example.com");

    const outcome = await agent.execute({
      instruction:
        "Use the ariaTree tool to see the page, then describe what you found briefly.",
      maxSteps: 5,
    });

    const transcript = outcome.messages;
    expect(transcript).toBeDefined();

    // There must be at least one assistant message
    const fromAssistant = transcript!.filter(
      (m: ModelMessage) => m.role === "assistant",
    );
    expect(fromAssistant.length).toBeGreaterThan(0);

    // At least one assistant message must carry a tool-call part; messages
    // whose content is not an array cannot
    const sawToolCall = fromAssistant.some(
      (m: ModelMessage) =>
        Array.isArray(m.content) &&
        m.content.some(
          (part) => typeof part === "object" && part.type === "tool-call",
        ),
    );
    expect(sawToolCall).toBe(true);

    // At least one message must have the "tool" role
    const sawToolResult = transcript!.some(
      (m: ModelMessage) => m.role === "tool",
    );
    expect(sawToolResult).toBe(true);
  });

  test("streaming mode also returns messages", async () => {
    test.setTimeout(60000);

    const streamingAgent = v3.agent({
      stream: true,
      model: "anthropic/claude-haiku-4-5-20251001",
    });

    const firstPage = v3.context.pages()[0];
    await firstPage.goto("https://example.com");

    const stream = await streamingAgent.execute({
      instruction: "What is this page? Describe it briefly.",
      maxSteps: 5,
    });

    // Drain the text stream; the chunks themselves are not inspected
    // eslint-disable-next-line @typescript-eslint/no-unused-vars
    for await (const _ of stream.textStream) {
      // Intentionally empty
    }

    const outcome = await stream.result;

    // The final result must carry a non-empty transcript
    const transcript = outcome.messages;
    expect(transcript).toBeDefined();
    expect(Array.isArray(transcript)).toBe(true);
    expect(transcript!.length).toBeGreaterThan(0);
  });
});


================================================
FILE: packages/core/tests/integration/agent-streaming.spec.ts
================================================
import { test, expect } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import { v3TestConfig } from "./v3.config.js";
import type { AgentResult } from "../../lib/v3/types/public/agent.js";

test.describe("Stagehand agent streaming behavior", () => {
  // Model id shared by every agent built in this suite.
  const MODEL = "anthropic/claude-haiku-4-5-20251001";
  // Per-test timeout applied to the cases that call agent.execute().
  const EXECUTE_TIMEOUT_MS = 60000;
  // Keys every AgentResult is expected to expose.
  const AGENT_RESULT_KEYS = ["success", "message", "actions", "completed"];

  let v3: V3;

  /** Navigates the first page of the current context to example.com. */
  const openExamplePage = async (): Promise<void> => {
    const [firstPage] = v3.context.pages();
    await firstPage.goto("https://example.com");
  };

  test.beforeEach(async () => {
    // The experimental flag is required for streaming.
    v3 = new V3({ ...v3TestConfig, experimental: true });
    await v3.init();
  });

  test.afterEach(async () => {
    // Best-effort teardown: a rejected close() is ignored.
    await v3?.close?.().catch(() => {});
  });

  test.describe("agent({ stream: true })", () => {
    test("AgentStreamResult has textStream as async iterable", async () => {
      test.setTimeout(EXECUTE_TIMEOUT_MS);

      const streamingAgent = v3.agent({ stream: true, model: MODEL });

      // Start from a simple, known page.
      await openExamplePage();

      const streamed = await streamingAgent.execute({
        instruction: "What is the title of this page? Describe it briefly.",
        maxSteps: 3,
      });

      // Shape check: both streaming members are present.
      expect(streamed).toHaveProperty("textStream");
      expect(streamed).toHaveProperty("result");

      // textStream implements the async-iterator protocol.
      expect(typeof streamed.textStream[Symbol.asyncIterator]).toBe(
        "function",
      );

      // result is handed back as a promise.
      expect(streamed.result).toBeInstanceOf(Promise);
    });

    test("textStream yields chunks incrementally", async () => {
      test.setTimeout(EXECUTE_TIMEOUT_MS);

      const streamingAgent = v3.agent({ stream: true, model: MODEL });
      await openExamplePage();

      const streamed = await streamingAgent.execute({
        instruction: "Say hello briefly.",
        maxSteps: 3,
      });

      // Gather every chunk the stream produces.
      const received: string[] = [];
      for await (const piece of streamed.textStream) {
        received.push(piece);
      }

      // Only the presence of chunks is asserted; their text depends on the
      // LLM response.
      expect(Array.isArray(received)).toBe(true);
      expect(received.length).toBeGreaterThan(0);
    });

    test("result promise resolves to AgentResult after stream completes", async () => {
      test.setTimeout(EXECUTE_TIMEOUT_MS);

      const streamingAgent = v3.agent({ stream: true, model: MODEL });
      await openExamplePage();

      const streamed = await streamingAgent.execute({
        instruction: "What is this page about? Describe it briefly.",
        maxSteps: 5,
      });

      // Drain the stream first; chunks are discarded.
      // eslint-disable-next-line @typescript-eslint/no-unused-vars
      for await (const _chunk of streamed.textStream) {
        // intentionally empty
      }

      // Then await the final result.
      const finalResult: AgentResult = await streamed.result;

      // It exposes the AgentResult keys with the expected primitive types.
      for (const key of AGENT_RESULT_KEYS) {
        expect(finalResult).toHaveProperty(key);
      }
      expect(typeof finalResult.success).toBe("boolean");
      expect(typeof finalResult.message).toBe("string");
      expect(Array.isArray(finalResult.actions)).toBe(true);
    });
  });

  test.describe("agent({ stream: false }) or agent()", () => {
    test("execute returns AgentResult without streaming properties", async () => {
      test.setTimeout(EXECUTE_TIMEOUT_MS);

      const plainAgent = v3.agent({ model: MODEL });
      await openExamplePage();

      const outcome = await plainAgent.execute({
        instruction: "What is this page? Describe it briefly.",
        maxSteps: 3,
      });

      // A plain AgentResult: all result keys present...
      for (const key of AGENT_RESULT_KEYS) {
        expect(outcome).toHaveProperty(key);
      }

      // ...and no streaming member.
      expect(outcome).not.toHaveProperty("textStream");
    });
  });

  test.describe("CUA disables streaming", () => {
    test("throws StagehandInvalidArgumentError when cua: true and stream: true", () => {
      // Only the error message is matched here.
      const buildCuaStreamingAgent = () => {
        v3.agent({ cua: true, stream: true, model: MODEL });
      };

      expect(buildCuaStreamingAgent).toThrow(
        "streaming is not supported with CUA",
      );
    });

    test("allows cua: true without stream", () => {
      // Construction must succeed and yield something with execute().
      const cuaAgent = v3.agent({ cua: true, model: MODEL });

      expect(cuaAgent).toHaveProperty("execute");
    });

    test("allows stream: true without cua", () => {
      // Construction must succeed and yield something with execute().
      const streamingAgent = v3.agent({ stream: true, model: MODEL });

      expect(streamingAgent).toHaveProperty("execute");
    });
  });
});


================================================
FILE: packages/core/tests/integration/cdp-close-api-region.spec.ts
================================================
import { test, expect } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import { getV3TestConfig } from "./v3.config.js";
import { raceTimeout } from "./testUtils.js";

/**
 * Regression coverage for the production shutdown sequence:
 *
 *   1. v3.close() calls apiClient.end(), asking the hosted API to end the
 *      Browserbase session.
 *   2. The hosted API terminates the session, so the CDP WebSocket is closed
 *      from the server side.
 *   3. ctx.close() → conn.close() then awaits a "close" event on a socket
 *      that is already CLOSED, which hangs.
 *
 * Prerequisites:
 *   - BROWSERBASE_API_KEY and BROWSERBASE_PROJECT_ID are set
 *   - the Stagehand hosted API is reachable
 *   - a region other than us-west-2 (the added latency makes the race
 *     trigger reliably)
 */
test.describe("v3.close() with Stagehand API + non-default region", () => {
  test("close resolves instead of hanging", async () => {
    const {
      BROWSERBASE_API_KEY: apiKey,
      BROWSERBASE_PROJECT_ID: projectId,
    } = process.env;
    const credentialsMissing = !apiKey || !projectId;

    test.skip(
      credentialsMissing,
      "BROWSERBASE_API_KEY and BROWSERBASE_PROJECT_ID are required",
    );

    const config = getV3TestConfig({
      disableAPI: false,
      browserbaseSessionCreateParams: { region: "ap-southeast-1" },
    });
    const v3 = new V3(config);

    await v3.init();

    // Sanity check: the instance can navigate.
    const [firstPage] = v3.context.pages();
    await firstPage.goto(
      "data:text/html,<html><body>api-region-test</body></html>",
    );

    // Exercise the regular shutdown path. Per the sequence above, the hosted
    // API ends the session and the CDP socket is already closed by the time
    // conn.close() runs; without the fix this never settles.
    const closeOutcome = v3.close().then(() => "resolved" as const);
    const result = await raceTimeout(closeOutcome, 30_000);

    expect(result).toBe("resolved");
  });
});


================================================
FILE: packages/core/tests/integration/cdp-connection-close.spec.ts
================================================
import { test, expect } from "@playwright/test";
import WebSocket from "ws";
import { V3 } from "../../lib/v3/v3.js";
import { v3TestConfig } from "./v3.config.js";
import { raceTimeout } from "./testUtils.js";

test.describe("CdpConnection.close() after external WebSocket close", () => {
  type Conn = V3["context"]["conn"];

  let v3: V3;

  /**
   * Removes V3's own `_onCdpClosed` listener from the connection (when one is
   * set) so it doesn't trigger _immediateShutdown in the background while the
   * test isolates CdpConnection behaviour.
   */
  const unhookV3CloseHandler = (conn: Conn): void => {
    // eslint-disable-next-line @typescript-eslint/no-explicit-any
    const v3Handler = (v3 as any)._onCdpClosed;
    if (v3Handler) {
      conn.offTransportClosed(v3Handler);
    }
  };

  /**
   * Terminates the WebSocket held in the connection's `ws` field, simulating
   * the CDP socket being closed from the server side.
   */
  const terminateSocket = (conn: Conn): void => {
    // eslint-disable-next-line @typescript-eslint/no-explicit-any
    const socket: WebSocket = (conn as any).ws;
    socket.terminate();
  };

  test.beforeEach(async () => {
    v3 = new V3(v3TestConfig);
    await v3.init();
  });

  test.afterEach(async () => {
    // Teardown is best-effort and time-boxed so a hung close() cannot block
    // the rest of the suite.
    try {
      await raceTimeout(v3?.close?.(), 5_000);
    } catch {
      // ignore
    }
  });

  test("v3.close() resolves after the CDP WebSocket is already closed", async () => {
    // Sanity check: the instance can navigate.
    const [firstPage] = v3.context.pages();
    await firstPage.goto("data:text/html,<html><body>close-test</body></html>");

    const conn = v3.context.conn;
    unhookV3CloseHandler(conn);

    // Subscribe before terminating so the transport-close notification is
    // observed once it has been processed.
    const transportClosed = new Promise<void>((resolve) => {
      conn.onTransportClosed(() => resolve());
    });

    terminateSocket(conn);
    await transportClosed;

    // v3.close() → ctx.close() → conn.close() now runs against a socket that
    // is already CLOSED; without the fix this promise never settles.
    const closeOutcome = v3.close().then(() => "resolved" as const);
    const result = await raceTimeout(closeOutcome, 5_000);

    expect(result).toBe("resolved");
  });

  test("inflight CDP calls reject when the WebSocket is terminated", async () => {
    const [firstPage] = v3.context.pages();
    await firstPage.goto(
      "data:text/html,<html><body>inflight-test</body></html>",
    );

    const conn = v3.context.conn;
    unhookV3CloseHandler(conn);

    // Issue a call that stays pending: the evaluated promise only settles
    // after 60 seconds.
    const inflight = conn.send("Runtime.evaluate", {
      expression: "new Promise(r => setTimeout(() => r('done'), 60000))",
      awaitPromise: true,
    });

    // Kill the socket while that call is still outstanding.
    terminateSocket(conn);

    // The outstanding call has to reject rather than hang.
    const settled = inflight
      .then(() => "resolved" as const)
      .catch(() => "rejected" as const);
    const result = await raceTimeout(settled, 5_000);

    expect(result).toBe("rejected");
  });
});


================================================
FILE: packages/core/tests/integration/cdp-session-detached.spec.ts
================================================
import { test, expect } from "@playwright/test";
import { chromium as playwrightChromium } from "playwright";
import { V3 } from "../../lib/v3/v3.js";
import { v3TestConfig } from "./v3.config.js";

test.describe("CDP session detach handling", () => {
  let v3: V3;

  test.beforeEach(async () => {
    v3 = new V3(v3TestConfig);
    await v3.init();
  });

  test.afterEach(async () => {
    // Best-effort teardown: a rejected close() is ignored.
    await v3?.close?.().catch(() => {});
  });

  test("rejects inflight CDP calls when a target is closed", async () => {
    // Record every unhandled rejection raised while the test runs; the test
    // asserts that none occurred.
    const strayRejections: unknown[] = [];
    const recordStrayRejection = (reason: unknown): void => {
      strayRejections.push(reason);
    };
    process.on("unhandledRejection", recordStrayRejection);

    type ExternalBrowser = Awaited<
      ReturnType<typeof playwrightChromium.connectOverCDP>
    >;
    let externalBrowser: ExternalBrowser | null = null;

    try {
      // Attach a second client (Playwright) to the same browser so the page
      // can be closed from outside Stagehand.
      externalBrowser = await playwrightChromium.connectOverCDP(
        v3.connectURL(),
      );
      const externalPage = externalBrowser.contexts()[0].pages()[0];

      const stagehandPage = v3.context.pages()[0];
      await stagehandPage.goto("data:text/html,<html><body>cdp</body></html>");

      // Start a CDP call whose promise only settles after 5 seconds.
      const inflight = stagehandPage.sendCDP("Runtime.evaluate", {
        expression: "new Promise(r => setTimeout(() => r('done'), 5000))",
        awaitPromise: true,
        returnByValue: true,
      });

      // Close the page through the external client while the call is pending.
      await externalPage.close();

      await expect(inflight).rejects.toThrow(
        /No Page found for target closed before CDP response/,
      );

      // Short pause before checking that no unhandled rejection was recorded.
      await new Promise((done) => setTimeout(done, 50));
      expect(strayRejections).toHaveLength(0);
    } finally {
      process.off("unhandledRejection", recordStrayRejection);
      await externalBrowser?.close().catch(() => {});
    }
  });
});


================================================
FILE: packages/core/tests/integration/click-count.spec.ts
================================================
import { test, expect } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import { v3TestConfig } from "./v3.config.js";

// Double-click checks are driven by DOM events so they stay deterministic.
// Counting by time deltas (Date.now() between mousedowns) is flaky at ms
// boundaries and can miss valid double-clicks when synthetic input lands in
// the same millisecond.
//
// The fixture exposes four read-only inputs: running totals of `click` and
// `dblclick` events on #target, plus the `event.detail` of the latest of each.
const doubleClickFixtureHtml = `<!DOCTYPE html>
<html>
  <body>
    <div id="target" style="width: 240px; height: 120px; border: 1px solid #000;">target</div>
    <input id="clickCount" value="0" readonly />
    <input id="dblClickCount" value="0" readonly />
    <input id="lastClickDetail" value="0" readonly />
    <input id="lastDblClickDetail" value="0" readonly />
    <script>
      const target = document.getElementById("target");
      const clickCount = document.getElementById("clickCount");
      const dblClickCount = document.getElementById("dblClickCount");
      const lastClickDetail = document.getElementById("lastClickDetail");
      const lastDblClickDetail = document.getElementById("lastDblClickDetail");
      let clicks = 0;
      let dblClicks = 0;

      target.addEventListener("click", (event) => {
        clicks += 1;
        clickCount.value = String(clicks);
        lastClickDetail.value = String(event.detail);
      });

      target.addEventListener("dblclick", (event) => {
        dblClicks += 1;
        dblClickCount.value = String(dblClicks);
        lastDblClickDetail.value = String(event.detail);
      });
    </script>
  </body>
</html>`;

// The same markup, percent-encoded into a self-contained data: URL.
const doubleClickFixtureUrl =
  "data:text/html," + encodeURIComponent(doubleClickFixtureHtml);

test.describe("Locator and Page click methods", () => {
  // Hosted page with a #textarea click target and a #count input.
  const CLICK_TEST_SITE =
    "https://browserbase.github.io/stagehand-eval-sites/sites/click-test/";

  let v3: V3;

  /** Loads `url` in the first page and waits for DOMContentLoaded. */
  const openInFirstPage = async (url: string) => {
    const page = v3.context.pages()[0];
    await page.goto(url);
    await page.waitForLoadState("domcontentloaded");
    return page;
  };

  type TestPage = Awaited<ReturnType<typeof openInFirstPage>>;
  type ClickAction = (page: TestPage) => Promise<unknown>;

  /**
   * Scenario against the hosted click-test site: the counter must read "0",
   * then `performClicks` runs, then the counter must read `expectedCount`.
   */
  const expectCounterAfter = async (
    performClicks: ClickAction,
    expectedCount: string,
  ): Promise<void> => {
    const page = await openInFirstPage(CLICK_TEST_SITE);

    const counter = page.locator("#count");
    const before = await counter.inputValue();
    expect(before).toBe("0");

    await performClicks(page);

    const after = await counter.inputValue();
    expect(after).toBe(expectedCount);
  };

  /**
   * Scenario against the local double-click fixture: both counters must start
   * at "0"; after `performClicks` the fixture must report two `click` events,
   * one `dblclick` event, and `detail === 2` on the latest of each.
   */
  const expectDoubleClickAfter = async (
    performClicks: ClickAction,
  ): Promise<void> => {
    const page = await openInFirstPage(doubleClickFixtureUrl);

    const clickTotal = page.locator("#clickCount");
    const dblClickTotal = page.locator("#dblClickCount");
    const lastClickDetail = page.locator("#lastClickDetail");
    const lastDblClickDetail = page.locator("#lastDblClickDetail");

    const clicksBefore = await clickTotal.inputValue();
    const dblClicksBefore = await dblClickTotal.inputValue();
    expect(clicksBefore).toBe("0");
    expect(dblClicksBefore).toBe("0");

    await performClicks(page);

    expect(await clickTotal.inputValue()).toBe("2");
    expect(await dblClickTotal.inputValue()).toBe("1");
    // `dblclick` is the browser-level contract for a double-click, and
    // `detail=2` shows the sequence was recognised as a true multi-click.
    expect(await lastClickDetail.inputValue()).toBe("2");
    expect(await lastDblClickDetail.inputValue()).toBe("2");
  };

  test.beforeEach(async () => {
    v3 = new V3(v3TestConfig);
    await v3.init();
  });

  test.afterEach(async () => {
    // Best-effort teardown: a rejected close() is ignored.
    await v3?.close?.().catch(() => {});
  });

  test("locator.click() performs single click by default", async () => {
    // One click on the textarea bumps the counter by one.
    await expectCounterAfter(async (page) => {
      await page.locator("#textarea").click();
    }, "1");
  });

  test("locator.click() with clickCount: 2 performs double-click", async () => {
    await expectDoubleClickAfter(async (page) => {
      await page.locator("#target").click({ clickCount: 2 });
    });
  });

  test("locator.click() with clickCount: 3 performs triple-click", async () => {
    // A triple-click on the textarea bumps the counter by three.
    await expectCounterAfter(async (page) => {
      await page.locator("#textarea").click({ clickCount: 3 });
    }, "3");
  });

  test("page.click() performs single click with coordinates", async () => {
    await expectCounterAfter(async (page) => {
      // Aim at the textarea's centroid and click by coordinates.
      const { x, y } = await page.locator("#textarea").centroid();
      await page.click(x, y);
    }, "1");
  });

  test("page.click() with clickCount: 2 performs double-click", async () => {
    await expectDoubleClickAfter(async (page) => {
      const { x, y } = await page.locator("#target").centroid();
      await page.click(x, y, { clickCount: 2 });
    });
  });

  test("page.click() with clickCount: 3 performs triple-click", async () => {
    await expectCounterAfter(async (page) => {
      // Aim at the textarea's centroid and triple-click by coordinates.
      const { x, y } = await page.locator("#textarea").centroid();
      await page.click(x, y, { clickCount: 3 });
    }, "3");
  });
});


================================================
FILE: packages/core/tests/integration/connect-to-existing-browser.spec.ts
================================================
import { test, expect } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import { v3DynamicTestConfig } from "./v3.dynamic.config.js";
import { closeV3 } from "./testUtils.js";

// Number of extra tabs the Browserbase session test opens, and the page count
// it expects both before and after a second instance attaches to the session.
const PAGE_TARGET_COUNT = 5;

test.describe("connect to existing Browserbase session", () => {
  /** Lower-cased STAGEHAND_BROWSER_TARGET; "local" when the variable is unset. */
  const readBrowserTarget = (): string =>
    (process.env.STAGEHAND_BROWSER_TARGET ?? "local").toLowerCase();

  /**
   * Builds a second V3 configured to attach to `cdpUrl`. The instance is
   * returned un-initialised so the caller can register it for cleanup before
   * calling init().
   */
  const buildAttachedInstance = (cdpUrl: ReturnType<V3["connectURL"]>): V3 =>
    new V3({
      env: "LOCAL",
      verbose: 0,
      disablePino: true,
      disableAPI: true,
      logger: v3DynamicTestConfig.logger,
      localBrowserLaunchOptions: { cdpUrl },
    });

  test("new Stagehand instance reuses an existing Browserbase session", async () => {
    test.skip(
      readBrowserTarget() !== "browserbase",
      "Requires STAGEHAND_BROWSER_TARGET=browserbase",
    );
    test.skip(
      !process.env.BROWSERBASE_API_KEY || !process.env.BROWSERBASE_PROJECT_ID,
      "BROWSERBASE credentials are required",
    );

    const initialStagehand = new V3({
      ...v3DynamicTestConfig,
      disableAPI: true,
    });
    await initialStagehand.init();

    let resumedStagehand: V3 | null = null;

    try {
      const originalContext = initialStagehand.context;
      const startingPage = originalContext.pages()[0];
      expect(startingPage).toBeDefined();

      // Open the extra tabs, then drop the starting page so exactly
      // PAGE_TARGET_COUNT pages remain.
      for (let tab = 0; tab < PAGE_TARGET_COUNT; tab++) {
        await originalContext.newPage(`https://example.com/?tab=${tab}`);
      }
      await startingPage?.close();

      await expect
        .poll(() => originalContext.pages().length, { timeout: 15_000 })
        .toBe(PAGE_TARGET_COUNT);

      const sessionUrl = initialStagehand.connectURL();
      expect(sessionUrl).toBeTruthy();

      // Register the instance for cleanup before init() so a failing init
      // still gets closed in `finally`.
      const resumed = buildAttachedInstance(sessionUrl);
      resumedStagehand = resumed;
      await resumed.init();

      // The attached instance must see the same number of pages.
      await expect
        .poll(() => resumed.context.pages().length, { timeout: 15_000 })
        .toBe(PAGE_TARGET_COUNT);

      const resumedPagesCount = resumed.context.pages().length;
      expect(resumedPagesCount).toBe(PAGE_TARGET_COUNT);
    } finally {
      await closeV3(resumedStagehand);
      await closeV3(initialStagehand);
    }
  });

  test("new Stagehand instance initializes when existing browser has zero pages", async () => {
    test.skip(
      readBrowserTarget() === "browserbase",
      "Requires STAGEHAND_BROWSER_TARGET=local",
    );

    const initialStagehand = new V3({
      ...v3DynamicTestConfig,
      disableAPI: true,
      env: "LOCAL",
    });
    await initialStagehand.init();

    let resumedStagehand: V3 | null = null;

    try {
      const originalContext = initialStagehand.context;

      // Close every page so the browser is left with none.
      for (const openPage of originalContext.pages()) {
        await openPage.close();
      }

      await expect
        .poll(() => originalContext.pages().length, { timeout: 15_000 })
        .toBe(0);

      // Register the instance for cleanup before init() so a failing init
      // still gets closed in `finally`.
      const resumed = buildAttachedInstance(initialStagehand.connectURL());
      resumedStagehand = resumed;
      await resumed.init();

      // After init the attached instance must report at least one page.
      await expect
        .poll(() => resumed.context.pages().length, { timeout: 15_000 })
        .toBeGreaterThan(0);
    } finally {
      await closeV3(resumedStagehand);
      await closeV3(initialStagehand);
    }
  });
});


================================================
FILE: packages/core/tests/integration/context-addInitScript.spec.ts
================================================
import { test, expect } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import { v3TestConfig } from "./v3.config.js";
import { V3Context } from "../../lib/v3/understudy/context.js";
import type { Page as V3Page } from "../../lib/v3/understudy/page.js";

// Default time budget, in milliseconds, that waitForPopupPage polls for a new
// page before throwing.
const POPUP_TIMEOUT_MS = 20_000;

/**
 * Wraps an HTML snippet in a `data:text/html,` URL.
 *
 * @param html - markup to embed; it is percent-encoded with encodeURIComponent.
 * @returns the resulting data: URL.
 */
function toDataUrl(html: string): string {
  const encodedMarkup = encodeURIComponent(html);
  return "data:text/html," + encodedMarkup;
}

/**
 * Polls the context until a page appears whose target id is not in
 * `knownTargetIds`.
 *
 * On every iteration the current page list is checked first; if nothing new
 * is listed, the context's active page is awaited (called with 500) and
 * accepted when its target id is unknown. Errors from that lookup are ignored
 * and polling continues after a 50 ms pause.
 *
 * @param ctx - context whose pages are inspected.
 * @param knownTargetIds - target ids that existed before the popup was triggered.
 * @param timeoutMs - overall polling budget in milliseconds.
 * @returns the first page found that is not in `knownTargetIds`.
 * @throws Error("Popup page was not created") once the budget is exhausted.
 */
async function waitForPopupPage(
  ctx: V3Context,
  knownTargetIds: Set<string>,
  timeoutMs = POPUP_TIMEOUT_MS,
): Promise<V3Page> {
  const isUnknown = (candidate: V3Page): boolean =>
    !knownTargetIds.has(candidate.targetId());

  const giveUpAt = Date.now() + timeoutMs;

  while (Date.now() < giveUpAt) {
    // First choice: a page already listed on the context.
    for (const candidate of ctx.pages()) {
      if (isUnknown(candidate)) {
        return candidate;
      }
    }

    // Fallback: whatever the context reports as the active page.
    try {
      const activePage = await ctx.awaitActivePage(500);
      if (isUnknown(activePage)) {
        return activePage;
      }
    } catch {
      // keep polling
    }

    await new Promise((wake) => setTimeout(wake, 50));
  }

  throw new Error("Popup page was not created");
}

test.describe("context.addInitScript", () => {
  let v3: V3;
  let ctx: V3Context;

  /**
   * Init script shared by the payload tests: stores the JSON-encoded argument
   * in `data-init-payload` on the root element, waiting for DOMContentLoaded
   * when the document is still loading.
   * NOTE(review): presumably this function is serialised and run inside the
   * page, so it must stay self-contained — confirm against addInitScript.
   */
  const stampPayloadOnRoot = (arg: unknown): void => {
    function setPayload(): void {
      const root = document.documentElement;
      if (!root) return;
      root.dataset.initPayload = JSON.stringify(arg);
    }
    if (document.readyState === "loading") {
      document.addEventListener("DOMContentLoaded", setPayload, {
        once: true,
      });
    } else {
      setPayload();
    }
  };

  /** Reads back and parses the payload stored in `data-init-payload`. */
  const readStampedPayload = (page: V3Page) =>
    page.evaluate(() => {
      const raw = document.documentElement.dataset.initPayload;
      return raw ? JSON.parse(raw) : undefined;
    });

  /** Reads `window.__injected` from the page. */
  const readInjectedMarker = (page: V3Page) =>
    page.evaluate(() => {
      return (window as unknown as { __injected?: number }).__injected;
    });

  /** Opener markup: a single `target="_blank"` anchor (#open) pointing at `href`. */
  const openerHtmlFor = (href: string): string =>
    `<!DOCTYPE html><html><body><a id="open" target="_blank" href="${href}">open</a></body></html>`;

  /**
   * Clicks `triggerSelector` on the opener and returns the page that appears
   * as a result, once it has reached the "load" state.
   */
  const clickAndAwaitPopup = async (
    opener: V3Page,
    triggerSelector: string,
  ): Promise<V3Page> => {
    // Snapshot the existing targets so the new one can be told apart.
    const knownTargetIds = new Set(ctx.pages().map((p) => p.targetId()));
    await opener.locator(triggerSelector).click();

    const popup = await waitForPopupPage(ctx, knownTargetIds);
    await popup.waitForLoadState("load");
    return popup;
  };

  /** Loads an opener page linking to `href`, clicks the link, returns the popup. */
  const openPopupViaLink = async (href: string): Promise<V3Page> => {
    const opener = await ctx.awaitActivePage();
    await opener.goto(toDataUrl(openerHtmlFor(href)), { waitUntil: "load" });
    return clickAndAwaitPopup(opener, "#open");
  };

  test.beforeEach(async () => {
    v3 = new V3(v3TestConfig);
    await v3.init();
    ctx = v3.context;
  });

  test.afterEach(async () => {
    // Best-effort teardown: a rejected close() is ignored.
    await v3?.close?.().catch(() => {});
  });

  test("runs before inline document scripts on navigation", async () => {
    const page = await ctx.awaitActivePage();

    await ctx.addInitScript(() => {
      const win = window as unknown as { __fromContextInit?: string };
      win.__fromContextInit = "injected-value";
    });

    // The inline script copies the injected value (or 'missing') into a data
    // attribute that is read back below.
    const html = `<!DOCTYPE html>
      <html>
        <body>
          <script>
            var value = (window && window.__fromContextInit) || 'missing';
            document.body.dataset.initWitness = value;
          </script>
        </body>
      </html>`;

    await page.goto(toDataUrl(html), { waitUntil: "load" });

    const witness = await page.evaluate(() => {
      return document.body.dataset.initWitness;
    });
    expect(witness).toBe("injected-value");
  });

  test("re-applies the script on every navigation for the same page", async () => {
    const page = await ctx.awaitActivePage();

    // Counts visits in window.name and mirrors the running total onto the
    // root element as data-visit-count.
    const visitCounterScript = `
      (function () {
        function markVisit() {
          var root = document.documentElement;
          if (!root) return;
          var current = Number(window.name || "0");
          var next = current + 1;
          window.name = String(next);
          root.dataset.visitCount = String(next);
        }
        if (document.readyState === "loading") {
          document.addEventListener("DOMContentLoaded", markVisit, {
            once: true,
          });
        } else {
          markVisit();
        }
      })();
    `;
    await ctx.addInitScript(visitCounterScript);

    const navigations = [
      ["first", 1],
      ["second", 2],
    ] as const;

    for (const [bodyText, expectedVisits] of navigations) {
      await page.goto(toDataUrl(`<html><body>${bodyText}</body></html>`), {
        waitUntil: "load",
      });
      const visits = await page.evaluate(() => {
        return Number(document.documentElement.dataset.visitCount ?? "0");
      });
      expect(visits).toBe(expectedVisits);
    }
  });

  test("applies script (with args) to newly created pages", async () => {
    const payload = { greeting: "hi", nested: { count: 2 } };
    await ctx.addInitScript(stampPayloadOnRoot, payload);

    const freshPage = await ctx.newPage();
    await freshPage.goto(toDataUrl("<html><body>child</body></html>"), {
      waitUntil: "load",
    });

    expect(await readStampedPayload(freshPage)).toEqual(payload);
  });

  test("applies script to newPage(url) on initial document", async () => {
    const payload = { marker: "newPageUrl" };
    await ctx.addInitScript(stampPayloadOnRoot, payload);

    const freshPage = await ctx.newPage(
      toDataUrl("<html><body>new page</body></html>"),
    );
    await freshPage.waitForLoadState("load");

    expect(await readStampedPayload(freshPage)).toEqual(payload);
  });

  test("applies script to pages opened via link clicks", async () => {
    const payload = { marker: "linkClick" };
    await ctx.addInitScript(stampPayloadOnRoot, payload);

    const popup = await openPopupViaLink("https://example.com/");
    expect(await readStampedPayload(popup)).toEqual(payload);

    // The payload must be present again after a reload of the popup.
    await popup.reload({ waitUntil: "load" });
    expect(await readStampedPayload(popup)).toEqual(payload);
  });

  test("applies script to in-process popup", async () => {
    await ctx.addInitScript(() => {
      (window as unknown as { __injected?: number }).__injected = 123;
    });

    const popup = await openPopupViaLink("about:blank");

    expect(await readInjectedMarker(popup)).toBe(123);
  });

  test("applies script to cross-process popup and survives reload", async () => {
    await ctx.addInitScript(() => {
      (window as unknown as { __injected?: number }).__injected = 123;
    });

    const popup = await openPopupViaLink("https://example.com/");
    expect(await readInjectedMarker(popup)).toBe(123);

    await popup.reload({ waitUntil: "load" });
    expect(await readInjectedMarker(popup)).toBe(123);
  });

  test("applies script to cross-process popup opened via window.open and survives reload", async () => {
    await ctx.addInitScript(() => {
      (window as unknown as { __injected?: number }).__injected = 789;
    });

    const opener = await ctx.awaitActivePage();
    await opener.goto("about:blank", { waitUntil: "load" });

    // Add a button to the blank opener that calls window.open when clicked.
    await opener.mainFrame().evaluate(() => {
      const trigger = document.createElement("button");
      trigger.id = "open-via-window-open";
      trigger.textContent = "open popup";
      trigger.addEventListener("click", () => {
        window.open("https://example.com/", "_blank");
      });
      document.body.appendChild(trigger);
    });

    const popup = await clickAndAwaitPopup(opener, "#open-via-window-open");
    expect(await readInjectedMarker(popup)).toBe(789);

    await popup.reload({ waitUntil: "load" });
    expect(await readInjectedMarker(popup)).toBe(789);
  });

  test("context.addInitScript installs a function callable from page.evaluate", async () => {
    const page = await ctx.awaitActivePage();

    // Registered before any navigation takes place.
    await ctx.addInitScript(() => {
      // eslint-disable-next-line @typescript-eslint/ban-ts-comment
      // @ts-expect-error
      window.sayHelloFromStagehand = () => "hello from stagehand";
    });

    await page.goto("https://example.com", { waitUntil: "domcontentloaded" });

    const greeting = await page.evaluate(() => {
      // eslint-disable-next-line @typescript-eslint/ban-ts-comment
      // @ts-expect-error
      return window.sayHelloFromStagehand();
    });

    expect(greeting).toBe("hello from stagehand");
  });
});


================================================
FILE: packages/core/tests/integration/context-extra-http-headers.spec.ts
================================================
import { test, expect } from "@playwright/test";
import type { Protocol } from "devtools-protocol";
import { V3 } from "../../lib/v3/v3.js";
import { v3TestConfig } from "./v3.config.js";
import { closeV3 } from "./testUtils.js";

// Page the header test navigates to; also used to recognise its document request.
const TEST_URL =
  "https://browserbase.github.io/stagehand-eval-sites/sites/example/";

// Checks that headers registered on the context show up on the document
// request, as reported by the CDP `Network.requestWillBeSent` event.
test.describe("context.setExtraHTTPHeaders", () => {
  type CdpListener = (params: unknown) => void;
  // Minimal view of the page's CDP session used by this test.
  type SessionHandle = {
    send: (method: string, params?: unknown) => Promise<unknown>;
    on: (event: string, handler: CdpListener) => void;
    off: (event: string, handler: CdpListener) => void;
  };

  const REQUEST_EVENT = "Network.requestWillBeSent";
  let v3: V3;

  test.beforeEach(async () => {
    v3 = new V3(v3TestConfig);
    await v3.init();
  });

  test.afterEach(async () => {
    await closeV3(v3);
  });

  test("applies headers to navigation requests", async () => {
    const ctx = v3.context;
    const page = await ctx.awaitActivePage();

    await ctx.setExtraHTTPHeaders({ "x-stagehand-test": "yes" });

    // Reach into the page for its `mainSession` so raw CDP events can be observed.
    const internal = page as unknown as { mainSession: SessionHandle };

    await internal.mainSession.send("Network.enable");

    // Settles with the first Document request for TEST_URL, or rejects after 5s.
    const documentRequest =
      new Promise<Protocol.Network.RequestWillBeSentEvent>(
        (resolve, reject) => {
          function onRequest(
            evt: Protocol.Network.RequestWillBeSentEvent,
          ): void {
            const isTargetDocument =
              evt.type === "Document" &&
              String(evt.request?.url ?? "").startsWith(TEST_URL);
            if (!isTargetDocument) return;

            clearTimeout(timer);
            internal.mainSession.off(REQUEST_EVENT, onRequest);
            resolve(evt);
          }

          const timer = setTimeout(() => {
            internal.mainSession.off(REQUEST_EVENT, onRequest);
            reject(new Error("Timed out waiting for request"));
          }, 5000);

          internal.mainSession.on(REQUEST_EVENT, onRequest);
        },
      );

    await page.goto(TEST_URL, { waitUntil: "domcontentloaded" });

    const { request } = await documentRequest;
    // Header names are lower-cased so the lookup does not depend on casing.
    const sentHeaders = new Map(
      Object.entries(request.headers ?? {}).map(
        ([key, value]): [string, string] => [key.toLowerCase(), String(value)],
      ),
    );

    expect(sentHeaders.get("x-stagehand-test")).toBe("yes");
  });
});


================================================
FILE: packages/core/tests/integration/cookies.spec.ts
================================================
import { test, expect } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import { v3DynamicTestConfig } from "./v3.dynamic.config.js";
import { closeV3 } from "./testUtils.js";

// Page every test loads, and the URL most test cookies are scoped to.
const BASE_URL =
  "https://browserbase.github.io/stagehand-eval-sites/sites/example/";

// Covers the context cookie API: addCookies(), cookies() and clearCookies().
test.describe("cookies", () => {
  let v3: V3;

  // True when `jar` holds a cookie whose name is exactly `cookieName`.
  const hasCookieNamed = (
    jar: ReadonlyArray<{ name: string }>,
    cookieName: string,
  ): boolean => jar.some((entry) => entry.name === cookieName);

  // Navigates the first page of `ctx` to BASE_URL and returns that page.
  const openBasePage = async (ctx: V3["context"]) => {
    const firstPage = ctx.pages()[0]!;
    await firstPage.goto(BASE_URL);
    return firstPage;
  };

  test.beforeEach(async () => {
    v3 = new V3(v3DynamicTestConfig);
    await v3.init();
  });

  test.afterEach(async () => {
    await closeV3(v3);
  });

  test("addCookies sets a cookie visible to the page", async () => {
    const ctx = v3.context;
    const [firstPage] = ctx.pages();
    expect(firstPage).toBeDefined();

    await firstPage!.goto(BASE_URL);

    const cookieName = `stagehand_cookie_${Date.now()}`;
    await ctx.addCookies([
      { name: cookieName, value: "1", url: BASE_URL, httpOnly: false },
    ]);

    await firstPage!.reload();

    const documentCookies = await firstPage!.evaluate(() => document.cookie);
    expect(documentCookies).toContain(`${cookieName}=1`);

    const jar = await ctx.cookies(BASE_URL);
    const stored = jar.some(
      (entry) => entry.name === cookieName && entry.value === "1",
    );
    expect(stored).toBe(true);
  });

  test("cookies() with no URL returns all cookies", async () => {
    const ctx = v3.context;
    await openBasePage(ctx);

    const cookieName = `stagehand_all_${Date.now()}`;
    await ctx.addCookies([
      { name: cookieName, value: "all", url: BASE_URL, httpOnly: false },
    ]);

    const everyCookie = await ctx.cookies();
    expect(hasCookieNamed(everyCookie, cookieName)).toBe(true);
  });

  test("clearCookies() removes all cookies", async () => {
    const ctx = v3.context;
    await openBasePage(ctx);

    await ctx.addCookies([
      { name: "to_clear_a", value: "1", url: BASE_URL, httpOnly: false },
      { name: "to_clear_b", value: "2", url: BASE_URL, httpOnly: false },
    ]);

    // Both cookies must exist before the clear, otherwise the test proves nothing.
    const beforeClear = await ctx.cookies(BASE_URL);
    expect(hasCookieNamed(beforeClear, "to_clear_a")).toBe(true);
    expect(hasCookieNamed(beforeClear, "to_clear_b")).toBe(true);

    await ctx.clearCookies();

    const afterClear = await ctx.cookies(BASE_URL);
    expect(hasCookieNamed(afterClear, "to_clear_a")).toBe(false);
    expect(hasCookieNamed(afterClear, "to_clear_b")).toBe(false);
  });

  test("clearCookies() with name filter removes only matching cookies", async () => {
    const ctx = v3.context;
    await openBasePage(ctx);

    await ctx.addCookies([
      { name: "keep_me", value: "1", url: BASE_URL, httpOnly: false },
      { name: "remove_me", value: "2", url: BASE_URL, httpOnly: false },
    ]);

    await ctx.clearCookies({ name: "remove_me" });

    const remaining = await ctx.cookies(BASE_URL);
    expect(hasCookieNamed(remaining, "keep_me")).toBe(true);
    expect(hasCookieNamed(remaining, "remove_me")).toBe(false);
  });

  test("clearCookies() with regex filter removes matching cookies", async () => {
    const ctx = v3.context;
    await openBasePage(ctx);

    await ctx.addCookies([
      { name: "_ga_ABC", value: "1", url: BASE_URL, httpOnly: false },
      { name: "_ga_DEF", value: "2", url: BASE_URL, httpOnly: false },
      { name: "session", value: "3", url: BASE_URL, httpOnly: false },
    ]);

    await ctx.clearCookies({ name: /^_ga/ });

    const remaining = await ctx.cookies(BASE_URL);
    expect(hasCookieNamed(remaining, "session")).toBe(true);
    expect(hasCookieNamed(remaining, "_ga_ABC")).toBe(false);
    expect(hasCookieNamed(remaining, "_ga_DEF")).toBe(false);
  });

  test("cookies are visible from a second page on the same domain", async () => {
    const ctx = v3.context;
    await openBasePage(ctx);

    const cookieName = `stagehand_multi_${Date.now()}`;
    await ctx.addCookies([
      { name: cookieName, value: "shared", url: BASE_URL, httpOnly: false },
    ]);

    const secondPage = await ctx.newPage();
    await secondPage.goto(BASE_URL);

    const documentCookies = await secondPage.evaluate(() => document.cookie);
    expect(documentCookies).toContain(`${cookieName}=shared`);
  });

  test("cookies persist across navigation to a different path", async () => {
    const ctx = v3.context;
    const page = await openBasePage(ctx);

    const cookieName = `stagehand_nav_${Date.now()}`;
    await ctx.addCookies([
      {
        name: cookieName,
        value: "persisted",
        domain: "browserbase.github.io",
        path: "/",
        httpOnly: false,
      },
    ]);

    // Same domain, different path than BASE_URL.
    await page.goto("https://browserbase.github.io/stagehand-eval-sites/");

    const documentCookies = await page.evaluate(() => document.cookie);
    expect(documentCookies).toContain(`${cookieName}=persisted`);
  });

  test("httpOnly cookie is hidden from document.cookie but returned by cookies()", async () => {
    const ctx = v3.context;
    const page = await openBasePage(ctx);

    const cookieName = `stagehand_http_${Date.now()}`;
    await ctx.addCookies([
      { name: cookieName, value: "secret", url: BASE_URL, httpOnly: true },
    ]);

    await page.reload();

    // Page script must not see the httpOnly cookie...
    const documentCookies = await page.evaluate(() => document.cookie);
    expect(documentCookies).not.toContain(cookieName);

    // ...while the context API still reports it.
    const jar = await ctx.cookies(BASE_URL);
    const stored = jar.find((entry) => entry.name === cookieName);
    expect(stored).toBeDefined();
    expect(stored!.value).toBe("secret");
    expect(stored!.httpOnly).toBe(true);
  });

  test("cookies() returns correct shape for a fully-specified cookie", async () => {
    const ctx = v3.context;
    await openBasePage(ctx);

    const cookieName = `stagehand_shape_${Date.now()}`;
    // Expiry in seconds since the epoch, one hour ahead.
    const oneHourFromNow = Math.floor(Date.now() / 1000) + 3600;
    await ctx.addCookies([
      {
        name: cookieName,
        value: "full",
        domain: "browserbase.github.io",
        path: "/",
        expires: oneHourFromNow,
        httpOnly: true,
        secure: true,
        sameSite: "Lax",
      },
    ]);

    const jar = await ctx.cookies(BASE_URL);
    const stored = jar.find((entry) => entry.name === cookieName);
    expect(stored).toBeDefined();

    // Field-by-field check of the returned cookie.
    expect(stored!.value).toBe("full");
    expect(stored!.domain).toMatch(/browserbase\.github\.io/);
    expect(stored!.path).toBe("/");
    expect(stored!.expires).toBeGreaterThan(0);
    expect(stored!.httpOnly).toBe(true);
    expect(stored!.secure).toBe(true);
    expect(stored!.sameSite).toBe("Lax");

    // The returned object must expose exactly these keys and nothing more.
    const allowedKeys = [
      "name",
      "value",
      "domain",
      "path",
      "expires",
      "httpOnly",
      "secure",
      "sameSite",
    ];
    expect(Object.keys(stored!).sort()).toEqual(allowedKeys.sort());
  });
});


================================================
FILE: packages/core/tests/integration/default-page-tracking.spec.ts
================================================
import { test, expect } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import { v3DynamicTestConfig } from "./v3.dynamic.config.js";
import { closeV3 } from "./testUtils.js";

test.describe.configure({ mode: "parallel" });

// Verifies which page the context reports as active as pages are opened and closed.
test.describe("V3 default page tracking", () => {
  const FIVE_TAB_URL =
    "https://browserbase.github.io/stagehand-eval-sites/sites/five-tab/";
  const PAGE2_URL =
    "https://browserbase.github.io/stagehand-eval-sites/sites/five-tab/page2.html";
  const PAGE3_URL =
    "https://browserbase.github.io/stagehand-eval-sites/sites/five-tab/page3.html";
  const BUTTON_XPATH = "xpath=/html/body/button";

  let v3: V3;

  test.beforeEach(async () => {
    v3 = new V3(v3DynamicTestConfig);
    await v3.init();
  });

  test.afterEach(async () => {
    await closeV3(v3);
  });

  test("activePage points to initial page", async () => {
    const ctx = v3.context;

    // There must be at least one top-level page.
    expect(ctx.pages().length).toBeGreaterThanOrEqual(1);

    const active = ctx.activePage();
    expect(active).toBeTruthy();
    // The active page must report a non-empty main frame id.
    expect(active!.mainFrameId().length).toBeGreaterThan(0);
  });

  // NOTE(review): the title also mentions reverting on close, but this test
  // performs no close — confirm whether that check is missing.
  test("activePage switches to most recent top-level page and reverts on close", async () => {
    const ctx = v3.context;
    const created = await ctx.newPage("https://example.com/");

    const active = await ctx.awaitActivePage();
    expect(active.url()).toContain(created.url());
  });

  test("popup default-page flow via five-tab site", async () => {
    const ctx = v3.context;

    // Step 1: load the five-tab site in the current active page.
    const root = await ctx.awaitActivePage();
    await root.goto(FIVE_TAB_URL, { waitUntil: "load", timeoutMs: 15000 });

    // Step 2: the button click opens page2.html, which should become active.
    await root.locator(BUTTON_XPATH).click();
    const page2 = await ctx.awaitActivePage();
    expect(page2.url()).toBe(PAGE2_URL);

    // Step 3: clicking page2's button opens page3.html as the new active page.
    await page2.locator(BUTTON_XPATH).click();
    const page3 = await ctx.awaitActivePage();
    expect(page3.url()).toBe(PAGE3_URL);

    // Step 4: closing page3 should make page2 the active page again.
    await page3.close();
    const afterClose = await ctx.awaitActivePage();
    expect(afterClose.url()).toBe(PAGE2_URL);
  });
});


================================================
FILE: packages/core/tests/integration/downloads.spec.ts
================================================
import { test, expect } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import Browserbase from "@browserbasehq/sdk";
import AdmZip from "adm-zip";
import { v3DynamicTestConfig } from "./v3.dynamic.config.js";
import { closeV3 } from "./testUtils.js";

// Matches a downloaded entry name of the form "sample-<13 digits>.pdf"
// (presumably a millisecond timestamp suffix — confirm against the download
// naming scheme). The digit run is matched exactly once: a `+` applied to the
// 13-digit group would also accept 26, 39, ... digits.
const pdfRe = /sample-\d{13}\.pdf/;
// Clicks a download link in a Browserbase session and checks that the file
// shows up in the session's downloads archive.
test.describe("downloads on browserbase", () => {
  let v3: V3;

  test.beforeEach(async () => {
    v3 = new V3(v3DynamicTestConfig);
    await v3.init();
  });

  test.afterEach(async () => {
    await closeV3(v3);
  });

  test("downloaded pdf is available via downloads api", async () => {
    const target = (
      process.env.STAGEHAND_BROWSER_TARGET ?? "local"
    ).toLowerCase();

    // Only meaningful when the browser target is Browserbase.
    test.skip(
      target !== "browserbase",
      "Skipping Browserbase-only downloads test in LOCAL mode",
    );

    // The downloads API cannot be queried without an API key.
    test.skip(
      !process.env.BROWSERBASE_API_KEY,
      "Skipping test: BROWSERBASE_API_KEY not set",
    );

    const page = v3.context.pages()[0];
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/download-on-click/",
    );
    await page.locator("/html/body/button").click();

    // One polling attempt: fetch the session's downloads zip and look for the pdf.
    // Throwing (or a failed expect) makes `toPass` retry until its timeout.
    const checkDownloadedPdf = async (): Promise<void> => {
      const client = new Browserbase();
      const sessionId = v3.browserbaseSessionId;
      const archive = await client.sessions.downloads.list(sessionId);
      if (!archive) {
        throw new Error(`Download buffer is empty for session ${sessionId}`);
      }

      const archiveBytes = Buffer.from(await archive.arrayBuffer());
      const entries = new AdmZip(archiveBytes).getEntries();
      const pdfEntry = entries.find((entry) => pdfRe.test(entry.entryName));

      if (!pdfEntry) {
        const entryNames = JSON.stringify(
          entries.map((entry) => entry.entryName),
        );
        throw new Error(
          `Session ${sessionId} is missing a file matching "${pdfRe.toString()}" in its zip entries: ${entryNames}`,
        );
      }

      // Expected byte size of the sample pdf.
      expect(pdfEntry.header.size).toBe(13264);
    };

    await expect(checkDownloadedPdf).toPass({ timeout: 30_000 });
  });
});


================================================
FILE: packages/core/tests/integration/flowLogger.spec.ts
================================================
import { expect, test } from "@playwright/test";
import { z } from "zod";
import { InMemoryEventSink } from "../../lib/v3/flowlogger/EventSink.js";
import { FlowEvent } from "../../lib/v3/flowlogger/FlowLogger.js";
import { performUnderstudyMethod } from "../../lib/v3/handlers/handlerUtils/actHandlerUtils.js";
import { V3 } from "../../lib/v3/v3.js";
import {
  createScriptedAisdkTestLlmClient,
  closeV3,
  doneToolResponse,
  findLastEncodedId,
  toolCallResponse,
} from "./testUtils.js";
import { getV3TestConfig } from "./v3.config.js";

/**
 * Wraps an HTML string in a `data:text/html` URL.
 *
 * @param html - Markup to embed; it is percent-encoded with `encodeURIComponent`.
 * @returns The resulting data URL.
 */
function encodeHtml(html: string): string {
  const payload = encodeURIComponent(html);
  return "data:text/html," + payload;
}

/**
 * Builds a V3 instance whose flow events are captured in an in-memory sink.
 *
 * Every `FlowEvent` seen on the instance's bus is forwarded to the sink, and
 * `eventStore.query` is replaced so queries read from that sink, scoped to the
 * event store's session id.
 *
 * @param overrides - Passed through to `getV3TestConfig`.
 * @returns The (not yet initialised) V3 instance.
 */
function createRecordedFlowLoggerV3(
  overrides: Parameters<typeof getV3TestConfig>[0] = {},
): V3 {
  const instance = new V3(getV3TestConfig(overrides));
  const recorder = new InMemoryEventSink();

  // Only FlowEvent instances are recorded; the emit result is intentionally not awaited.
  const recordFlowEvent = (payload: unknown): void => {
    if (!(payload instanceof FlowEvent)) return;
    void recorder.emit(payload);
  };
  instance.bus.on("*", recordFlowEvent);

  instance.eventStore.query = (criteria) => {
    const scoped = { ...criteria, sessionId: instance.eventStore.sessionId };
    return recorder.query(scoped);
  };

  return instance;
}

/** Returns every flow event the instance's event store yields for an empty query. */
async function listRecordedFlowEvents(v3: V3): Promise<FlowEvent[]> {
  const recorded = await v3.eventStore.query({});
  return recorded;
}

/**
 * Snapshots the ids of all flow events recorded so far, so that later events
 * can be told apart from earlier ones.
 */
async function captureFlowEventBaseline(v3: V3): Promise<Set<string>> {
  const seenIds = new Set<string>();
  for (const { eventId } of await listRecordedFlowEvents(v3)) {
    seenIds.add(eventId);
  }
  return seenIds;
}

/**
 * Lists the recorded flow events whose ids are not part of `baseline`.
 *
 * @param v3 - Instance whose recorded events are listed.
 * @param baseline - Event ids to exclude (typically a prior snapshot).
 */
async function listRecordedFlowEventsSince(
  v3: V3,
  baseline: Set<string>,
): Promise<FlowEvent[]> {
  const fresh: FlowEvent[] = [];
  for (const event of await listRecordedFlowEvents(v3)) {
    if (!baseline.has(event.eventId)) {
      fresh.push(event);
    }
  }
  return fresh;
}

/** Returns, in their original order, the events whose `eventType` equals `eventType`. */
function eventsOfType(events: FlowEvent[], eventType: string): FlowEvent[] {
  const matches: FlowEvent[] = [];
  for (const candidate of events) {
    if (candidate.eventType === eventType) {
      matches.push(candidate);
    }
  }
  return matches;
}

/**
 * Asserts that exactly one event of `eventType` exists and returns it.
 *
 * @param events - Events to search.
 * @param eventType - Event type that must occur exactly once.
 */
function requireSingleEvent(events: FlowEvent[], eventType: string): FlowEvent {
  const candidates = eventsOfType(events, eventType);
  const failureMessage = `expected a single ${eventType}`;
  expect(candidates, failureMessage).toHaveLength(1);
  const [only] = candidates;
  return only;
}

/** Asserts that the event has no parents, i.e. its `eventParentIds` is empty. */
function expectRootEvent(event: FlowEvent): void {
  const ancestry = event.eventParentIds;
  expect(ancestry).toEqual([]);
}

/**
 * Asserts that `child` sits directly under `parent`: the child's parent chain
 * must be the parent's own chain followed by the parent's id.
 */
function expectDirectParent(child: FlowEvent, parent: FlowEvent): void {
  const expectedAncestry = parent.eventParentIds.concat(parent.eventId);
  expect(child.eventParentIds).toEqual(expectedAncestry);
}

/**
 * Asserts that every parent id referenced by any event belongs to an event
 * present in the same list.
 */
function assertAllParentIdsResolve(events: FlowEvent[]): void {
  const knownIds = new Set<string>();
  for (const { eventId } of events) {
    knownIds.add(eventId);
  }

  events.forEach((event) => {
    event.eventParentIds.forEach((parentId) => {
      const isKnown = knownIds.has(parentId);
      expect(
        isKnown,
        `${event.eventType} references missing parent ${parentId}`,
      ).toBe(true);
    });
  });
}

/** Asserts that every event carries the given `sessionId`. */
function assertSessionIds(events: FlowEvent[], sessionId: string): void {
  events.forEach((event) => {
    expect(event.sessionId).toBe(sessionId);
  });
}

/**
 * Selects the events of `eventType` that are direct children of `parent`.
 *
 * An event counts as a direct child when its parent chain equals the parent's
 * chain followed by the parent's id (compared via their JSON form).
 */
function directChildrenOfType(
  events: FlowEvent[],
  parent: FlowEvent,
  eventType: string,
): FlowEvent[] {
  const expectedAncestry = JSON.stringify([
    ...parent.eventParentIds,
    parent.eventId,
  ]);

  return events.filter((candidate) => {
    if (candidate.eventType !== eventType) {
      return false;
    }
    return JSON.stringify(candidate.eventParentIds) === expectedAncestry;
  });
}

/**
 * Asserts that a single `eventType` event exists together with a single
 * matching "completed" event that is its direct child, and returns the former.
 *
 * @param events - Events to inspect.
 * @param eventType - Type of the opening event.
 * @param completedEventType - Type of the completion event; by default the
 *   opening type with a trailing "Event" replaced by "CompletedEvent".
 */
function assertCompletedEnvelope(
  events: FlowEvent[],
  eventType: string,
  completedEventType = `${eventType.replace(/Event$/, "")}CompletedEvent`,
): FlowEvent {
  const opening = requireSingleEvent(events, eventType);
  const closing = requireSingleEvent(events, completedEventType);

  // The completion must hang directly off the opening event.
  expect(closing.eventParentIds).toEqual([
    ...opening.eventParentIds,
    opening.eventId,
  ]);

  return opening;
}

/**
 * Asserts that at least one LLM request/response event exists and that each
 * one has a resolvable nearest parent which is not itself an "Llm…" event.
 */
function assertNoFloatingLlmEvents(events: FlowEvent[]): void {
  const llmTypes = new Set(["LlmRequestEvent", "LlmResponseEvent"]);
  const llmEvents = events.filter((event) => llmTypes.has(event.eventType));

  const byId = new Map<string, FlowEvent>();
  for (const event of events) {
    byId.set(event.eventId, event);
  }

  expect(llmEvents.length).toBeGreaterThan(0);

  llmEvents.forEach((event) => {
    const ancestry = event.eventParentIds;
    expect(
      ancestry.length,
      `${event.eventType} is floating`,
    ).toBeGreaterThan(0);

    // The last id in the chain is the immediate parent.
    const nearestId = ancestry[ancestry.length - 1];
    const nearest = nearestId ? byId.get(nearestId) : undefined;
    expect(
      nearest,
      `${event.eventType} has no resolved parent`,
    ).toBeDefined();
    expect(nearest?.eventType.startsWith("Llm")).toBe(false);
  });
}

/**
 * Asserts that at least one "Cdp…" event exists and that each one is anchored:
 * a `CdpCallEvent` must sit under a non-Cdp parent, and every other Cdp event
 * must sit directly under a `CdpCallEvent`.
 */
function assertNoFloatingCdpEvents(events: FlowEvent[]): void {
  const byId = new Map<string, FlowEvent>();
  for (const event of events) {
    byId.set(event.eventId, event);
  }
  const cdpEvents = events.filter((event) => event.eventType.startsWith("Cdp"));

  expect(cdpEvents.length).toBeGreaterThan(0);

  for (const event of cdpEvents) {
    const ancestry = event.eventParentIds;
    expect(
      ancestry.length,
      `${event.eventType} is floating`,
    ).toBeGreaterThan(0);

    // The last id in the chain is the immediate parent.
    const nearestId = ancestry[ancestry.length - 1];
    const nearest = nearestId ? byId.get(nearestId) : undefined;
    expect(
      nearest,
      `${event.eventType} has no resolved parent`,
    ).toBeDefined();

    if (event.eventType !== "CdpCallEvent") {
      expect(nearest?.eventType).toBe("CdpCallEvent");
      continue;
    }
    expect(nearest?.eventType.startsWith("Cdp")).toBe(false);
  }
}

/**
 * Asserts the shape of a CDP call made outside any other event: a single
 * root-level `CdpCallEvent` and a response (success or error) whose only
 * parent is that call. Every event must also carry `sessionId`.
 */
function assertDirectRootCdpEvents(
  events: FlowEvent[],
  sessionId: string,
): void {
  const call = requireSingleEvent(events, "CdpCallEvent");
  const response = events.find(
    (event) =>
      event.eventType === "CdpResponseEvent" ||
      event.eventType === "CdpResponseErrorEvent",
  );

  expect(response, "expected a direct CDP response event").toBeDefined();
  assertSessionIds(events, sessionId);
  expectRootEvent(call);

  const expectedAncestry = [call.eventId];
  expect(response?.eventParentIds).toEqual(expectedAncestry);
}

/**
 * Returns a copy of `input` whose keys are inserted in `localeCompare` order.
 *
 * @param input - Counts keyed by name; not modified.
 */
function sortCountRecord(
  input: Record<string, number>,
): Record<string, number> {
  const entries = Object.entries(input);
  entries.sort((a, b) => a[0].localeCompare(b[0]));
  return Object.fromEntries(entries);
}

/**
 * Asserts how many events of each type occurred, ignoring every event whose
 * type starts with "Cdp".
 *
 * @param events - Events to tally.
 * @param expected - Expected count per non-Cdp event type.
 */
function assertNonCdpEventCounts(
  events: FlowEvent[],
  expected: Record<string, number>,
): void {
  const tally: Record<string, number> = {};
  for (const { eventType } of events) {
    if (eventType.startsWith("Cdp")) {
      continue;
    }
    tally[eventType] = (tally[eventType] ?? 0) + 1;
  }

  expect(sortCountRecord(tally)).toEqual(sortCountRecord(expected));
}

test.describe("flow logger integration", () => {
  test.describe.configure({ mode: "serial" });

  test("act emits a rooted tree with nested understudy, llm, and cdp events", async () => {
    const buttonText = "Flow Logger Act Button";
    const llmClient = createScriptedAisdkTestLlmClient({
      jsonResponses: {
        act: (options) => ({
          elementId: findLastEncodedId(options),
          description: `click ${buttonText}`,
          method: "click",
          arguments: [],
          twoStep: false,
        }),
      },
    });

    const v3 = createRecordedFlowLoggerV3({
      llmClient,
    });

    await v3.init();

    try {
      const page = v3.context.pages()[0];
      await page.goto(
        encodeHtml(`
          <!doctype html>
          <html>
            <body>
              <button
                id="act-target"
                onclick="document.body.dataset.clicked='true'"
              >
                ${buttonText}
              </button>
            </body>
          </html>
        `),
      );

      const baseline = await captureFlowEventBaseline(v3);
      const result = await v3.act(`Click the ${buttonText}`);
      const events = await listRecordedFlowEventsSince(v3, baseline);

      expect(result.success).toBe(true);
      expect(
        await page.evaluate(() => document.body.dataset.clicked ?? ""),
      ).toBe("true");
      const root = requireSingleEvent(events, "StagehandActEvent");
      const completed = requireSingleEvent(
        events,
        "StagehandActCompletedEvent",
      );
      const llmRequest = requireSingleEvent(events, "LlmRequestEvent");
      const llmResponse = requireSingleEvent(events, "LlmResponseEvent");
      const understudy = requireSingleEvent(events, "UnderstudyClickEvent");
      const understudyCompleted = requireSingleEvent(
        events,
        "UnderstudyClickCompletedEvent",
      );

      assertAllParentIdsResolve(events);
      assertNonCdpEventCounts(events, {
        LlmRequestEvent: 1,
        LlmResponseEvent: 1,
        StagehandActCompletedEvent: 1,
        StagehandActEvent: 1,
        UnderstudyClickCompletedEvent: 1,
        UnderstudyClickEvent: 1,
      });
      assertSessionIds(events, v3.flowLoggerContext.sessionId);
      expectRootEvent(root);
      expectDirectParent(completed, root);
      expect(llmRequest.eventParentIds).toEqual([root.eventId]);
      expect(llmResponse.eventParentIds).toEqual([root.eventId]);
      expect(understudy.eventParentIds).toEqual([root.eventId]);
      expectDirectParent(understudyCompleted, understudy);
      assertNoFloatingLlmEvents(events);
      assertNoFloatingCdpEvents(events);
    } finally {
      await closeV3(v3);
    }
  });

  test("observe and extract emit rooted trees with complete nested llm and cdp events", async () => {
    const observeText = "Flow Logger Observe Button";
    const extractTitle = "Flow Logger Extract Title";
    const llmClient = createScriptedAisdkTestLlmClient({
      jsonResponses: {
        Observation: (options) => ({
          elements: [
            {
              elementId: findLastEncodedId(options),
              description: observeText,
              method: "click",
              arguments: [],
            },
          ],
        }),
        Extraction: {
          title: extractTitle,
        },
        Metadata: {
          completed: true,
          progress: "done",
        },
      },
    });

    const v3 = createRecordedFlowLoggerV3({
      llmClient,
    });

    await v3.init();

    try {
      const page = v3.context.pages()[0];
      await page.goto(
        encodeHtml(`
          <!doctype html>
          <html>
            <body>
              <button id="observe-target">${observeText}</button>
              <h1>${extractTitle}</h1>
            </body>
          </html>
        `),
      );

      const observeBaseline = await captureFlowEventBaseline(v3);
      const observeResult = await v3.observe(`Find the ${observeText}`);

      expect(observeResult).toHaveLength(1);
      expect(observeResult[0].method).toBe("click");

      const observeEvents = await listRecordedFlowEventsSince(
        v3,
        observeBaseline,
      );
      const observeRoot = requireSingleEvent(
        observeEvents,
        "StagehandObserveEvent",
      );
      const observeCompleted = requireSingleEvent(
        observeEvents,
        "StagehandObserveCompletedEvent",
      );
      const observeLlmRequests = eventsOfType(observeEvents, "LlmRequestEvent");
      const observeLlmResponses = eventsOfType(
        observeEvents,
        "LlmResponseEvent",
      );

      assertAllParentIdsResolve(observeEvents);
      assertNonCdpEventCounts(observeEvents, {
        LlmRequestEvent: 1,
        LlmResponseEvent: 1,
        StagehandObserveCompletedEvent: 1,
        StagehandObserveEvent: 1,
      });
      assertSessionIds(observeEvents, v3.flowLoggerContext.sessionId);
      expectRootEvent(observeRoot);
      expectDirectParent(observeCompleted, observeRoot);
      expect(observeLlmRequests).toHaveLength(1);
      expect(observeLlmResponses).toHaveLength(1);
      expect(observeLlmRequests[0].eventParentIds).toEqual([
        observeRoot.eventId,
      ]);
      expect(observeLlmResponses[0].eventParentIds).toEqual([
        observeRoot.eventId,
      ]);
      assertNoFloatingLlmEvents(observeEvents);
      assertNoFloatingCdpEvents(observeEvents);

      const extractBaseline = await captureFlowEventBaseline(v3);
      const extractResult = await v3.extract(
        "Extract the title",
        z.object({ title: z.string() }),
      );

      expect(extractResult).toEqual({ title: extractTitle });

      const extractEvents = await listRecordedFlowEventsSince(
        v3,
        extractBaseline,
      );
      const extractRoot = requireSingleEvent(
        extractEvents,
        "StagehandExtractEvent",
      );
      const extractCompleted = requireSingleEvent(
        extractEvents,
        "StagehandExtractCompletedEvent",
      );
      const extractLlmRequests = eventsOfType(extractEvents, "LlmRequestEvent");
      const extractLlmResponses = eventsOfType(
        extractEvents,
        "LlmResponseEvent",
      );

      assertAllParentIdsResolve(extractEvents);
      assertNonCdpEventCounts(extractEvents, {
        LlmRequestEvent: 2,
        LlmResponseEvent: 2,
        StagehandExtractCompletedEvent: 1,
        StagehandExtractEvent: 1,
      });
      assertSessionIds(extractEvents, v3.flowLoggerContext.sessionId);
      expectRootEvent(extractRoot);
      expectDirectParent(extractCompleted, extractRoot);
      expect(extractLlmRequests).toHaveLength(2);
      expect(extractLlmResponses).toHaveLength(2);

      for (const event of [...extractLlmRequests, ...extractLlmResponses]) {
        expect(event.eventParentIds).toEqual([extractRoot.eventId]);
      }

      assertNoFloatingLlmEvents(extractEvents);
      assertNoFloatingCdpEvents(extractEvents);
    } finally {
      await closeV3(v3);
    }
  });

  test("agent.execute -> act carries the full agent -> stagehand -> understudy -> cdp + llm hierarchy", async () => {
    const buttonText = "Agent Act Button";
    const llmClient = createScriptedAisdkTestLlmClient({
      jsonResponses: {
        act: (options) => ({
          elementId: findLastEncodedId(options),
          description: `click ${buttonText}`,
          method: "click",
          arguments: [],
          twoStep: false,
        }),
      },
      generateResponses: [
        toolCallResponse("act", { action: `click the ${buttonText}` }, "act-1"),
        doneToolResponse("finished", true, "done-1"),
      ],
    });

    const v3 = createRecordedFlowLoggerV3({
      experimental: true,
      llmClient,
    });

    await v3.init();

    try {
      const page = v3.context.pages()[0];
      await page.goto(
        encodeHtml(`
          <!doctype html>
          <html>
            <body>
              <button
                id="agent-act-target"
                onclick="document.body.dataset.agentAct='true'"
              >
                ${buttonText}
              </button>
            </body>
          </html>
        `),
      );

      const baseline = await captureFlowEventBaseline(v3);
      const result = await v3.agent().execute({
        instruction: `Click the ${buttonText} and finish.`,
        maxSteps: 2,
      });
      const events = await listRecordedFlowEventsSince(v3, baseline);

      expect(result.success).toBe(true);
      expect(
        await page.evaluate(() => document.body.dataset.agentAct ?? ""),
      ).toBe("true");
      const agentRoot = assertCompletedEnvelope(events, "AgentExecuteEvent");
      const actRoot = requireSingleEvent(events, "StagehandActEvent");
      const actCompleted = requireSingleEvent(
        events,
        "StagehandActCompletedEvent",
      );
      const understudy = requireSingleEvent(events, "UnderstudyClickEvent");
      const understudyCompleted = requireSingleEvent(
        events,
        "UnderstudyClickCompletedEvent",
      );

      assertAllParentIdsResolve(events);
      assertNonCdpEventCounts(events, {
        AgentExecuteCompletedEvent: 1,
        AgentExecuteEvent: 1,
        LlmRequestEvent: 3,
        LlmResponseEvent: 3,
        StagehandActCompletedEvent: 1,
        StagehandActEvent: 1,
        UnderstudyClickCompletedEvent: 1,
        UnderstudyClickEvent: 1,
      });
      assertSessionIds(events, v3.flowLoggerContext.sessionId);
      expectRootEvent(agentRoot);
      expect(actRoot.eventParentIds).toEqual([agentRoot.eventId]);
      expectDirectParent(actCompleted, actRoot);
      expectDirectParent(understudy, actRoot);
      expectDirectParent(understudyCompleted, understudy);
      expect(
        directChildrenOfType(events, agentRoot, "LlmRequestEvent"),
      ).toHaveLength(2);
      expect(
        directChildrenOfType(events, agentRoot, "LlmResponseEvent"),
      ).toHaveLength(2);
      expect(
        directChildrenOfType(events, actRoot, "LlmRequestEvent"),
      ).toHaveLength(1);
      expect(
        directChildrenOfType(events, actRoot, "LlmResponseEvent"),
      ).toHaveLength(1);
      assertNoFloatingLlmEvents(events);
      assertNoFloatingCdpEvents(events);
    } finally {
      await closeV3(v3);
    }
  });

  // Drives agent.execute with a scripted LLM that calls the `fillForm` tool once
  // and then the done tool, and checks the recorded flow events form the tree
  // agent -> observe / act -> understudy fill, with every LLM event parented.
  test("agent.execute -> fillForm carries the observe -> act -> understudy hierarchy with no missing layers", async () => {
    const llmClient = createScriptedAisdkTestLlmClient({
      jsonResponses: {
        // Scripted "Observation" JSON answer: one element to be filled with
        // "hello"; the element id comes from findLastEncodedId(options).
        Observation: (options) => ({
          elements: [
            {
              elementId: findLastEncodedId(options),
              description: "name input",
              method: "fill",
              arguments: ["hello"],
            },
          ],
        }),
      },
      // Scripted generate responses, in order: a fillForm tool call, then done.
      generateResponses: [
        toolCallResponse(
          "fillForm",
          {
            fields: [
              {
                action: "type hello into the name field",
                value: "hello",
              },
            ],
          },
          "fillform-1",
        ),
        doneToolResponse("finished", true, "done-1"),
      ],
    });

    const v3 = createRecordedFlowLoggerV3({
      experimental: true,
      llmClient,
    });

    await v3.init();

    try {
      const page = v3.context.pages()[0];
      await page.goto(
        encodeHtml(`
          <!doctype html>
          <html>
            <body>
              <input id="name" />
            </body>
          </html>
        `),
      );

      // Capture the baseline after navigation so only events emitted by the
      // agent run below are inspected.
      const baseline = await captureFlowEventBaseline(v3);
      const result = await v3.agent().execute({
        instruction: "Fill the form and finish.",
        maxSteps: 2,
      });
      const events = await listRecordedFlowEventsSince(v3, baseline);

      expect(result.success).toBe(true);
      // The fill must have actually reached the page, not just been logged.
      expect(await page.locator("#name").inputValue()).toBe("hello");

      const agentRoot = assertCompletedEnvelope(events, "AgentExecuteEvent");
      const observeRoot = requireSingleEvent(events, "StagehandObserveEvent");
      const observeCompleted = requireSingleEvent(
        events,
        "StagehandObserveCompletedEvent",
      );
      const actRoot = requireSingleEvent(events, "StagehandActEvent");
      const actCompleted = requireSingleEvent(
        events,
        "StagehandActCompletedEvent",
      );
      const understudyFill = requireSingleEvent(events, "UnderstudyFillEvent");
      const understudyFillCompleted = requireSingleEvent(
        events,
        "UnderstudyFillCompletedEvent",
      );

      assertAllParentIdsResolve(events);
      // Three LLM request/response pairs in total; their expected placement
      // (2 under the agent, 1 under observe, 0 under act) is asserted below.
      assertNonCdpEventCounts(events, {
        AgentExecuteCompletedEvent: 1,
        AgentExecuteEvent: 1,
        LlmRequestEvent: 3,
        LlmResponseEvent: 3,
        StagehandActCompletedEvent: 1,
        StagehandActEvent: 1,
        StagehandObserveCompletedEvent: 1,
        StagehandObserveEvent: 1,
        UnderstudyFillCompletedEvent: 1,
        UnderstudyFillEvent: 1,
      });
      assertSessionIds(events, v3.flowLoggerContext.sessionId);
      expectRootEvent(agentRoot);
      // Observe and act are siblings: each has the agent root as its only parent.
      expect(observeRoot.eventParentIds).toEqual([agentRoot.eventId]);
      expectDirectParent(observeCompleted, observeRoot);
      expect(actRoot.eventParentIds).toEqual([agentRoot.eventId]);
      expectDirectParent(actCompleted, actRoot);
      expectDirectParent(understudyFill, actRoot);
      expectDirectParent(understudyFillCompleted, understudyFill);
      expect(
        directChildrenOfType(events, observeRoot, "LlmRequestEvent"),
      ).toHaveLength(1);
      expect(
        directChildrenOfType(events, observeRoot, "LlmResponseEvent"),
      ).toHaveLength(1);
      expect(
        directChildrenOfType(events, agentRoot, "LlmRequestEvent"),
      ).toHaveLength(2);
      expect(
        directChildrenOfType(events, agentRoot, "LlmResponseEvent"),
      ).toHaveLength(2);
      // The act step replays the observed action, so no LLM events are
      // expected directly under it in this flow.
      expect(
        directChildrenOfType(events, actRoot, "LlmRequestEvent"),
      ).toHaveLength(0);
      expect(
        directChildrenOfType(events, actRoot, "LlmResponseEvent"),
      ).toHaveLength(0);
      assertNoFloatingLlmEvents(events);
      assertNoFloatingCdpEvents(events);
    } finally {
      // Always release the browser, even when an assertion above fails.
      await closeV3(v3);
    }
  });

  // Drives agent.execute with a scripted LLM that calls the `extract` tool once
  // and then the done tool, and checks that the extract event and its LLM
  // events are nested under the agent root.
  test("agent.execute -> extract carries the full agent -> extract -> cdp + llm hierarchy", async () => {
    const extractTitle = "Agent Extract Title";
    const llmClient = createScriptedAisdkTestLlmClient({
      // Scripted JSON answers keyed by "Extraction" and "Metadata".
      jsonResponses: {
        Extraction: {
          title: extractTitle,
        },
        Metadata: {
          completed: true,
          progress: "done",
        },
      },
      // Scripted generate responses, in order: an extract tool call, then done.
      generateResponses: [
        toolCallResponse(
          "extract",
          {
            instruction: "extract the title",
            schema: {
              type: "object",
              properties: {
                title: { type: "string" },
              },
            },
          },
          "extract-1",
        ),
        doneToolResponse("finished", true, "done-1"),
      ],
    });

    const v3 = createRecordedFlowLoggerV3({
      experimental: true,
      llmClient,
    });

    await v3.init();

    try {
      const page = v3.context.pages()[0];
      await page.goto(
        encodeHtml(`
          <!doctype html>
          <html>
            <body>
              <h1>${extractTitle}</h1>
            </body>
          </html>
        `),
      );

      // Capture the baseline after navigation so only events emitted by the
      // agent run below are inspected.
      const baseline = await captureFlowEventBaseline(v3);
      const result = await v3.agent().execute({
        instruction: "Extract the title and finish.",
        maxSteps: 2,
      });

      expect(result.success).toBe(true);

      const events = await listRecordedFlowEventsSince(v3, baseline);
      const agentRoot = assertCompletedEnvelope(events, "AgentExecuteEvent");
      const extractRoot = requireSingleEvent(events, "StagehandExtractEvent");
      const extractCompleted = requireSingleEvent(
        events,
        "StagehandExtractCompletedEvent",
      );

      assertAllParentIdsResolve(events);
      // Four LLM request/response pairs in total; the assertions below expect
      // two directly under the agent root and two directly under extract.
      assertNonCdpEventCounts(events, {
        AgentExecuteCompletedEvent: 1,
        AgentExecuteEvent: 1,
        LlmRequestEvent: 4,
        LlmResponseEvent: 4,
        StagehandExtractCompletedEvent: 1,
        StagehandExtractEvent: 1,
      });
      assertSessionIds(events, v3.flowLoggerContext.sessionId);
      expectRootEvent(agentRoot);
      expect(extractRoot.eventParentIds).toEqual([agentRoot.eventId]);
      expectDirectParent(extractCompleted, extractRoot);
      expect(
        directChildrenOfType(events, agentRoot, "LlmRequestEvent"),
      ).toHaveLength(2);
      expect(
        directChildrenOfType(events, agentRoot, "LlmResponseEvent"),
      ).toHaveLength(2);
      expect(
        directChildrenOfType(events, extractRoot, "LlmRequestEvent"),
      ).toHaveLength(2);
      expect(
        directChildrenOfType(events, extractRoot, "LlmResponseEvent"),
      ).toHaveLength(2);
      assertNoFloatingLlmEvents(events);
      assertNoFloatingCdpEvents(events);
    } finally {
      // Always release the browser, even when an assertion above fails.
      await closeV3(v3);
    }
  });

  // Two-part test using two separate V3 instances:
  //   1. goto + screenshot issued through agent tools must be parented to the
  //      agent execute event;
  //   2. the same goto + screenshot issued directly on the page must each be
  //      their own root event, with no LLM events recorded.
  test("agent.execute nests page events under the agent root and direct page calls root themselves", async () => {
    // The same data page is visited by both the agent run and the direct run.
    const agentPageUrl = encodeHtml(`
      <!doctype html>
      <html>
        <body>
          <h1>Agent Flow Logger Page</h1>
        </body>
      </html>
    `);
    // Scripted generate responses, in order: goto, screenshot, done.
    const agentLlmClient = createScriptedAisdkTestLlmClient({
      generateResponses: [
        toolCallResponse("goto", { url: agentPageUrl }, "goto-1"),
        toolCallResponse("screenshot", {}, "screenshot-1"),
        doneToolResponse("finished", true, "done-1"),
      ],
    });

    const agentV3 = createRecordedFlowLoggerV3({
      experimental: true,
      llmClient: agentLlmClient,
    });

    await agentV3.init();

    try {
      const baseline = await captureFlowEventBaseline(agentV3);
      const result = await agentV3.agent().execute({
        instruction: "Go to the test page, take a screenshot, and finish.",
        maxSteps: 3,
      });

      expect(result.success).toBe(true);
      expect(result.completed).toBe(true);

      const events = await listRecordedFlowEventsSince(agentV3, baseline);
      const root = assertCompletedEnvelope(events, "AgentExecuteEvent");
      const pageGoto = requireSingleEvent(events, "PageGotoEvent");
      const pageGotoCompleted = requireSingleEvent(
        events,
        "PageGotoCompletedEvent",
      );
      const pageScreenshot = requireSingleEvent(events, "PageScreenshotEvent");
      const pageScreenshotCompleted = requireSingleEvent(
        events,
        "PageScreenshotCompletedEvent",
      );
      const llmRequests = eventsOfType(events, "LlmRequestEvent");
      const llmResponses = eventsOfType(events, "LlmResponseEvent");

      assertAllParentIdsResolve(events);
      assertNonCdpEventCounts(events, {
        AgentExecuteCompletedEvent: 1,
        AgentExecuteEvent: 1,
        LlmRequestEvent: 3,
        LlmResponseEvent: 3,
        PageGotoCompletedEvent: 1,
        PageGotoEvent: 1,
        PageScreenshotCompletedEvent: 1,
        PageScreenshotEvent: 1,
      });
      assertSessionIds(events, agentV3.flowLoggerContext.sessionId);
      expectRootEvent(root);
      // Page events triggered by agent tools hang directly off the agent root.
      expect(pageGoto.eventParentIds).toEqual([root.eventId]);
      expectDirectParent(pageGotoCompleted, pageGoto);
      expect(pageScreenshot.eventParentIds).toEqual([root.eventId]);
      expectDirectParent(pageScreenshotCompleted, pageScreenshot);
      expect(llmRequests).toHaveLength(3);
      expect(llmResponses).toHaveLength(3);

      // Every LLM event in this run is a direct child of the agent root.
      for (const event of [...llmRequests, ...llmResponses]) {
        expect(event.eventParentIds).toEqual([root.eventId]);
      }

      assertNoFloatingLlmEvents(events);
      assertNoFloatingCdpEvents(events);
    } finally {
      await closeV3(agentV3);
    }

    // Second half: a fresh instance created with no options, driven directly
    // through the page API instead of through an agent.
    const directV3 = createRecordedFlowLoggerV3();
    await directV3.init();

    try {
      const page = directV3.context.pages()[0];
      const baseline = await captureFlowEventBaseline(directV3);

      await page.goto(agentPageUrl);
      await page.screenshot({ fullPage: false });

      const events = await listRecordedFlowEventsSince(directV3, baseline);
      const pageGoto = requireSingleEvent(events, "PageGotoEvent");
      const pageGotoCompleted = requireSingleEvent(
        events,
        "PageGotoCompletedEvent",
      );
      const pageScreenshot = requireSingleEvent(events, "PageScreenshotEvent");
      const pageScreenshotCompleted = requireSingleEvent(
        events,
        "PageScreenshotCompletedEvent",
      );

      assertAllParentIdsResolve(events);
      assertNonCdpEventCounts(events, {
        PageGotoCompletedEvent: 1,
        PageGotoEvent: 1,
        PageScreenshotCompletedEvent: 1,
        PageScreenshotEvent: 1,
      });
      assertSessionIds(events, directV3.flowLoggerContext.sessionId);
      // With no enclosing agent event, each page call is checked as a root.
      expectRootEvent(pageGoto);
      expectDirectParent(pageGotoCompleted, pageGoto);
      expectRootEvent(pageScreenshot);
      expectDirectParent(pageScreenshotCompleted, pageScreenshot);
      expect(eventsOfType(events, "LlmRequestEvent")).toHaveLength(0);
      expect(eventsOfType(events, "LlmResponseEvent")).toHaveLength(0);
      assertNoFloatingCdpEvents(events);
    } finally {
      await closeV3(directV3);
    }
  });

  // Exercises four direct entry points on one V3 instance (page.evaluate,
  // page.snapshot, performUnderstudyMethod "click", page.sendCDP). A fresh
  // baseline is captured before each call so every section only inspects the
  // events produced by that single call.
  test("direct page methods, direct understudy calls, and direct sendCDP all attach complete event trees to the session", async () => {
    const v3 = createRecordedFlowLoggerV3();
    await v3.init();

    try {
      const page = v3.context.pages()[0];
      await page.goto(
        encodeHtml(`
          <!doctype html>
          <html>
            <body>
              <button
                id="direct-click"
                onclick="document.body.dataset.directClick='true'"
              >
                Direct Click
              </button>
              <div id="ready">ready</div>
            </body>
          </html>
        `),
      );

      // --- page.evaluate ---
      let baseline = await captureFlowEventBaseline(v3);
      await page.evaluate(() => document.getElementById("ready")?.textContent);
      let events = await listRecordedFlowEventsSince(v3, baseline);
      let root = assertCompletedEnvelope(events, "PageEvaluateEvent");
      assertAllParentIdsResolve(events);
      assertNonCdpEventCounts(events, {
        PageEvaluateCompletedEvent: 1,
        PageEvaluateEvent: 1,
      });
      assertSessionIds(events, v3.flowLoggerContext.sessionId);
      expectRootEvent(root);
      expect(eventsOfType(events, "LlmRequestEvent")).toHaveLength(0);
      expect(eventsOfType(events, "LlmResponseEvent")).toHaveLength(0);
      assertNoFloatingCdpEvents(events);

      // --- page.snapshot ---
      baseline = await captureFlowEventBaseline(v3);
      await page.snapshot();
      events = await listRecordedFlowEventsSince(v3, baseline);
      root = assertCompletedEnvelope(events, "PageSnapshotEvent");
      assertAllParentIdsResolve(events);
      assertNonCdpEventCounts(events, {
        PageSnapshotCompletedEvent: 1,
        PageSnapshotEvent: 1,
      });
      assertSessionIds(events, v3.flowLoggerContext.sessionId);
      expectRootEvent(root);
      expect(eventsOfType(events, "LlmRequestEvent")).toHaveLength(0);
      expect(eventsOfType(events, "LlmResponseEvent")).toHaveLength(0);
      assertNoFloatingCdpEvents(events);

      // --- direct understudy click on the button, addressed by XPath ---
      baseline = await captureFlowEventBaseline(v3);
      await performUnderstudyMethod(
        page,
        page.mainFrame(),
        "click",
        "/html/body/button",
        [],
        30_000,
      );
      events = await listRecordedFlowEventsSince(v3, baseline);
      root = assertCompletedEnvelope(events, "UnderstudyClickEvent");
      assertAllParentIdsResolve(events);
      assertNonCdpEventCounts(events, {
        UnderstudyClickCompletedEvent: 1,
        UnderstudyClickEvent: 1,
      });
      assertSessionIds(events, v3.flowLoggerContext.sessionId);
      expectRootEvent(root);
      expect(eventsOfType(events, "LlmRequestEvent")).toHaveLength(0);
      expect(eventsOfType(events, "LlmResponseEvent")).toHaveLength(0);
      assertNoFloatingCdpEvents(events);
      // The button's onclick sets this dataset flag, proving the click landed.
      // This read happens after the events for the click were already listed.
      expect(
        await page.evaluate(() => document.body.dataset.directClick ?? ""),
      ).toBe("true");

      // --- raw CDP call ---
      baseline = await captureFlowEventBaseline(v3);
      const cdpResult = await page.sendCDP<{
        result?: { value?: number };
      }>("Runtime.evaluate", {
        expression: "2 + 2",
        returnByValue: true,
      });
      events = await listRecordedFlowEventsSince(v3, baseline);
      expect(cdpResult.result?.value).toBe(4);
      expect(eventsOfType(events, "LlmRequestEvent")).toHaveLength(0);
      expect(eventsOfType(events, "LlmResponseEvent")).toHaveLength(0);
      assertAllParentIdsResolve(events);
      assertDirectRootCdpEvents(events, v3.flowLoggerContext.sessionId);
    } finally {
      // Always release the browser, even when an assertion above fails.
      await closeV3(v3);
    }
  });
});


================================================
FILE: packages/core/tests/integration/frame-get-location-and-click.spec.ts
================================================
import { expect, test } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import { v3TestConfig } from "./v3.config.js";

test.describe("Coordinate-based clicking", () => {
  let v3: V3;

  // Every test starts from a freshly initialised V3 instance.
  test.beforeEach(async () => {
    v3 = new V3(v3TestConfig);
    await v3.init();
  });

  // Best-effort teardown: a failing close must not mask the test result.
  test.afterEach(async () => {
    await v3?.close?.().catch(() => {});
  });

  test("clicking by coordinates toggles a button state", async () => {
    const page = v3.context.pages()[0];

    // Reads the text the page mirrors into #out ("idle" or "clicked").
    const readOutText = () =>
      page.mainFrame().evaluate(() => {
        const out = document.getElementById("out");
        return out?.textContent || "";
      });

    await page.goto(
      "data:text/html," +
        encodeURIComponent(
          `<!doctype html><html><body>
            <button id="btn" onclick="this.dataset.clicked = (this.dataset.clicked==='1'?'0':'1')">Click</button>
            <div id="out"></div>
            <script>
              const btn = document.getElementById('btn');
              const out = document.getElementById('out');
              const update = () => { out.textContent = btn.dataset.clicked === '1' ? 'clicked' : 'idle'; };
              update();
              btn.addEventListener('click', update);
            </script>
          </body></html>`,
        ),
    );

    // Before any interaction the page reports "idle".
    expect(await readOutText()).toBe("idle");

    // Resolve the button's box through Frame.getLocationForSelector and aim
    // for its centre point.
    const box = await page.mainFrame().getLocationForSelector("#btn");
    const cx = Math.round(box.x + box.width / 2);
    const cy = Math.round(box.y + box.height / 2);

    // First coordinate click flips the state to "clicked".
    await page.click(cx, cy);
    expect(await readOutText()).toBe("clicked");

    // A second click at the same point toggles it back to "idle".
    await page.click(cx, cy);
    expect(await readOutText()).toBe("idle");
  });
});


================================================
FILE: packages/core/tests/integration/iframe-ctx-addInitScript-race.spec.ts
================================================
import { expect, test } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import { v3TestConfig } from "./v3.config.js";
import type { V3Context } from "../../lib/v3/understudy/context.js";
import type { Page } from "../../lib/v3/understudy/page.js";

/** Delay applied to the init-script CDP send when no valid override is given. */
const DEFAULT_INIT_SCRIPT_DELAY_MS = 250;

/**
 * Effective delay in milliseconds, read once at module load from
 * IFRAME_INIT_SCRIPT_SEND_DELAY_MS. An unset, non-numeric, non-finite, zero or
 * negative value falls back to DEFAULT_INIT_SCRIPT_DELAY_MS.
 */
const INIT_SCRIPT_DELAY_MS = (() => {
  const override = process.env.IFRAME_INIT_SCRIPT_SEND_DELAY_MS;
  // Map "unset" onto NaN so a single validity check covers every bad input.
  const candidate = override === undefined ? Number.NaN : Number(override);
  return Number.isFinite(candidate) && candidate > 0
    ? candidate
    : DEFAULT_INIT_SCRIPT_DELAY_MS;
})();

// Default timeout for the popup / child-frame polling helpers in this file.
const POPUP_TIMEOUT_MS = 20_000;
// Marker embedded as a comment in the init script source; the patched CDP
// sender looks for it to recognise this spec's script.
const RACE_INIT_SCRIPT_SENTINEL = "__stagehand_init_script_race_sentinel__";
// Window property the init script sets to true when it runs.
const INIT_SCRIPT_MARKER_KEY = "__stagehand_init_script_loaded__";
// URL opened as the popup.
const POPUP_URL = "https://example.com/";
// URL of the iframe injected into the popup.
const POPUP_IFRAME_URL = "https://example.org/";

// Init script registered on the context: carries the sentinel comment and sets
// the marker property on window.
const INIT_SCRIPT_SOURCE = `
(() => {
  /* ${RACE_INIT_SCRIPT_SENTINEL} */
  window["${INIT_SCRIPT_MARKER_KEY}"] = true;
})();
`;

/** Structural view of the one connection method this spec replaces. */
type PatchedConn = {
  _sendViaSession: (
    sessionId: string,
    method: string,
    params?: object,
  ) => Promise<unknown>;
};

/**
 * One intercepted `_sendViaSession` call. `sequence` is assigned when the call
 * is actually forwarded; `isRaceInitScript` flags the sentinel init script.
 */
type SessionCommandRecord = {
  sequence: number;
  sessionId: string;
  method: string;
  isRaceInitScript: boolean;
};

/** A named way of opening a popup; `prepare` sets up the opener page. */
type PopupTriggerCase = {
  name: string;
  prepare: (opener: Page) => Promise<void>;
};

/**
 * Closes every page currently known to the context. Individual close
 * failures are tolerated; the call resolves once all attempts have settled.
 */
async function closeAllPages(ctx: V3Context): Promise<void> {
  const closeAttempts = ctx.pages().map((openPage) => openPage.close());
  await Promise.allSettled(closeAttempts);
}

/**
 * Polls the context until a page appears whose target id is not in
 * `knownTargetIds`, and returns it.
 *
 * Each round first scans `ctx.pages()`, then asks the context for its active
 * page (waiting up to 500 ms), then sleeps 50 ms.
 *
 * @throws Error when no new page is seen before `timeoutMs` elapses.
 */
async function waitForPopupPage(
  ctx: V3Context,
  knownTargetIds: Set<string>,
  timeoutMs = POPUP_TIMEOUT_MS,
): Promise<Page> {
  const isUnseen = (candidate: Page): boolean =>
    !knownTargetIds.has(candidate.targetId());
  const pause = (ms: number) =>
    new Promise((resolve) => setTimeout(resolve, ms));
  const giveUpAt = Date.now() + timeoutMs;

  while (Date.now() < giveUpAt) {
    const discovered = ctx.pages().find((candidate) => isUnseen(candidate));
    if (discovered) return discovered;

    try {
      const activePage = await ctx.awaitActivePage(500);
      if (isUnseen(activePage)) return activePage;
    } catch {
      // keep polling
    }

    await pause(50);
  }

  throw new Error("Timed out waiting for popup page");
}

/**
 * Polls `page` until one of its non-main frames reports `expectedUrl` as its
 * `window.location.href`, and returns that frame.
 *
 * Frames whose evaluation fails are skipped and retried on the next round;
 * rounds are 50 ms apart.
 *
 * @throws Error when no matching frame is found before `timeoutMs` elapses.
 */
async function waitForChildFrame(
  page: Page,
  expectedUrl: string,
  timeoutMs = POPUP_TIMEOUT_MS,
): Promise<ReturnType<Page["frames"]>[number]> {
  const rootFrameId = page.mainFrame().frameId;
  const giveUpAt = Date.now() + timeoutMs;

  // Resolves to the frame's current href, or undefined when the frame cannot
  // be evaluated yet.
  const readHref = async (frame: ReturnType<Page["frames"]>[number]) => {
    try {
      return await frame.evaluate(() => window.location.href);
    } catch {
      // frame context may not be ready yet
      return undefined;
    }
  };

  while (Date.now() < giveUpAt) {
    for (const frame of page.frames()) {
      if (
        frame.frameId !== rootFrameId &&
        (await readHref(frame)) === expectedUrl
      ) {
        return frame;
      }
    }
    await new Promise((resolve) => setTimeout(resolve, 50));
  }

  throw new Error("Timed out waiting for child frame");
}

/**
 * Navigates the opener to about:blank and injects an `<a id="open-popup"
 * target="_blank">` pointing at POPUP_URL, so clicking it opens the popup.
 */
async function prepareTargetBlankPopupOpener(opener: Page): Promise<void> {
  await opener.goto("about:blank", { waitUntil: "domcontentloaded" });
  await opener.mainFrame().evaluate((destination) => {
    // Properties are applied in the listed order: id, target, href, text.
    const anchor = Object.assign(document.createElement("a"), {
      id: "open-popup",
      target: "_blank",
      href: destination,
      textContent: "open popup",
    });
    document.body.appendChild(anchor);
  }, POPUP_URL);
}

/**
 * Navigates the opener to about:blank and injects a `<button id="open-popup">`
 * whose click handler calls `window.open(POPUP_URL, "_blank")`.
 */
async function prepareWindowOpenPopupOpener(opener: Page): Promise<void> {
  await opener.goto("about:blank", { waitUntil: "domcontentloaded" });
  await opener.mainFrame().evaluate((destination) => {
    const trigger = Object.assign(document.createElement("button"), {
      id: "open-popup",
      textContent: "open popup",
    });
    trigger.addEventListener("click", () => {
      window.open(destination, "_blank");
    });
    document.body.appendChild(trigger);
  }, POPUP_URL);
}

// The popup-opening variants the spec is run against; one test is generated
// per entry, and `name` is interpolated into the test title.
const POPUP_TRIGGER_CASES: PopupTriggerCase[] = [
  {
    name: 'target="_blank" link click',
    prepare: prepareTargetBlankPopupOpener,
  },
  {
    name: "window.open from click handler",
    prepare: prepareWindowOpenPopupOpener,
  },
];

// Reproduces an ordering race: the connection's `_sendViaSession` is patched so
// that the sentinel init script's Page.addScriptToEvaluateOnNewDocument send is
// delayed, and every forwarded command is recorded with a sequence number. Each
// test then checks that, per new session, the init script was still forwarded
// before Runtime.runIfWaitingForDebugger.
test.describe("repro: popup iframe addInitScript race under delayed CDP send", () => {
  // One shared V3 instance and one shared patch, so tests must not interleave.
  test.describe.configure({ mode: "serial" });

  let restoreSend: (() => void) | undefined;
  let v3: V3 | undefined;
  let ctx: V3Context | undefined;
  // Monotonic counter and log of forwarded commands; both reset per test.
  let sequence = 0;
  let records: SessionCommandRecord[] = [];

  test.beforeAll(async () => {
    v3 = new V3(v3TestConfig);
    await v3.init();
    ctx = v3.context;

    // The connection is reached through a cast; fail loudly if the shape this
    // spec relies on is not there.
    const conn = (ctx as unknown as { conn?: PatchedConn }).conn;
    if (!conn || typeof conn._sendViaSession !== "function") {
      throw new Error("Unable to access CDP connection for race repro patch");
    }

    const originalSendViaSession = conn._sendViaSession.bind(conn);
    conn._sendViaSession = function patchedSendViaSession(
      sessionId: string,
      method: string,
      params?: object,
    ) {
      // Only string `source` params are inspected for the sentinel.
      const source =
        typeof (params as { source?: unknown } | undefined)?.source === "string"
          ? (params as { source: string }).source
          : "";
      const isRaceInitScript =
        method === "Page.addScriptToEvaluateOnNewDocument" &&
        source.includes(RACE_INIT_SCRIPT_SENTINEL);

      // The record is written at forward time, so a delayed command gets the
      // sequence number of when it was really sent, not when it was requested.
      const sendNow = () => {
        records.push({
          sequence: ++sequence,
          sessionId,
          method,
          isRaceInitScript,
        });
        return originalSendViaSession(sessionId, method, params);
      };

      // Hold back only the sentinel init script; everything else goes through
      // immediately.
      if (isRaceInitScript && INIT_SCRIPT_DELAY_MS > 0) {
        return new Promise((resolve, reject) => {
          setTimeout(() => {
            sendNow().then(resolve, reject);
          }, INIT_SCRIPT_DELAY_MS);
        });
      }

      return sendNow();
    };

    restoreSend = () => {
      conn._sendViaSession = originalSendViaSession;
    };

    // Registered after patching so the send for this script goes through the
    // patched path.
    await ctx.addInitScript(INIT_SCRIPT_SOURCE);
  });

  test.afterAll(async () => {
    restoreSend?.();
    await v3?.close?.().catch(() => {});
  });

  test.beforeEach(async () => {
    records = [];
    sequence = 0;
    if (!ctx) return;
    await closeAllPages(ctx);
  });

  test.afterEach(async () => {
    if (!ctx) return;
    await closeAllPages(ctx);
  });

  for (const popupCase of POPUP_TRIGGER_CASES) {
    test(`should send addScript before resume for popup targets via ${popupCase.name}`, async () => {
      if (!ctx) throw new Error("Context not initialized");

      const opener = await ctx.newPage();
      await popupCase.prepare(opener);

      // Snapshot targets and sessions seen so far; anything not in these sets
      // after the click is attributed to the popup flow.
      const knownTargetIds = new Set(ctx.pages().map((p) => p.targetId()));
      const knownSessionIds = new Set(
        records.map((record) => record.sessionId),
      );

      await opener.locator("#open-popup").click();

      const popup = await waitForPopupPage(ctx, knownTargetIds);
      await popup.waitForLoadState("load", POPUP_TIMEOUT_MS);
      // Inject an iframe into the loaded popup and wait for it to report
      // POPUP_IFRAME_URL.
      await popup.mainFrame().evaluate((iframeUrl) => {
        const iframe = document.createElement("iframe");
        iframe.id = "race-child-iframe";
        iframe.src = iframeUrl;
        document.body.appendChild(iframe);
      }, POPUP_IFRAME_URL);
      const iframe = await waitForChildFrame(
        popup,
        POPUP_IFRAME_URL,
        POPUP_TIMEOUT_MS,
      );

      // Read the marker the init script sets, in both the popup and the iframe.
      const popupInitScriptMarker = await popup.mainFrame().evaluate((key) => {
        return Boolean(Reflect.get(window, key));
      }, INIT_SCRIPT_MARKER_KEY);
      const iframeInitScriptMarker = await iframe.evaluate((key) => {
        return Boolean(Reflect.get(window, key));
      }, INIT_SCRIPT_MARKER_KEY);

      // For each new session, remember the first sequence number at which the
      // init script and the resume command were forwarded.
      const perSession = new Map<
        string,
        {
          raceInitScriptSequence?: number;
          resumeSequence?: number;
        }
      >();

      for (const record of records) {
        if (knownSessionIds.has(record.sessionId)) continue;
        const entry = perSession.get(record.sessionId) ?? {};
        if (
          record.isRaceInitScript &&
          entry.raceInitScriptSequence === undefined
        ) {
          entry.raceInitScriptSequence = record.sequence;
        }
        if (
          record.method === "Runtime.runIfWaitingForDebugger" &&
          entry.resumeSequence === undefined
        ) {
          entry.resumeSequence = record.sequence;
        }
        perSession.set(record.sessionId, entry);
      }

      // Only sessions where both commands were observed can be compared; at
      // least one such session must exist for the test to be meaningful.
      const comparableSessions = [...perSession.entries()]
        .map(([sessionId, entry]) => ({ sessionId, ...entry }))
        .filter(
          (entry) =>
            entry.raceInitScriptSequence !== undefined &&
            entry.resumeSequence !== undefined,
        );
      expect(comparableSessions.length).toBeGreaterThan(0);

      // A violation is a session whose init script went out after its resume.
      const orderingViolations = comparableSessions.filter((entry) => {
        return (
          (entry.raceInitScriptSequence as number) >
          (entry.resumeSequence as number)
        );
      });

      expect(
        orderingViolations,
        `Expected addScript before resume for ${popupCase.name}. initScriptDelayMs=${INIT_SCRIPT_DELAY_MS}; comparableSessions=${JSON.stringify(comparableSessions)}`,
      ).toEqual([]);
      expect(popupInitScriptMarker).toBe(true);
      expect(iframeInitScriptMarker).toBe(true);
    });
  }
});


================================================
FILE: packages/core/tests/integration/iframe-ctx-addInitScript.spec.ts
================================================
import { test, expect } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import { v3TestConfig } from "./v3.config.js";
import { V3Context } from "../../lib/v3/understudy/context.js";
import type { Page } from "../../lib/v3/understudy/page.js";

// True when STAGEHAND_BROWSER_TARGET is "browserbase" (compared
// case-insensitively); an unset variable is treated as "local".
const isBrowserbase =
  (process.env.STAGEHAND_BROWSER_TARGET ?? "local").toLowerCase() ===
  "browserbase";
/** Smallest timeout (ms) an override may resolve to. */
const MIN_TIMEOUT_MS = 3_000;
/** Largest timeout (ms) an override may resolve to. */
const MAX_TIMEOUT_MS = 120_000;

/**
 * Resolves a timeout override (typically an environment variable) to a number
 * of milliseconds within [MIN_TIMEOUT_MS, MAX_TIMEOUT_MS].
 *
 * @param value Raw override text; `undefined`, empty, or whitespace-only means
 *   "not configured".
 * @param fallbackMs Timeout used when no override is configured or when the
 *   override is not a finite number.
 * @returns The override (or the fallback when unconfigured) clamped to the
 *   allowed range; `fallbackMs` as-is when the override is not a finite number.
 */
const parseBoundedTimeoutMs = (
  value: string | undefined,
  fallbackMs: number,
): number => {
  // A variable that is set but blank must behave like an unset one:
  // Number("") is 0, which would otherwise be clamped to MIN_TIMEOUT_MS and
  // silently shrink the timeout instead of using the fallback.
  const isUnset = value === undefined || value.trim() === "";
  const parsed = Number(isUnset ? fallbackMs : value);
  if (!Number.isFinite(parsed)) return fallbackMs;
  return Math.max(MIN_TIMEOUT_MS, Math.min(MAX_TIMEOUT_MS, parsed));
};

// Each timeout can be overridden through its environment variable; the default
// is larger when running against Browserbase than locally.
const CHILD_FRAME_TIMEOUT_MS = parseBoundedTimeoutMs(
  process.env.IFRAME_CHILD_FRAME_TIMEOUT_MS,
  isBrowserbase ? 80_000 : 40_000,
);
const POPUP_TIMEOUT_MS = parseBoundedTimeoutMs(
  process.env.IFRAME_POPUP_TIMEOUT_MS,
  isBrowserbase ? 60_000 : 40_000,
);
const POPUP_URL_TIMEOUT_MS = parseBoundedTimeoutMs(
  process.env.IFRAME_POPUP_URL_TIMEOUT_MS,
  isBrowserbase ? 80_000 : 40_000,
);
// Minimum spacing between periodic progress logs while polling.
const DEBUG_INTERVAL_MS = 5_000;
// Debug logging is always on for Browserbase runs, or opt-in via IFRAME_DEBUG=1.
const iframeDebugEnabled = isBrowserbase || process.env.IFRAME_DEBUG === "1";
const TEST_VIEWPORT = { width: 1288, height: 711 };

/** Node of the frame tree returned by the CDP `Page.getFrameTree` call. */
type FrameTreeNode = {
  frame: { id: string; parentId?: string; url?: string };
  childFrames?: FrameTreeNode[];
};
/** Element type of `page.frames()`. */
type ChildFrame = ReturnType<Page["frames"]>[number];
/**
 * Result of probing one child frame: either `href`/`readyState` from a
 * successful evaluation, or `error` describing why evaluation failed.
 */
type ChildFrameProbe = {
  child: ChildFrame;
  href?: string;
  readyState?: DocumentReadyState;
  error?: string;
};

/**
 * Turns any thrown value into a log-friendly string: the `message` of an
 * `Error`, otherwise the value's `String(...)` conversion.
 */
const formatError = (error: unknown): string =>
  error instanceof Error ? error.message : String(error);

/**
 * Flattens a frame tree into a list in pre-order (a node first, then each of
 * its children's subtrees, left to right).
 *
 * @param node Root of the (sub)tree to flatten.
 * @param out Array the entries are appended to; a new array by default.
 * @returns `out`, with one `{ id, parentId, url }` entry per frame. A missing
 *   `parentId` becomes `null` and a missing `url` becomes `""`.
 */
const flattenFrameTree = (
  node: FrameTreeNode,
  out: Array<{ id: string; parentId: string | null; url: string }> = [],
): Array<{ id: string; parentId: string | null; url: string }> => {
  // Explicit stack instead of recursion; children are pushed in reverse so the
  // leftmost child is popped, and therefore emitted, first.
  const pending: FrameTreeNode[] = [node];
  for (
    let current = pending.pop();
    current !== undefined;
    current = pending.pop()
  ) {
    const { id, parentId, url } = current.frame;
    out.push({ id, parentId: parentId ?? null, url: url ?? "" });
    pending.push(...[...(current.childFrames ?? [])].reverse());
  }
  return out;
};

/**
 * Writes an `[iframe-debug]` line to the console when iframe debugging is
 * enabled; does nothing otherwise.
 *
 * @param step Label identifying the step being logged.
 * @param payload Optional detail. A string is appended verbatim, an object is
 *   appended as JSON, and an object that cannot be serialized is replaced by
 *   a placeholder.
 */
function debugLog(
  step: string,
  payload?: Record<string, unknown> | string,
): void {
  if (!iframeDebugEnabled) return;

  const prefix = `[iframe-debug] ${step}`;
  switch (typeof payload) {
    case "undefined":
      console.log(prefix);
      return;
    case "string":
      console.log(`${prefix}: ${payload}`);
      return;
    default:
      try {
        console.log(`${prefix}: ${JSON.stringify(payload)}`);
      } catch {
        console.log(`${prefix}: <unserializable payload>`);
      }
  }
}

/**
 * Evaluates a small state probe in every known frame of `page` (main frame
 * first, de-duplicated by frame id) and returns one record per frame.
 *
 * Each record carries `frameId` and `sessionId` ("root" when the frame has no
 * session id), followed by either the probed DOM state or an `error` string
 * when the frame could not be evaluated. All frames are probed concurrently.
 */
async function collectFrameSnapshot(
  page: Page,
): Promise<Array<Record<string, unknown>>> {
  const main = page.mainFrame();
  const framesById = new Map<string, ReturnType<Page["frames"]>[number]>();
  framesById.set(main.frameId, main);
  page.frames().forEach((frame) => framesById.set(frame.frameId, frame));

  const snapshotOf = async (
    frame: ReturnType<Page["frames"]>[number],
  ): Promise<Record<string, unknown>> => {
    let details: Record<string, unknown>;
    try {
      details = await frame.evaluate(() => ({
        href: location.href,
        readyState: document.readyState,
        visibilityState: document.visibilityState,
        iframeCount: document.querySelectorAll("iframe").length,
        hasShadowHost: Boolean(document.querySelector("shadow-host")),
      }));
    } catch (error) {
      details = { error: formatError(error) };
    }
    // Identity fields come first so they lead the serialized output.
    return {
      frameId: frame.frameId,
      sessionId: frame.sessionId ?? "root",
      ...details,
    };
  };

  return Promise.all([...framesById.values()].map(snapshotOf));
}

/**
 * Collects a diagnostic picture of `page` and emits it through `debugLog`
 * under the "page-diagnostics" step. Does nothing when iframe debugging is
 * disabled.
 *
 * The record contains basic page facts, the main frame's DOM state, the CDP
 * frame tree, and a per-frame snapshot. The DOM-state and frame-tree sections
 * are each best-effort: a failure is stored as a `*Error` string and the
 * remaining sections are still gathered.
 *
 * @param page Page to inspect.
 * @param reason Free-text label explaining why diagnostics were requested.
 * @param markerSelector Optional CSS selector; when given, the DOM state
 *   reports whether it matches and the matched element's bounding rect.
 */
async function logPageDiagnostics(
  page: Page,
  reason: string,
  markerSelector?: string,
): Promise<void> {
  if (!iframeDebugEnabled) return;
  const diagnostics: Record<string, unknown> = {
    reason,
    pageUrl: page.url(),
    mainFrameId: page.mainFrame().frameId,
    knownFrameCount: page.frames().length,
  };

  // Section 1: DOM state as seen from inside the main frame.
  try {
    const domState = await page.mainFrame().evaluate((marker) => {
      const el = marker ? document.querySelector(marker) : null;
      const rect =
        el instanceof Element ? el.getBoundingClientRect().toJSON() : null;
      return {
        href: location.href,
        readyState: document.readyState,
        visibilityState: document.visibilityState,
        hidden: document.hidden,
        hasFocus: document.hasFocus(),
        innerWidth: window.innerWidth,
        innerHeight: window.innerHeight,
        devicePixelRatio: window.devicePixelRatio,
        markerSelector: marker,
        markerPresent: Boolean(el),
        markerRect: rect,
        iframeCount: document.querySelectorAll("iframe").length,
      };
    }, markerSelector);
    diagnostics.domState = domState;
  } catch (error) {
    diagnostics.domStateError = formatError(error);
  }

  // Section 2: the frame tree as reported over CDP, flattened to a list.
  try {
    const frameTreeResponse = (await page.sendCDP("Page.getFrameTree")) as {
      frameTree?: FrameTreeNode;
    };
    if (frameTreeResponse.frameTree) {
      diagnostics.cdpFrameTree = flattenFrameTree(frameTreeResponse.frameTree);
    }
  } catch (error) {
    diagnostics.cdpFrameTreeError = formatError(error);
  }

  // Section 3: per-frame snapshot of the frames the page object knows about.
  diagnostics.frameSnapshot = await collectFrameSnapshot(page);
  debugLog("page-diagnostics", diagnostics);
}

/**
 * Closes every page currently known to the context. Individual close
 * failures are tolerated; the call resolves once all attempts have settled.
 */
async function closeAllPages(ctx: V3Context): Promise<void> {
  const closeAttempts = ctx.pages().map((openPage) => openPage.close());
  await Promise.allSettled(closeAttempts);
}

/**
 * Poll until a child (non-main) frame of `page` reports
 * `document.readyState === "complete"` at exactly `expectedChildUrl`, then
 * return that frame.
 *
 * Every 100ms the known frames are re-read and each child frame is probed
 * with an in-frame `evaluate`. A probe that throws is recorded as a failed
 * probe and does not abort the wait.
 *
 * @param page - Page whose frames are inspected.
 * @param expectedChildUrl - Exact `location.href` the child frame must report.
 * @param timeoutMs - Maximum time to keep polling.
 * @returns The first probed child frame that is loaded at the expected URL.
 * @throws Error when no matching frame is found before the deadline; page
 *   diagnostics are logged first.
 */
async function waitForChildFrame(
  page: Page,
  expectedChildUrl: string,
  timeoutMs = CHILD_FRAME_TIMEOUT_MS,
): Promise<ChildFrame> {
  const mainFrameId = page.mainFrame().frameId;
  const deadline = Date.now() + timeoutMs;
  let observedFrameCount = 0;
  const observedChildFrameIds = new Set<string>();
  let lastUrl = "";
  let lastLogAt = Date.now();

  while (Date.now() < deadline) {
    const frames = page.frames();
    observedFrameCount = Math.max(observedFrameCount, frames.length);
    lastUrl = page.url();

    // Filter once; both the id bookkeeping and the probes use this list.
    const discovered = frames.filter((f) => f.frameId !== mainFrameId);
    const childIds = discovered.map((f) => f.frameId);
    for (const childId of childIds) observedChildFrameIds.add(childId);

    // Decide once per iteration whether the throttled debug output is due.
    // Re-checking the interval after the "progress" log has already reset
    // `lastLogAt` would suppress the "not-ready" log (which carries the probe
    // details) in practically every iteration.
    const logDue =
      iframeDebugEnabled && Date.now() - lastLogAt >= DEBUG_INTERVAL_MS;
    if (logDue) {
      debugLog("waitForChildFrame:progress", {
        url: lastUrl,
        mainFrameId,
        observedFrameCount,
        childIds,
        expectedChildUrl,
      });
      lastLogAt = Date.now();
    }

    // Prefer recently-discovered frames first; stale swapped frame ids
    // can remain visible in the registry while the live OOPIF is ready.
    const childFrames = [...discovered].reverse();

    if (childFrames.length) {
      const probes = await Promise.all(
        childFrames.map(async (child): Promise<ChildFrameProbe> => {
          try {
            const state = await child.evaluate(
              (): { href: string; readyState: DocumentReadyState } => ({
                href: location.href,
                readyState: document.readyState,
              }),
            );
            return {
              child,
              href: state.href,
              readyState: state.readyState,
            };
          } catch (error) {
            const failedProbe: ChildFrameProbe = {
              child,
              href: undefined,
              readyState: undefined,
              error: formatError(error),
            };
            return failedProbe;
          }
        }),
      );

      const ready = probes.find(
        (probe) =>
          probe.readyState === "complete" && probe.href === expectedChildUrl,
      );
      if (ready) {
        debugLog("waitForChildFrame:ready", {
          childFrameId: ready.child.frameId,
          childSessionId: ready.child.sessionId ?? "root",
          childUrl: ready.href ?? "<unknown>",
          expectedChildUrl,
          url: lastUrl,
        });
        return ready.child;
      }

      if (logDue) {
        debugLog("waitForChildFrame:not-ready", {
          url: lastUrl,
          mainFrameId,
          expectedChildUrl,
          probes: probes.map((probe) => ({
            frameId: probe.child.frameId,
            sessionId: probe.child.sessionId ?? "root",
            readyState: probe.readyState ?? "<unknown>",
            href: probe.href ?? "<unknown>",
            error: probe.error ?? "<none>",
          })),
        });
        lastLogAt = Date.now();
      }
    }
    await new Promise((r) => setTimeout(r, 100));
  }
  await logPageDiagnostics(page, "waitForChildFrame timeout");
  throw new Error(
    `Timed out waiting for child frame to load (timeout=${timeoutMs}ms, mainFrameId=${mainFrameId}, expectedChildUrl=${expectedChildUrl}, maxObservedFrames=${observedFrameCount}, observedChildFrameIds=[${[...observedChildFrameIds].join(",")}], url=${lastUrl || "<unknown>"})`,
  );
}

/**
 * Poll `page.url()` every 100ms until it contains `expectedUrlSubstring`.
 *
 * @param page - Page whose URL is watched.
 * @param expectedUrlSubstring - Substring the URL must include.
 * @param timeoutMs - Maximum time to keep polling.
 * @throws Error when the substring never appears before the deadline; page
 *   diagnostics are logged first.
 */
async function waitForPageUrl(
  page: Page,
  expectedUrlSubstring: string,
  timeoutMs = POPUP_URL_TIMEOUT_MS,
): Promise<void> {
  const giveUpAt = Date.now() + timeoutMs;
  let lastUrl = "";
  let lastLogAt = Date.now();
  const pause = (): Promise<void> =>
    new Promise((wake) => setTimeout(wake, 100));

  while (Date.now() < giveUpAt) {
    lastUrl = page.url();

    const progressDue =
      iframeDebugEnabled && Date.now() - lastLogAt >= DEBUG_INTERVAL_MS;
    if (progressDue) {
      debugLog("waitForPageUrl:progress", { expectedUrlSubstring, lastUrl });
      lastLogAt = Date.now();
    }

    const matched = lastUrl.includes(expectedUrlSubstring);
    if (matched) {
      debugLog("waitForPageUrl:ready", { expectedUrlSubstring, lastUrl });
      return;
    }

    await pause();
  }

  const reason = `waitForPageUrl timeout for ${expectedUrlSubstring}`;
  await logPageDiagnostics(page, reason);
  throw new Error(
    `Timed out waiting for popup URL to include "${expectedUrlSubstring}" (timeout=${timeoutMs}ms, lastUrl=${lastUrl || "<unknown>"})`,
  );
}

/**
 * Get a popup page into a state where its child frame can be waited on.
 *
 * Steps: wait for `domcontentloaded`, wait for `markerSelector` to be
 * attached, nudge the page's scroll position, then log page diagnostics.
 *
 * NOTE(review): the scroll step always looks up a `shadow-host` element,
 * regardless of `markerSelector`. When none is found it scrolls to the bottom
 * and back to the top instead.
 *
 * @param page - Popup page to prepare.
 * @param markerSelector - Selector that must be attached before continuing.
 * @param timeoutMs - Timeout applied to both wait steps.
 */
async function preparePopupForFrameAttach(
  page: Page,
  markerSelector: string,
  timeoutMs = CHILD_FRAME_TIMEOUT_MS,
): Promise<void> {
  const startDetails = { markerSelector, timeoutMs, url: page.url() };
  debugLog("preparePopupForFrameAttach:start", startDetails);

  await page.waitForLoadState("domcontentloaded", timeoutMs);
  await page.waitForSelector(markerSelector, {
    state: "attached",
    timeout: timeoutMs,
  });

  // Runs inside the page: bring the shadow host into view when there is one,
  // otherwise scroll down and back up, then emit a synthetic scroll event.
  await page.mainFrame().evaluate(() => {
    const shadowHost = document.querySelector("shadow-host");
    if (!(shadowHost instanceof HTMLElement)) {
      window.scrollTo(0, document.body.scrollHeight);
      window.scrollTo(0, 0);
    } else {
      shadowHost.scrollIntoView({ block: "center", inline: "center" });
    }
    window.dispatchEvent(new Event("scroll"));
  });

  await logPageDiagnostics(
    page,
    "preparePopupForFrameAttach:ready",
    markerSelector,
  );
}

/**
 * Resize `page` to the shared test viewport and log page diagnostics.
 */
async function ensurePopupViewport(page: Page): Promise<void> {
  const { width, height } = TEST_VIEWPORT;
  await page.setViewportSize(width, height);
  await logPageDiagnostics(page, "ensurePopupViewport");
}

/**
 * Wait for a page other than `opener` to show up in `ctx`.
 *
 * Each polling round first scans `ctx.pages()` for a page whose main frame id
 * differs from the opener's, then asks the context for its active page (up to
 * 500ms) and accepts it if it is not the opener. Rounds are 100ms apart.
 *
 * @param ctx - Context whose pages are inspected.
 * @param opener - Page that triggered the popup.
 * @param timeoutMs - Maximum time to keep polling.
 * @returns The first non-opener page found.
 * @throws Error listing the observed main frame ids when the deadline passes.
 */
async function waitForPopupPage(
  ctx: V3Context,
  opener: Page,
  timeoutMs = POPUP_TIMEOUT_MS,
): Promise<Page> {
  const openerMainFrameId = opener.mainFrame().frameId;
  const giveUpAt = Date.now() + timeoutMs;
  let lastLogAt = Date.now();

  while (Date.now() < giveUpAt) {
    const openPages = ctx.pages();

    for (const candidate of openPages) {
      if (candidate.mainFrame().frameId === openerMainFrameId) {
        continue;
      }
      debugLog("waitForPopupPage:found", {
        openerMainFrameId,
        popupMainFrameId: candidate.mainFrame().frameId,
        popupUrl: candidate.url(),
      });
      return candidate;
    }

    const progressDue =
      iframeDebugEnabled && Date.now() - lastLogAt >= DEBUG_INTERVAL_MS;
    if (progressDue) {
      debugLog("waitForPopupPage:progress", {
        openerMainFrameId,
        observedPageIds: openPages.map((p) => p.mainFrame().frameId),
      });
      lastLogAt = Date.now();
    }

    try {
      const activePage = await ctx.awaitActivePage(500);
      const activeIsPopup =
        activePage.mainFrame().frameId !== openerMainFrameId;
      if (activeIsPopup) {
        debugLog("waitForPopupPage:active-non-opener", {
          openerMainFrameId,
          activeMainFrameId: activePage.mainFrame().frameId,
          activeUrl: activePage.url(),
        });
        return activePage;
      }
    } catch {
      // No active page within the window; keep polling until timeout.
    }

    await new Promise((wake) => setTimeout(wake, 100));
  }

  const observedIds: string[] = [];
  for (const known of ctx.pages()) {
    observedIds.push(known.mainFrame().frameId);
  }
  const pageIds = observedIds.join(", ");
  throw new Error(
    `Timed out waiting for popup page (timeout=${timeoutMs}ms, openerMainFrameId=${openerMainFrameId}, observedPages=[${pageIds}])`,
  );
}

test.describe("context.addInitScript with iframes", () => {
  // Pages under test and the child-frame documents they embed.
  const OOPIF_PAGE_URL =
    "https://browserbase.github.io/stagehand-eval-sites/sites/oopif-in-closed-shadow-dom/";
  const SPIF_PAGE_URL =
    "https://browserbase.github.io/stagehand-eval-sites/sites/spif-in-closed-shadow-dom/";
  const OOPIF_CHILD_URL =
    "https://seanmcguire12.github.io/stagehand-oopif-sites/sites/form-filling/";
  const SPIF_CHILD_URL =
    "https://browserbase.github.io/stagehand-eval-sites/sites/spif-in-closed-shadow-dom/iframe.html";
  const POPUP_SPIF_CHILD_URL =
    "https://browserbase.github.io/stagehand-eval-sites/sites/closed-shadow-dom-in-spif/embedded.html";

  // Computed colour produced by the init script registered in beforeAll.
  const RED = "rgb(255, 0, 0)";

  if (isBrowserbase) {
    test.describe.configure({ mode: "serial" });
  }

  let v3: V3;
  let ctx: V3Context;

  /** Evaluated inside a frame: computed background of the root element. */
  const readRootBackground = (): string => {
    return getComputedStyle(document.documentElement).backgroundColor;
  };

  /** Assert the red background on the page's main frame, then on `iframe`. */
  const expectRedBackgrounds = async (
    host: Page,
    iframe: ChildFrame,
  ): Promise<void> => {
    // Check main page background
    const mainBgColor = await host.mainFrame().evaluate(readRootBackground);
    expect(mainBgColor).toBe(RED);

    const iframeBgColor = await iframe.evaluate(readRootBackground);
    expect(iframeBgColor).toBe(RED);
  };

  /** Open `pageUrl` in a new page, wait for its child frame, check colours. */
  const checkFreshPage = async (
    pageUrl: string,
    childUrl: string,
  ): Promise<void> => {
    const page = await ctx.newPage();
    await page.goto(pageUrl, { waitUntil: "networkidle" });
    const iframe = await waitForChildFrame(page, childUrl);
    await expectRedBackgrounds(page, iframe);
  };

  /**
   * Open `openerUrl`, click its link, and return the resulting popup once it
   * is active, resized, and its URL contains `popupUrlFragment`.
   */
  const openPopupFrom = async (
    openerUrl: string,
    clickLogLabel: string,
    popupUrlFragment: string,
  ): Promise<Page> => {
    const page = await ctx.newPage();
    await page.goto(openerUrl, { waitUntil: "networkidle" });

    // Click link to open popup
    await page.locator("a").click();
    debugLog(clickLogLabel, { openerUrl: page.url() });

    // Wait for popup to open and become active
    const popup = await waitForPopupPage(ctx, page);
    ctx.setActivePage(popup);
    await ensurePopupViewport(popup);
    await waitForPageUrl(popup, popupUrlFragment);
    return popup;
  };

  test.beforeAll(async () => {
    debugLog("beforeAll:config", {
      browserTarget: process.env.STAGEHAND_BROWSER_TARGET ?? "local",
      childFrameTimeoutMs: CHILD_FRAME_TIMEOUT_MS,
      popupTimeoutMs: POPUP_TIMEOUT_MS,
      popupUrlTimeoutMs: POPUP_URL_TIMEOUT_MS,
    });
    v3 = new V3(v3TestConfig);
    await v3.init();
    ctx = v3.context;

    // Add init script that sets background to red
    await ctx.addInitScript(`
      (() => {
        document.addEventListener('DOMContentLoaded', () => {
          document.documentElement.style.backgroundColor = 'red';
        });
      })();
    `);
  });

  // Every test starts from, and leaves behind, a context with no open pages.
  test.beforeEach(async () => {
    await closeAllPages(ctx);
  });

  test.afterEach(async () => {
    await closeAllPages(ctx);
  });

  test.afterAll(async () => {
    await v3?.close?.().catch(() => {});
  });

  test.describe("direct navigation", () => {
    test("with OOPIF - sets background red in main page and iframe", async () => {
      await checkFreshPage(OOPIF_PAGE_URL, OOPIF_CHILD_URL);
    });

    test("with SPIF - sets background red in main page and iframe", async () => {
      await checkFreshPage(SPIF_PAGE_URL, SPIF_CHILD_URL);
    });
  });

  // NOTE(review): these two tests perform the same steps as the
  // "direct navigation" suite above (new page, then goto).
  test.describe("via newPage", () => {
    test("with OOPIF - sets background red in main page and iframe", async () => {
      await checkFreshPage(OOPIF_PAGE_URL, OOPIF_CHILD_URL);
    });

    test("with SPIF - sets background red in main page and iframe", async () => {
      await checkFreshPage(SPIF_PAGE_URL, SPIF_CHILD_URL);
    });
  });

  test.describe("via popup", () => {
    test("with OOPIF - sets background red in main page and iframe", async () => {
      const popup = await openPopupFrom(
        "https://browserbase.github.io/stagehand-eval-sites/sites/ctx-add-init-script-oopif/",
        "popup-oopif:clicked-link",
        "/stagehand-eval-sites/sites/oopif-in-closed-shadow-dom/",
      );

      // Navigate the popup to its own URL again before waiting on the frame.
      debugLog("popup-oopif:refresh-navigation", { url: popup.url() });
      await popup.goto(OOPIF_PAGE_URL, { waitUntil: "networkidle" });
      await logPageDiagnostics(
        popup,
        "popup-oopif:after-refresh",
        "shadow-host",
      );

      await preparePopupForFrameAttach(popup, "shadow-host");
      const iframe = await waitForChildFrame(popup, OOPIF_CHILD_URL);

      await expectRedBackgrounds(popup, iframe);
    });

    test("with SPIF - sets background red in main page and iframe", async () => {
      const popup = await openPopupFrom(
        "https://browserbase.github.io/stagehand-eval-sites/sites/ctx-add-init-script-spif/",
        "popup-spif:clicked-link",
        "/stagehand-eval-sites/sites/closed-shadow-dom-in-spif/",
      );

      await preparePopupForFrameAttach(popup, "iframe");
      const iframe = await waitForChildFrame(popup, POPUP_SPIF_CHILD_URL);

      await expectRedBackgrounds(popup, iframe);
    });
  });
});


================================================
FILE: packages/core/tests/integration/keep-alive.child.ts
================================================
import { V3 } from "../../lib/v3/v3.js";

/**
 * Child-process entry point for the keep-alive tests.
 *
 * Reads a base64 JSON config from the `cfg:`-prefixed argv entry, starts a V3
 * instance with it, prints one `__KEEPALIVE__{json}` line carrying the
 * connect URL and session id, and then acts out the requested scenario:
 * - "close": call `v3.close()` and exit with code 0.
 * - "sigterm" / "sigint": just return.
 * - "unhandled": schedule an unhandled promise rejection and return.
 *
 * @throws Error when the config argument is missing, `env` or `scenario` is
 *   invalid, or the scenario is unknown.
 */
async function main(): Promise<void> {
  const CFG_PREFIX = "cfg:";
  const encoded = process.argv.find((arg) => arg.startsWith(CFG_PREFIX));
  if (!encoded) {
    throw new Error("Missing child config payload.");
  }

  const raw = Buffer.from(
    encoded.slice(CFG_PREFIX.length),
    "base64",
  ).toString("utf8");
  const cfg = JSON.parse(raw) as {
    env: "LOCAL" | "BROWSERBASE";
    keepAlive: boolean;
    disableAPI: boolean;
    scenario: string;
    apiKey?: string;
    projectId?: string;
    debug?: boolean;
    viewMs?: number;
  };
  const {
    env,
    keepAlive,
    disableAPI,
    scenario,
    apiKey,
    projectId,
    debug = false,
    viewMs = 0,
  } = cfg;

  // Console output is emitted only when the parent asked for debug mode.
  const log = (message: string): void => {
    if (!debug) return;
    console.log(message);
  };

  const envIsKnown = env === "LOCAL" || env === "BROWSERBASE";
  if (!envIsKnown) {
    throw new Error("KEEP_ALIVE_ENV must be LOCAL or BROWSERBASE");
  }
  if (!scenario) {
    throw new Error("KEEP_ALIVE_SCENARIO is required");
  }

  log(
    `[keep-alive-child] env=${env} keepAlive=${keepAlive} disableAPI=${disableAPI} ` +
      `scenario=${scenario} apiKey=${apiKey ? "set" : "missing"} ` +
      `projectId=${projectId ? "set" : "missing"}`,
  );

  // A positive view time means the browser is launched headed.
  const showBrowser = viewMs > 0;
  const v3 = new V3({
    env,
    keepAlive,
    disableAPI,
    apiKey,
    projectId,
    browserbaseSessionCreateParams: undefined,
    localBrowserLaunchOptions:
      env !== "LOCAL"
        ? undefined
        : {
            executablePath: process.env.CHROME_PATH,
            args: process.env.CI ? ["--no-sandbox"] : undefined,
            headless: !showBrowser,
            viewport: { width: 1288, height: 711 },
          },
    verbose: debug ? 2 : 0,
    disablePino: true,
    logger: debug ? (line) => console.log(line) : undefined,
  });

  await v3.init();

  // Hand the connection details to the parent; wait for the write to finish.
  const info = {
    connectURL: v3.connectURL(),
    sessionId: v3.browserbaseSessionId ?? null,
  };
  const announcement = `__KEEPALIVE__${JSON.stringify(info)}\n`;
  await new Promise<void>((resolve, reject) => {
    process.stdout.write(announcement, (error) => {
      if (!error) {
        resolve();
        return;
      }
      reject(error);
    });
  });

  if (env === "LOCAL" && viewMs > 0) {
    await new Promise((wake) => setTimeout(wake, viewMs));
  }

  if (scenario === "close") {
    await v3.close().catch(() => {});
    process.exit(0);
  }

  // Nothing more to do here for the signal scenarios.
  if (scenario === "sigterm" || scenario === "sigint") {
    return;
  }

  if (scenario === "unhandled") {
    setTimeout(() => {
      void Promise.reject(new Error("keepAlive unhandled rejection"));
    }, 0);
    return;
  }

  throw new Error(`Unknown scenario: ${scenario}`);
}

// Any startup failure is printed and turned into exit code 1.
main().catch((failure) => {
  console.error(failure);
  process.exit(1);
});


================================================
FILE: packages/core/tests/integration/keep-alive.spec.ts
================================================
import { test } from "@playwright/test";
import { spawn } from "node:child_process";
import fs from "node:fs";
import Browserbase from "@browserbasehq/sdk";
import WebSocket from "ws";
import { v3DynamicTestConfig } from "./v3.dynamic.config.js";
import { getPackageRootDir } from "../../lib/v3/runtimePaths.js";

/** Where the browser under test runs. */
export type EnvKind = "LOCAL" | "BROWSERBASE";
/** How the child process ends (or is made to end) after starting the browser. */
export type ScenarioKind = "unhandled" | "close" | "sigterm" | "sigint";

/** One generated test case: an environment, a keepAlive value and a scenario. */
export type KeepAliveCase = {
  /** Human-readable test title, including the expected open/closed result. */
  title: string;
  env: EnvKind;
  /** Short environment label used in titles and result logs. */
  envLabel: string;
  keepAlive: boolean;
  disableAPI: boolean;
  kind: ScenarioKind;
  requiresBrowserbase: boolean;
};

/** Settings handed to `runScenario`; serialized and passed to the child process. */
type ScenarioConfig = {
  env: EnvKind;
  keepAlive: boolean;
  disableAPI: boolean;
  kind: ScenarioKind;
  debug: boolean;
  viewMs: number;
  apiKey?: string;
  projectId?: string;
};

/** Payload of the `__KEEPALIVE__` line printed by the child process. */
type ChildInfo = {
  connectURL: string;
  sessionId: string | null;
};

/** Output captured from the child process. */
type ChildLogs = {
  stdout: string[];
  stderr: string[];
};

/** Result of a single liveness probe. */
type CheckResult = {
  alive: boolean;
  /** Optional probe detail, e.g. "MATCH", "FETCH_ERROR" or a session status. */
  status?: string;
};

/** Expected versus observed browser state for one case. */
type Outcome = {
  expected: "open" | "closed";
  actual: "open" | "closed";
  /** Time spent observing the browser, in milliseconds. */
  durationMs: number;
  lastStatus?: string;
};

// Package root; used to locate the built child script and as the child's cwd.
const coreDir = getPackageRootDir();

/**
 * Locate the compiled keep-alive child script.
 *
 * @returns The command and arguments that run the script with the current
 *   Node binary, or `null` when the built file does not exist.
 */
const resolveChildRunner = (): { command: string; args: string[] } | null => {
  const distJsPath = `${coreDir}/dist/esm/tests/integration/keep-alive.child.js`;
  return fs.existsSync(distJsPath)
    ? { command: process.execPath, args: [distJsPath] }
    : null;
};

const childRunner = resolveChildRunner();

// Tunables read from the environment. Numeric values go through `Number(...)`,
// so a non-numeric override yields NaN rather than the default.

// Enables debugLog output when KEEP_ALIVE_DEBUG is exactly "1".
const DEBUG = process.env.KEEP_ALIVE_DEBUG === "1";
// NOTE(review): presumably forwarded to the child as `viewMs` — confirm in runKeepAliveCase.
const VIEW_MS = Number(process.env.KEEP_ALIVE_VIEW_MS ?? "0");
// How long to wait for a local browser to be observed closed.
const LOCAL_TIMEOUT_MS = Number(
  process.env.KEEP_ALIVE_LOCAL_TIMEOUT_MS ?? "8000",
);
// How long to wait for a Browserbase session to be observed closed.
const BB_TIMEOUT_MS = Number(process.env.KEEP_ALIVE_BB_TIMEOUT_MS ?? "30000");
// How long a browser must remain alive to count as "stayed open".
const STAY_OPEN_MS = Number(process.env.KEEP_ALIVE_STAY_OPEN_MS ?? "6000");
// NOTE(review): not referenced in the visible part of the file — confirm usage.
const ACTION_EXIT_TIMEOUT_MS = Number(
  process.env.KEEP_ALIVE_ACTION_EXIT_TIMEOUT_MS ?? "3000",
);
// How long to wait for the child's info line, per environment.
const LOCAL_INFO_TIMEOUT_MS = Number(
  process.env.KEEP_ALIVE_LOCAL_INFO_TIMEOUT_MS ?? "15000",
);
// The Browserbase default is larger when the CI environment variable is set.
const BB_INFO_TIMEOUT_MS = Number(
  process.env.KEEP_ALIVE_BB_INFO_TIMEOUT_MS ??
    (process.env.CI ? "45000" : "30000"),
);

/** Time allowed for the child to print its info line in the given environment. */
const getInfoTimeoutMs = (env: EnvKind): number => {
  if (env === "BROWSERBASE") {
    return BB_INFO_TIMEOUT_MS;
  }
  return LOCAL_INFO_TIMEOUT_MS;
};

/** Print `message` to the console, but only when DEBUG is enabled. */
function debugLog(message: string): void {
  if (!DEBUG) return;
  console.log(message);
}

/**
 * Parse the info line printed by the keep-alive child process.
 *
 * A valid line is the `__KEEPALIVE__` prefix followed by a JSON object with a
 * string `connectURL` and a `sessionId` that is a string or null (a missing
 * `sessionId` is treated as null).
 *
 * @param line - One trimmed line of child stdout.
 * @returns The parsed info, or `null` when the line has no prefix, is not
 *   valid JSON, or does not have the expected shape.
 */
function parseChildInfo(line: string): ChildInfo | null {
  const prefix = "__KEEPALIVE__";
  if (!line.startsWith(prefix)) return null;

  let payload: unknown;
  try {
    payload = JSON.parse(line.slice(prefix.length));
  } catch {
    return null;
  }

  // JSON.parse also accepts scalars, arrays and null; only a plain object
  // with the expected fields may be handed on as ChildInfo.
  if (typeof payload !== "object" || payload === null) return null;
  const { connectURL, sessionId } = payload as Record<string, unknown>;
  if (typeof connectURL !== "string") return null;
  if (sessionId != null && typeof sessionId !== "string") return null;

  return { connectURL, sessionId: sessionId ?? null };
}

/**
 * Spawn the keep-alive child process for `config` and wait for its info line.
 *
 * The config is passed to the child as a base64 JSON argument prefixed with
 * `cfg:`. Child stdout is split into lines: the first line that parses as
 * child info resolves the wait, every other non-empty line is collected.
 * Stderr is collected as well.
 *
 * @returns The parsed info, the still-running child handle, and the logs
 *   collected so far (the arrays keep filling while the child runs).
 * @throws Error when the built child script is missing, the child exits or
 *   fails to spawn before emitting info, or no info arrives within the
 *   environment's info timeout (the child is then killed with SIGKILL).
 */
async function runScenario(config: ScenarioConfig): Promise<{
  info: ChildInfo;
  child: ReturnType<typeof spawn>;
  logs: ChildLogs;
}> {
  const payload = {
    env: config.env,
    keepAlive: config.keepAlive,
    disableAPI: config.disableAPI,
    scenario: config.kind,
    apiKey: config.apiKey,
    projectId: config.projectId,
    debug: config.debug,
    viewMs: config.viewMs,
  };
  const encoded = `cfg:${Buffer.from(JSON.stringify(payload)).toString("base64")}`;

  if (!childRunner) {
    throw new Error(
      "keep-alive child script not found at dist/esm/tests/integration/keep-alive.child.js",
    );
  }

  const child = spawn(childRunner.command, [...childRunner.args, encoded], {
    cwd: coreDir,
    env: { ...process.env },
    stdio: ["ignore", "pipe", "pipe"],
  });

  const logs: ChildLogs = { stdout: [], stderr: [] };
  let pendingStdout = "";
  let stderrText = "";
  let infoReceived = false;
  const infoTimeoutMs = getInfoTimeoutMs(config.env);

  // Shared pieces of the failure messages below.
  const scenarioTag = `env=${config.env}, keepAlive=${config.keepAlive}, disableAPI=${config.disableAPI}, scenario=${config.kind}`;
  const describeChildOutput = (noStderrNote: string): string => {
    const stdoutDetails =
      logs.stdout.length > 0
        ? `\nChild stdout:\n${logs.stdout.join("\n")}`
        : "";
    const details = stderrText.trim();
    const suffix = details ? `\nChild stderr:\n${details}` : noStderrNote;
    return `${suffix}${stdoutDetails}`;
  };

  const infoPromise = new Promise<ChildInfo>((resolve, reject) => {
    const timeout = setTimeout(() => {
      child.kill("SIGKILL");
      const output = describeChildOutput(
        "\nChild did not emit keepAlive info.",
      );
      reject(
        new Error(
          `Child timed out waiting for info after ${infoTimeoutMs}ms (${scenarioTag}).${output}`,
        ),
      );
    }, infoTimeoutMs);

    child.stdout.on("data", (chunk) => {
      pendingStdout += chunk.toString();
      // Consume every complete line; a trailing partial line stays buffered.
      for (
        let newlineAt = pendingStdout.indexOf("\n");
        newlineAt !== -1;
        newlineAt = pendingStdout.indexOf("\n")
      ) {
        const line = pendingStdout.slice(0, newlineAt).trim();
        pendingStdout = pendingStdout.slice(newlineAt + 1);
        const parsed = parseChildInfo(line);
        if (parsed && !infoReceived) {
          infoReceived = true;
          clearTimeout(timeout);
          resolve(parsed);
        } else if (line.length > 0) {
          logs.stdout.push(line);
          debugLog(`[keep-alive-child] ${line}`);
        }
      }
    });

    child.on("exit", (code, signal) => {
      if (infoReceived) return;
      clearTimeout(timeout);
      const output = describeChildOutput(
        "\nChild exited without emitting keepAlive info.",
      );
      reject(
        new Error(
          `Child exited (code=${code ?? "null"}, signal=${signal ?? "null"}) before emitting keepAlive info (${scenarioTag}).${output}`,
        ),
      );
    });

    child.on("error", (error) => {
      if (infoReceived) return;
      clearTimeout(timeout);
      reject(error);
    });
  });

  child.stderr.on("data", (chunk) => {
    const text = chunk.toString();
    stderrText += text;
    const trimmed = text.trim();
    if (trimmed.length === 0) return;
    logs.stderr.push(trimmed);
    debugLog(`[keep-alive-child] ${trimmed}`);
  });

  const info = await infoPromise;
  return { info, child, logs };
}

/**
 * Force-stop `child` with SIGKILL and wait (at most 2s) for it to exit.
 *
 * Returns immediately when the child has already terminated. A process ended
 * by a signal keeps `exitCode === null` and reports the signal through
 * `signalCode`, so both fields are checked; otherwise the wait below would
 * sit out its full timeout for an "exit" event that has already fired.
 *
 * @param child - Child process handle to stop.
 */
async function stopChild(child: ReturnType<typeof spawn>): Promise<void> {
  const alreadyGone = child.exitCode !== null || child.signalCode !== null;
  if (alreadyGone) return;
  try {
    child.kill("SIGKILL");
  } catch {
    return;
  }
  await new Promise<void>((resolve) => {
    const timer = setTimeout(() => resolve(), 2000);
    child.once("exit", () => {
      clearTimeout(timer);
      resolve();
    });
  });
}

/**
 * Wait for `child` to exit, giving up silently after `timeoutMs`.
 *
 * Returns immediately when the child has already terminated, whether with an
 * exit code or through a signal (in which case `exitCode` stays null and
 * `signalCode` is set). This function never rejects and never kills the child.
 *
 * @param child - Child process handle to watch.
 * @param timeoutMs - Maximum time to wait for the "exit" event.
 */
async function waitForChildExit(
  child: ReturnType<typeof spawn>,
  timeoutMs: number,
): Promise<void> {
  const alreadyGone = child.exitCode !== null || child.signalCode !== null;
  if (alreadyGone) return;
  await new Promise<void>((resolve) => {
    const timer = setTimeout(() => resolve(), timeoutMs);
    child.once("exit", () => {
      clearTimeout(timer);
      resolve();
    });
  });
}

/**
 * Probe whether the local browser behind `connectURL` is still running.
 *
 * The port is taken from `connectURL` and `/json/version` is fetched from
 * 127.0.0.1 on that port (aborted after 1.5s). The browser counts as alive
 * only when the reported `webSocketDebuggerUrl` equals `connectURL`.
 *
 * @returns `alive` plus a status code: INVALID_URL, MISSING_PORT,
 *   HTTP_<status>, MISSING_WS, WS_MISMATCH, FETCH_ERROR or MATCH.
 */
async function checkLocalAlive(connectURL: string): Promise<CheckResult> {
  const dead = (status: string): CheckResult => ({ alive: false, status });

  let port: string;
  try {
    port = new URL(connectURL).port;
  } catch {
    return dead("INVALID_URL");
  }
  if (!port) {
    return dead("MISSING_PORT");
  }

  const aborter = new AbortController();
  const watchdog = setTimeout(() => aborter.abort(), 1500);
  try {
    const resp = await fetch(`http://127.0.0.1:${port}/json/version`, {
      signal: aborter.signal,
    });
    if (!resp.ok) {
      return dead(`HTTP_${resp.status}`);
    }

    const body = (await resp.json()) as { webSocketDebuggerUrl?: string };
    const advertised = body?.webSocketDebuggerUrl;
    if (!advertised) {
      return dead("MISSING_WS");
    }
    // A different endpoint on the same port is not the browser we launched.
    return advertised === connectURL
      ? { alive: true, status: "MATCH" }
      : dead("WS_MISMATCH");
  } catch {
    return dead("FETCH_ERROR");
  } finally {
    clearTimeout(watchdog);
  }
}

/**
 * Ask the local browser at `connectURL` to shut down.
 *
 * Opens a WebSocket to the endpoint and sends a `Browser.close` command once
 * connected. Resolves when the socket closes or errors, or after 2s, at which
 * point the socket is terminated. Never rejects.
 */
async function closeLocalBrowser(connectURL: string): Promise<void> {
  await new Promise<void>((resolve) => {
    const socket = new WebSocket(connectURL);

    const giveUp = setTimeout(() => {
      socket.terminate();
      resolve();
    }, 2000);
    const finish = (): void => {
      clearTimeout(giveUp);
      resolve();
    };

    socket.on("open", () => {
      const command = { id: 1, method: "Browser.close" };
      socket.send(JSON.stringify(command));
    });
    socket.on("error", () => finish());
    socket.on("close", () => finish());
  });
}

/**
 * Probe whether a Browserbase session is still running.
 *
 * @param sessionId - Session to look up.
 * @param apiKey - Browserbase API key; without it no lookup is attempted.
 * @returns `alive` is true only when the retrieved status is "RUNNING".
 *   `status` is the retrieved status, or NO_API_KEY / RETRIEVE_FAILED.
 */
async function checkBrowserbaseAlive(
  sessionId: string,
  apiKey?: string,
): Promise<CheckResult> {
  if (!apiKey) {
    return { alive: false, status: "NO_API_KEY" };
  }

  const client = new Browserbase({ apiKey });
  try {
    const snapshot = (await client.sessions.retrieve(sessionId)) as {
      status?: string;
    };
    const status = snapshot?.status;
    // debugLog is a no-op unless DEBUG is enabled.
    debugLog(
      `[keep-alive] session ${sessionId} status=${status ?? "<missing>"}`,
    );
    return { alive: status === "RUNNING", status };
  } catch (failure) {
    debugLog(
      `[keep-alive] session ${sessionId} retrieve failed: ${String(failure)}`,
    );
    return { alive: false, status: "RETRIEVE_FAILED" };
  }
}

/**
 * Best-effort release of a Browserbase session.
 *
 * Does nothing unless both `apiKey` and `projectId` are provided. Otherwise
 * it updates the session with status "REQUEST_RELEASE"; a failure of that
 * call is ignored.
 */
async function endBrowserbaseSession(
  sessionId: string,
  apiKey?: string,
  projectId?: string,
): Promise<void> {
  const haveCredentials = Boolean(apiKey && projectId);
  if (!haveCredentials) {
    return;
  }

  const client = new Browserbase({ apiKey });
  const releaseRequest = { status: "REQUEST_RELEASE", projectId };
  try {
    await client.sessions.update(sessionId, releaseRequest);
  } catch {
    // Cleanup only; a failed release must not fail the test.
  }
}

/**
 * Require that `check` keeps reporting "alive" for `durationMs`.
 *
 * The probe runs repeatedly with `intervalMs` pauses until the duration has
 * elapsed. The most recent defined status is remembered across probes.
 *
 * @returns The elapsed time and the last status seen.
 * @throws Error as soon as a probe reports not alive.
 */
async function assertStaysOpen(
  check: () => Promise<CheckResult>,
  durationMs: number,
  intervalMs = 500,
): Promise<{ durationMs: number; lastStatus?: string }> {
  const startedAt = Date.now();
  const mustLastUntil = startedAt + durationMs;
  let lastStatus: string | undefined;

  while (Date.now() < mustLastUntil) {
    const { alive, status } = await check();
    lastStatus = status ?? lastStatus;

    if (!alive) {
      const elapsed = Date.now() - startedAt;
      const statusNote = lastStatus ? ` (last status ${lastStatus})` : "";
      throw new Error(
        `Browser closed after ${elapsed}ms (expected ${durationMs}ms)${statusNote}.`,
      );
    }

    await new Promise((wake) => setTimeout(wake, intervalMs));
  }

  return { durationMs: Date.now() - startedAt, lastStatus };
}

/**
 * Wait until `check` reports the browser as no longer alive.
 *
 * The probe runs repeatedly with `intervalMs` pauses for up to `timeoutMs`.
 * The most recent defined status is remembered across probes.
 *
 * @returns The elapsed time and the last status seen once a probe reports
 *   not alive.
 * @throws Error when the browser is still alive after `timeoutMs`.
 */
async function waitForClosed(
  check: () => Promise<CheckResult>,
  timeoutMs: number,
  intervalMs = 500,
): Promise<{ durationMs: number; lastStatus?: string }> {
  const startedAt = Date.now();
  const elapsed = (): number => Date.now() - startedAt;
  let lastStatus: string | undefined;

  while (elapsed() < timeoutMs) {
    const probe = await check();
    lastStatus = probe.status ?? lastStatus;
    if (probe.alive) {
      await new Promise((wake) => setTimeout(wake, intervalMs));
      continue;
    }
    return { durationMs: elapsed(), lastStatus };
  }

  const statusNote = lastStatus ? ` (last status ${lastStatus})` : "";
  throw new Error(`Browser still alive after ${timeoutMs}ms${statusNote}.`);
}

/**
 * Verify that the browser started by the child ends up in the expected state.
 *
 * When it should stay open, it must remain alive for STAY_OPEN_MS and is then
 * cleaned up (local browser closed, or Browserbase session released). When it
 * should close, it must be observed closed within the environment's timeout.
 *
 * @param env - Environment the browser runs in.
 * @param info - Connection details reported by the child.
 * @param shouldStayOpen - Whether the browser is expected to survive.
 * @param apiKey - Browserbase API key (Browserbase only).
 * @param projectId - Browserbase project id (Browserbase only).
 * @returns The observed outcome.
 * @throws Error when the observed state contradicts the expectation, or when
 *   a Browserbase run reported no session id.
 */
async function assertBrowserState(
  env: EnvKind,
  info: ChildInfo,
  shouldStayOpen: boolean,
  apiKey?: string,
  projectId?: string,
): Promise<Outcome> {
  const expected: Outcome["expected"] = shouldStayOpen ? "open" : "closed";
  const toOutcome = (
    actual: Outcome["actual"],
    observed: { durationMs: number; lastStatus?: string },
  ): Outcome => ({
    expected,
    actual,
    durationMs: observed.durationMs,
    lastStatus: observed.lastStatus,
  });

  if (env === "LOCAL") {
    const probeLocal = (): Promise<CheckResult> =>
      checkLocalAlive(info.connectURL);

    if (!shouldStayOpen) {
      return toOutcome(
        "closed",
        await waitForClosed(probeLocal, LOCAL_TIMEOUT_MS),
      );
    }

    const outcome = toOutcome(
      "open",
      await assertStaysOpen(probeLocal, STAY_OPEN_MS),
    );
    // The browser survived as expected; shut it down ourselves.
    await closeLocalBrowser(info.connectURL);
    return outcome;
  }

  const sessionId = info.sessionId;
  if (!sessionId) {
    throw new Error("Browserbase sessionId missing");
  }
  const probeSession = (): Promise<CheckResult> =>
    checkBrowserbaseAlive(sessionId, apiKey);

  if (!shouldStayOpen) {
    return toOutcome(
      "closed",
      await waitForClosed(probeSession, BB_TIMEOUT_MS, 1000),
    );
  }

  const outcome = toOutcome(
    "open",
    await assertStaysOpen(probeSession, STAY_OPEN_MS, 1000),
  );
  // The session survived as expected; release it ourselves.
  await endBrowserbaseSession(sessionId, apiKey, projectId);
  return outcome;
}

/**
 * Print the captured child output to the console: stdout first, then stderr.
 * Each non-empty stream gets a heading followed by its lines, indented by two
 * spaces; an empty stream prints nothing.
 */
function dumpLogs(logs: ChildLogs): void {
  const sections: Array<[heading: string, lines: string[]]> = [
    ["[keep-alive] child stdout:", logs.stdout],
    ["[keep-alive] child stderr:", logs.stderr],
  ];

  for (const [heading, lines] of sections) {
    if (lines.length === 0) continue;
    console.log(heading);
    lines.forEach((line) => {
      console.log(`  ${line}`);
    });
  }
}

/**
 * Print a one-line PASS/FAIL summary for a keep-alive case.
 *
 * An `error` takes precedence and produces a FAIL line with its message; a
 * missing `outcome` is also a FAIL. Otherwise a PASS line states whether the
 * browser stayed open or closed, for how long, and the last status if any.
 */
function logCaseResult(
  label: string,
  envLabel: string,
  keepAlive: boolean,
  outcome?: Outcome,
  error?: Error,
): void {
  const prefix = `[keep-alive] ${envLabel} keepAlive=${keepAlive} ${label}`;
  const emit = (verdict: string): void => {
    console.log(`${prefix} ${verdict}`);
  };

  if (error) {
    emit(`FAIL: ${error.message}`);
    return;
  }
  if (!outcome) {
    emit("FAIL: missing outcome");
    return;
  }

  const statusNote =
    outcome.lastStatus === undefined
      ? ""
      : ` (last status ${outcome.lastStatus})`;
  const observed =
    outcome.actual === "open"
      ? `stayed open for ${outcome.durationMs}ms`
      : `closed after ${outcome.durationMs}ms`;
  emit(`PASS: ${observed}${statusNote}`);
}

/**
 * Derive the keep-alive test environment from the dynamic V3 test config.
 *
 * The API key and project id are taken from the config only when the test
 * environment is BROWSERBASE; otherwise both are undefined.
 *
 * @returns The environment, the credentials (if any), and whether both
 *   credentials are present.
 */
export function getKeepAliveEnvConfig(): {
  testEnv: EnvKind;
  apiKey?: string;
  projectId?: string;
  hasBrowserbaseCreds: boolean;
} {
  const testEnv = v3DynamicTestConfig.env;
  const onBrowserbase = testEnv === "BROWSERBASE";

  const apiKey = onBrowserbase
    ? (v3DynamicTestConfig.apiKey as string | undefined)
    : undefined;
  const projectId = onBrowserbase
    ? (v3DynamicTestConfig.projectId as string | undefined)
    : undefined;

  return {
    testEnv,
    apiKey,
    projectId,
    hasBrowserbaseCreds: Boolean(apiKey && projectId),
  };
}

/**
 * Builds the full matrix of keepAlive cases for the given environment.
 *
 * The matrix is keepAlive (true, then false) x environment variants x the four
 * scenarios, in that nesting order. "BROWSERBASE" yields two variants (direct
 * websocket with the API disabled, and via the API); anything else yields a
 * single local variant.
 *
 * @param testEnv - Environment the suite is running against.
 * @returns One case per combination, with a descriptive title.
 */
export function buildKeepAliveCases(testEnv: EnvKind): KeepAliveCase[] {
  type Scenario = { kind: ScenarioKind; label: string };
  type Variant = {
    env: EnvKind;
    label: string;
    disableAPI: boolean;
    requiresBrowserbase: boolean;
  };

  const scenarios: Scenario[] = [
    { kind: "unhandled", label: "unhandled rejection" },
    { kind: "close", label: "stagehand.close()" },
    { kind: "sigterm", label: "SIGTERM" },
    { kind: "sigint", label: "SIGINT" },
  ];

  const browserbaseVariants: Variant[] = [
    {
      env: "BROWSERBASE",
      label: "bb direct ws",
      disableAPI: true,
      requiresBrowserbase: true,
    },
    {
      env: "BROWSERBASE",
      label: "bb via api",
      disableAPI: false,
      requiresBrowserbase: true,
    },
  ];
  const localVariants: Variant[] = [
    {
      env: "LOCAL",
      label: "local",
      disableAPI: false,
      requiresBrowserbase: false,
    },
  ];
  const variants =
    testEnv === "BROWSERBASE" ? browserbaseVariants : localVariants;

  return [true, false].flatMap((keepAlive) => {
    const expectation = keepAlive ? "expect open" : "expect closed";
    return variants.flatMap((variant) =>
      scenarios.map(
        (scenario): KeepAliveCase => ({
          title: `${variant.label} keepAlive=${keepAlive} ${scenario.label} (${expectation})`,
          env: variant.env,
          envLabel: variant.label,
          keepAlive,
          disableAPI: variant.disableAPI,
          kind: scenario.kind,
          requiresBrowserbase: variant.requiresBrowserbase,
        }),
      ),
    );
  });
}

/**
 * Executes one keepAlive test case and verifies the resulting browser state.
 *
 * Flow: start the scenario via `runScenario`, deliver SIGTERM/SIGINT to the
 * child for the signal scenarios, wait for the child to exit, then check the
 * browser state with `assertBrowserState`. The result is always logged, and the
 * child plus the local browser / Browserbase session are cleaned up afterwards.
 *
 * @param testCase - The case to run (environment, keepAlive flag, scenario kind).
 * @param envConfig - Browserbase credentials forwarded to the scenario, the
 *   state assertion, and session cleanup.
 * @throws Rethrows any error raised while starting the scenario, waiting for
 *   the child to exit, or asserting the browser state. Errors raised during
 *   cleanup also propagate.
 */
export async function runKeepAliveCase(
  testCase: KeepAliveCase,
  envConfig: {
    apiKey?: string;
    projectId?: string;
  },
): Promise<void> {
  let info: ChildInfo | undefined;
  let child: ReturnType<typeof spawn> | undefined;
  let logs: ChildLogs | undefined;
  try {
    ({ info, child, logs } = await runScenario({
      env: testCase.env,
      keepAlive: testCase.keepAlive,
      disableAPI: testCase.disableAPI,
      kind: testCase.kind,
      debug: DEBUG,
      viewMs: VIEW_MS,
      apiKey: envConfig.apiKey,
      projectId: envConfig.projectId,
    }));
  } catch (error) {
    // Nothing was started, so there is nothing to clean up: log and bail out.
    logCaseResult(
      testCase.title,
      testCase.envLabel,
      testCase.keepAlive,
      undefined,
      error as Error,
    );
    throw error;
  }

  // Signal scenarios are triggered from here; the other kinds are not signalled.
  if (testCase.kind === "sigterm") {
    child.kill("SIGTERM");
  } else if (testCase.kind === "sigint") {
    child.kill("SIGINT");
  }

  let outcome: Outcome | undefined;
  let failure: Error | undefined;
  try {
    if (
      testCase.kind === "close" ||
      testCase.kind === "unhandled" ||
      testCase.kind === "sigterm" ||
      testCase.kind === "sigint"
    ) {
      await waitForChildExit(child, ACTION_EXIT_TIMEOUT_MS);
    }
    outcome = await assertBrowserState(
      testCase.env,
      info,
      testCase.keepAlive,
      envConfig.apiKey,
      envConfig.projectId,
    );
  } catch (error) {
    failure = error as Error;
    // Surface the child's output only when the case failed.
    if (logs) {
      dumpLogs(logs);
    }
    throw error;
  } finally {
    logCaseResult(
      testCase.title,
      testCase.envLabel,
      testCase.keepAlive,
      outcome,
      failure,
    );
    // Nested try/finally: the browser/session teardown must still run when
    // stopping the child rejects, otherwise a failed stop would leak a local
    // browser or a Browserbase session.
    try {
      await stopChild(child);
    } finally {
      if (testCase.env === "LOCAL" && info.connectURL) {
        await closeLocalBrowser(info.connectURL);
      }
      if (testCase.env === "BROWSERBASE" && info.sessionId) {
        await endBrowserbaseSession(
          info.sessionId,
          envConfig.apiKey,
          envConfig.projectId,
        );
      }
    }
  }
}

// Registers one test per generated keepAlive case. Cases that require
// Browserbase are skipped when the credentials are not configured.
test.describe.parallel("keepAlive behavior", () => {
  const envSettings = getKeepAliveEnvConfig();
  const { apiKey, projectId } = envSettings;
  const credentialsMissing = !envSettings.hasBrowserbaseCreds;

  buildKeepAliveCases(envSettings.testEnv).forEach((testCase) => {
    test(testCase.title, async () => {
      if (testCase.requiresBrowserbase) {
        test.skip(credentialsMissing, "Browserbase credentials required");
      }

      await runKeepAliveCase(testCase, { apiKey, projectId });
    });
  });
});


================================================
FILE: packages/core/tests/integration/keyboard.spec.ts
================================================
import { test, expect } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import { v3DynamicTestConfig } from "./v3.dynamic.config.js";
import { closeV3 } from "./testUtils.js";

/**
 * Wraps an HTML snippet in a UTF-8 `data:` URL.
 *
 * @param html - Markup to embed; it is percent-encoded with `encodeURIComponent`.
 * @returns A `data:text/html;charset=utf-8,` URL carrying the encoded markup.
 */
function dataUrl(html: string): string {
  const encodedMarkup = encodeURIComponent(html);
  return `data:text/html;charset=utf-8,${encodedMarkup}`;
}

// Exercises page.type / page.keyPress against small inline HTML fixtures.
// Every test gets a fresh V3 instance, which is closed again afterwards.
test.describe("V3 keyboard shortcuts and typing", () => {
  let v3: V3;

  // Navigates the active page to `html` (through a data URL) and returns it.
  const openFixture = async (html: string) => {
    const activePage = await v3.context.awaitActivePage();
    await activePage.goto(dataUrl(html), {
      waitUntil: "domcontentloaded",
      timeoutMs: 15000,
    });
    return activePage;
  };
  type FixturePage = Awaited<ReturnType<typeof openFixture>>;

  // Reads the current `value` of the form control matching `selector`.
  const fieldValue = (page: FixturePage, selector: string) =>
    page.evaluate(
      (sel) =>
        (document.querySelector(sel) as HTMLInputElement | HTMLTextAreaElement)!
          .value,
      selector,
    );

  // Id of the element that currently has focus ("" when there is none).
  const focusedId = (page: FixturePage) =>
    page.evaluate(() => (document.activeElement as HTMLElement)?.id || "");

  // Value of the #submitted marker that the form fixtures set on submit.
  const submittedMarker = (page: FixturePage) =>
    page.evaluate(
      () =>
        (document.getElementById("submitted") as HTMLInputElement)?.value || "",
    );

  test.beforeEach(async () => {
    v3 = new V3(v3DynamicTestConfig);
    await v3.init();
  });

  test.afterEach(async () => {
    await closeV3(v3);
  });

  test("typing, select-all + delete clears input (Cmd maps cross-OS)", async () => {
    const page = await openFixture(`<!doctype html>
      <input id="i1" autofocus />`);

    await page.locator("#i1").click();
    await page.type("Hello World");

    await page.keyPress("Cmd+A");
    await page.keyPress("Delete");

    expect(await fieldValue(page, "#i1")).toBe("");
  });

  test("accelerator does not inject printable text (Cmd+B does not type 'b')", async () => {
    const page = await openFixture(`<!doctype html>
      <input id="i" />`);

    await page.locator("#i").click();
    await page.type("xyz");

    await page.keyPress("Cmd+B");

    expect(await fieldValue(page, "#i")).toBe("xyz");
  });

  test("Tab and Shift+Tab move focus", async () => {
    const page = await openFixture(`<!doctype html>
      <input id="a" />
      <input id="b" />`);

    await page.locator("#a").click();
    await page.keyPress("Tab");
    expect(await focusedId(page)).toBe("b");

    await page.keyPress("Shift+Tab");
    expect(await focusedId(page)).toBe("a");
  });

  test("cut clears the field (Cmd+X)", async () => {
    const page = await openFixture(`<!doctype html>
      <input id="t" />`);

    await page.locator("#t").click();
    await page.type("cut-me");
    await page.keyPress("Cmd+A");
    await page.keyPress("Cmd+X");

    expect(await fieldValue(page, "#t")).toBe("");
  });

  test("single printable via keyPress types characters (a, Shift+A, space)", async () => {
    const page = await openFixture(`<!doctype html>
      <input id="t" autofocus />`);

    await page.locator("#t").click();
    for (const key of ["a", "Shift+A", " "]) {
      await page.keyPress(key);
    }

    expect(await fieldValue(page, "#t")).toBe("aA ");
  });

  test("Backspace removes last char", async () => {
    const page = await openFixture(`<!doctype html>
      <input id="t" />`);

    await page.locator("#t").click();
    await page.type("ab");
    await page.keyPress("Backspace");

    expect(await fieldValue(page, "#t")).toBe("a");
  });

  test("Delete removes next char at caret", async () => {
    const page = await openFixture(`<!doctype html>
      <input id="t" />`);

    await page.locator("#t").click();
    await page.type("abc");
    // Put the caret between "a" and "bc" so Delete removes the "b".
    await page.evaluate(() => {
      const el = document.getElementById("t") as HTMLInputElement;
      el.focus();
      el.setSelectionRange(1, 1);
    });
    await page.keyPress("Delete");

    expect(await fieldValue(page, "#t")).toBe("ac");
  });

  test("ArrowLeft moves caret and typing inserts in middle", async () => {
    const page = await openFixture(`<!doctype html>
      <input id="t" />`);

    await page.locator("#t").click();
    await page.type("ac");
    await page.keyPress("ArrowLeft");
    await page.keyPress("b");

    expect(await fieldValue(page, "#t")).toBe("abc");
  });

  test("Enter inserts newline in textarea", async () => {
    const page = await openFixture(`<!doctype html>
      <textarea id="ta"></textarea>`);

    await page.locator("#ta").click();
    for (const key of ["a", "Enter", "b"]) {
      await page.keyPress(key);
    }

    expect(await fieldValue(page, "#ta")).toBe("a\nb");
  });

  test("Insert key (no-op for value)", async () => {
    const page = await openFixture(`<!doctype html>
      <input id="t" />`);

    await page.locator("#t").click();
    await page.type("abc");
    await page.keyPress("Insert");

    expect(await fieldValue(page, "#t")).toBe("abc");
  });

  test("Enter submits form from text input", async () => {
    const page = await openFixture(`<!doctype html>
      <form id="f">
        <input id="name" />
        <button id="submit">Go</button>
        <input id="submitted" />
      </form>
      <script>
        document.getElementById('f').addEventListener('submit', (e) => {
          e.preventDefault();
          document.getElementById('submitted').value = 'yes';
        });
      </script>`);

    await page.locator("#name").click();
    await page.type("foo");
    await page.keyPress("Enter");

    expect(await submittedMarker(page)).toBe("yes");
  });

  test("Enter in textarea does not submit form (inserts newline)", async () => {
    const page = await openFixture(`<!doctype html>
      <form id="f">
        <textarea id="ta"></textarea>
        <button id="submit">Go</button>
        <input id="submitted" />
      </form>
      <script>
        document.getElementById('f').addEventListener('submit', (e) => {
          e.preventDefault();
          document.getElementById('submitted').value = 'yes';
        });
      </script>`);

    await page.locator("#ta").click();
    for (const key of ["a", "Enter", "b"]) {
      await page.keyPress(key);
    }

    const submitted = await submittedMarker(page);
    const typed = await fieldValue(page, "#ta");
    expect(submitted).toBe("");
    expect(typed).toBe("a\nb");
  });

  test('pressing "+" key types plus sign', async () => {
    const page = await openFixture(`<!doctype html>
      <input id="t" />`);

    await page.locator("#t").click();
    await page.keyPress("+");

    expect(await fieldValue(page, "#t")).toBe("+");
  });

  test("modifier state clears on keyPress error", async () => {
    const page = await openFixture(`<!doctype html>
      <input id="t" />`);

    await page.locator("#t").click();
    // An invalid key name may throw; either way the press must not leave a
    // modifier stuck down.
    try {
      await page.keyPress("Cmd+InvalidKey123");
    } catch {
      // Expected to fail
    }

    // Plain typing only yields "ok" if the modifiers were released again.
    await page.type("ok");

    expect(await fieldValue(page, "#t")).toBe("ok");
  });
});


================================================
FILE: packages/core/tests/integration/locator-backend-node-id.spec.ts
================================================
import { test, expect } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import { v3TestConfig } from "./v3.config.js";

// Checks that Locator.backendNodeId() yields positive, stable and
// per-element-unique numeric ids across a range of fixtures and selectors.
test.describe("Locator.backendNodeId() - CDP DOM node ID", () => {
  let v3: V3;

  // Loads `html` into the first page through an encoded data URL and returns the page.
  const openHtml = async (html: string) => {
    const firstPage = v3.context.pages()[0];
    await firstPage.goto("data:text/html," + encodeURIComponent(html));
    return firstPage;
  };

  // Shared assertion: the id is a number greater than zero.
  const expectNumericId = (id: unknown) => {
    expect(typeof id).toBe("number");
    expect(id).toBeGreaterThan(0);
  };

  test.beforeEach(async () => {
    v3 = new V3(v3TestConfig);
    await v3.init();
  });

  test.afterEach(async () => {
    // Best-effort teardown: a failing close must not fail the test.
    await v3?.close?.().catch(() => {});
  });

  test("returns a valid backend node ID for an element", async () => {
    const page = await openHtml(
      `<!doctype html><html><body>
            <button id="btn">Click me</button>
          </body></html>`,
    );

    const nodeId = await page.locator("button#btn").backendNodeId();

    expectNumericId(nodeId);
  });

  test("returns different node IDs for different elements", async () => {
    const page = await openHtml(
      `<!doctype html><html><body>
            <div id="div1">First</div>
            <div id="div2">Second</div>
            <p id="p1">Third</p>
          </body></html>`,
    );

    const firstDivId = await page.locator("div#div1").backendNodeId();
    const secondDivId = await page.locator("div#div2").backendNodeId();
    const paragraphId = await page.locator("p#p1").backendNodeId();

    // Pairwise distinct.
    expect(firstDivId).not.toBe(secondDivId);
    expect(secondDivId).not.toBe(paragraphId);
    expect(firstDivId).not.toBe(paragraphId);
  });

  test("returns consistent node ID for the same element", async () => {
    const page = await openHtml(
      `<!doctype html><html><body>
            <input type="text" id="input" />
          </body></html>`,
    );

    const inputLocator = page.locator("input#input");

    // Resolve the same locator twice; both lookups must agree.
    const firstLookup = await inputLocator.backendNodeId();
    const secondLookup = await inputLocator.backendNodeId();

    expect(firstLookup).toBe(secondLookup);
  });

  test("returns node ID for nested elements", async () => {
    const page = await openHtml(
      `<!doctype html><html><body>
            <div id="outer">
              <div id="middle">
                <span id="inner">Deep</span>
              </div>
            </div>
          </body></html>`,
    );

    const outerNodeId = await page.locator("div#outer").backendNodeId();
    const middleNodeId = await page.locator("div#middle").backendNodeId();
    const innerNodeId = await page.locator("span#inner").backendNodeId();

    // Each level resolves to its own positive id.
    expect(outerNodeId).toBeGreaterThan(0);
    expect(middleNodeId).toBeGreaterThan(0);
    expect(innerNodeId).toBeGreaterThan(0);
    expect(new Set([outerNodeId, middleNodeId, innerNodeId]).size).toBe(3);
  });

  test("returns node ID for elements with various attributes", async () => {
    const page = await openHtml(
      `<!doctype html><html><body>
            <button class="btn primary" data-test="submit" aria-label="Submit form">Save</button>
          </body></html>`,
    );

    const nodeId = await page.locator("button").backendNodeId();

    expectNumericId(nodeId);
  });

  test("returns node ID for form elements", async () => {
    const page = await openHtml(
      `<!doctype html><html><body>
            <form>
              <input type="email" id="email" placeholder="Email" />
              <textarea id="message"></textarea>
              <select id="country">
                <option value="us">USA</option>
                <option value="ca">Canada</option>
              </select>
              <button type="submit">Submit</button>
            </form>
          </body></html>`,
    );

    const emailNodeId = await page.locator("input#email").backendNodeId();
    const textareaNodeId = await page
      .locator("textarea#message")
      .backendNodeId();
    const selectNodeId = await page.locator("select#country").backendNodeId();
    const submitNodeId = await page
      .locator("button[type='submit']")
      .backendNodeId();

    // Every control resolves to a positive id...
    expect(emailNodeId).toBeGreaterThan(0);
    expect(textareaNodeId).toBeGreaterThan(0);
    expect(selectNodeId).toBeGreaterThan(0);
    expect(submitNodeId).toBeGreaterThan(0);

    // ...and no two controls share one.
    const distinctIds = new Set([
      emailNodeId,
      textareaNodeId,
      selectNodeId,
      submitNodeId,
    ]);
    expect(distinctIds.size).toBe(4);
  });

  test("returns node ID for dynamically created elements", async () => {
    const page = await openHtml(
      `<!doctype html><html><body>
            <div id="container"></div>
            <script>
              const container = document.getElementById('container');
              const newBtn = document.createElement('button');
              newBtn.id = 'dynamic-btn';
              newBtn.textContent = 'Dynamically created';
              container.appendChild(newBtn);
            </script>
          </body></html>`,
    );

    const nodeId = await page.locator("button#dynamic-btn").backendNodeId();

    expectNumericId(nodeId);
  });

  test("returns node ID for elements with text selectors", async () => {
    const page = await openHtml(
      `<!doctype html><html><body>
            <button>Submit Form</button>
          </body></html>`,
    );

    const nodeId = await page.locator("text=Submit Form").backendNodeId();

    expectNumericId(nodeId);
  });
});


================================================
FILE: packages/core/tests/integration/locator-content-methods.spec.ts
================================================
import { expect, test } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import { v3TestConfig } from "./v3.config.js";

// Covers the read-only content accessors on main-frame locators:
// textContent(), innerText(), innerHtml() and inputValue().
test.describe("Locator content methods (textContent, innerHtml, innerText, inputValue)", () => {
  let v3: V3;

  // Loads `html` into the first page and returns a main-frame locator factory.
  const openHtml = async (html: string) => {
    const firstPage = v3.context.pages()[0];
    await firstPage.goto("data:text/html," + encodeURIComponent(html));
    // The main frame is looked up again on every call.
    return (selector: string) => firstPage.mainFrame().locator(selector);
  };

  test.beforeEach(async () => {
    v3 = new V3(v3TestConfig);
    await v3.init();
  });

  test.afterEach(async () => {
    // Best-effort teardown: close errors are deliberately discarded.
    await v3?.close?.().catch((e) => {
      void e;
    });
  });

  test("Locator.textContent() returns raw text including hidden content", async () => {
    const find = await openHtml(
      `<!doctype html><html><body>
            <div id="content">
              Hello
              <span style="display:none">Hidden</span>
              World
            </div>
          </body></html>`,
    );

    const content = await find("#content").textContent();
    // The display:none span is expected to be part of the result.
    for (const fragment of ["Hello", "Hidden", "World"]) {
      expect(content).toContain(fragment);
    }
  });

  test("Locator.innerText() returns visible text only", async () => {
    const find = await openHtml(
      `<!doctype html><html><body>
            <div id="content">
              Visible
              <span style="display:none">Hidden</span>
              Text
            </div>
          </body></html>`,
    );

    const text = await find("#content").innerText();
    // The display:none span must not show up here.
    expect(text).toContain("Visible");
    expect(text).toContain("Text");
    expect(text).not.toContain("Hidden");
  });

  test("Locator.innerHtml() returns HTML markup", async () => {
    const find = await openHtml(
      `<!doctype html><html><body>
            <div id="container">
              <p class="para">Hello</p>
              <strong>World</strong>
            </div>
          </body></html>`,
    );

    const html = await find("#container").innerHtml();
    expect(html).toContain('<p class="para">Hello</p>');
    expect(html).toContain("<strong>World</strong>");
  });

  test("Locator.inputValue() reads value from input elements", async () => {
    const find = await openHtml(
      `<!doctype html><html><body>
            <input id="text-input" type="text" value="hello world" />
            <textarea id="textarea">multi
line
text</textarea>
            <input id="number-input" type="number" value="42" />
          </body></html>`,
    );

    const textValue = await find("#text-input").inputValue();
    expect(textValue).toBe("hello world");

    const taValue = await find("#textarea").inputValue();
    expect(taValue).toBe("multi\nline\ntext");

    const numValue = await find("#number-input").inputValue();
    expect(numValue).toBe("42");
  });

  test("Locator.textContent() on empty elements returns empty string", async () => {
    const find = await openHtml(
      `<!doctype html><html><body>
            <div id="empty"></div>
            <span id="whitespace">   </span>
          </body></html>`,
    );

    const empty = await find("#empty").textContent();
    expect(empty).toBe("");

    const whitespace = await find("#whitespace").textContent();
    expect(whitespace.trim()).toBe("");
  });

  test("Locator.innerText() with nested elements and formatting", async () => {
    const find = await openHtml(
      `<!doctype html><html><body>
            <div id="formatted">
              <p>Line 1</p>
              <p>Line 2</p>
              <ul>
                <li>Item 1</li>
                <li>Item 2</li>
              </ul>
            </div>
          </body></html>`,
    );

    const text = await find("#formatted").innerText();
    for (const fragment of ["Line 1", "Line 2", "Item 1", "Item 2"]) {
      expect(text).toContain(fragment);
    }
  });

  test("Locator.inputValue() on contenteditable elements", async () => {
    const find = await openHtml(
      `<!doctype html><html><body>
            <div id="editable" contenteditable="true">Editable content</div>
          </body></html>`,
    );

    const value = await find("#editable").inputValue();
    expect(value).toBe("Editable content");
  });

  test("Locator.innerHtml() preserves attributes and structure", async () => {
    const find = await openHtml(
      `<!doctype html><html><body>
            <div id="complex">
              <a href="/link" class="link-class">Link</a>
              <img src="image.png" alt="test" />
            </div>
          </body></html>`,
    );

    const html = await find("#complex").innerHtml();
    const expectedAttributes = [
      'href="/link"',
      'class="link-class"',
      'src="image.png"',
      'alt="test"',
    ];
    for (const attribute of expectedAttributes) {
      expect(html).toContain(attribute);
    }
  });

  test("Locator.textContent() vs innerText() with script/style tags", async () => {
    const find = await openHtml(
      `<!doctype html><html><body>
            <div id="mixed">
              Visible text
              <script>console.log('script');</script>
              <style>body { color: red; }</style>
              More visible
            </div>
          </body></html>`,
    );

    // Only the visible fragments are asserted for textContent().
    const textContent = await find("#mixed").textContent();
    expect(textContent).toContain("Visible text");
    expect(textContent).toContain("More visible");

    // innerText() must additionally leave out the script source.
    const innerText = await find("#mixed").innerText();
    expect(innerText).toContain("Visible text");
    expect(innerText).toContain("More visible");
    expect(innerText).not.toContain("console.log");
  });

  test("Locator.inputValue() returns empty string for non-input elements", async () => {
    const find = await openHtml(
      `<!doctype html><html><body>
            <div id="div">Not an input</div>
            <input id="empty-input" type="text" value="" />
          </body></html>`,
    );

    const divValue = await find("#div").inputValue();
    expect(divValue).toBe("");

    const emptyInput = await find("#empty-input").inputValue();
    expect(emptyInput).toBe("");
  });
});


================================================
FILE: packages/core/tests/integration/locator-count-iframe.spec.ts
================================================
import { expect, test } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import { v3DynamicTestConfig } from "./v3.dynamic.config.js";
import { closeV3 } from "./testUtils.js";

// Verifies that Locator.count() is scoped to a single frame: main-frame
// locators do not see iframe content, and frameLocator() chains count inside
// the targeted (possibly nested) iframe only.
test.describe("Locator count() method with iframes", () => {
  let v3: V3;

  // Fixed delay used to give the srcdoc iframes time to load.
  const pause = (ms: number) =>
    new Promise((resolve) => setTimeout(resolve, ms));

  // Loads `html` into the first page, waits `settleMs` for the iframes, and
  // returns the page.
  const openWithFrames = async (html: string, settleMs: number) => {
    const firstPage = v3.context.pages()[0];
    await firstPage.goto("data:text/html," + encodeURIComponent(html));
    await pause(settleMs);
    return firstPage;
  };

  test.beforeEach(async () => {
    v3 = new V3(v3DynamicTestConfig);
    await v3.init();
  });

  test.afterEach(async () => {
    await closeV3(v3);
  });

  test("count() does not search inside iframes by default", async () => {
    // Two buttons in the main frame, three more inside the iframe.
    const page = await openWithFrames(
      `
        <button>Main Frame Button 1</button>
        <button>Main Frame Button 2</button>
        <iframe id="test-iframe" srcdoc="
          <button>Iframe Button 1</button>
          <button>Iframe Button 2</button>
          <button>Iframe Button 3</button>
        "></iframe>
      `,
      500,
    );

    // Only the main-frame buttons may be counted.
    const mainFrameCount = await page.mainFrame().locator("button").count();
    expect(mainFrameCount).toBe(2);
  });

  test("count() works with frameLocator for iframe content", async () => {
    const page = await openWithFrames(
      `
        <button>Main Frame Button</button>
        <iframe id="test-iframe" srcdoc="
          <button>Iframe Button 1</button>
          <button>Iframe Button 2</button>
          <button>Iframe Button 3</button>
        "></iframe>
      `,
      500,
    );

    // Counting through the frame locator sees the three iframe buttons only.
    const iframeLocator = page.frameLocator("#test-iframe");
    const iframeCount = await iframeLocator.locator("button").count();
    expect(iframeCount).toBe(3);
  });

  test("count() with nested iframes", async () => {
    // Nested iframes get a longer grace period than the single-level fixtures.
    const page = await openWithFrames(
      `
        <div class="level-0">Main Frame</div>
        <iframe id="frame1" srcdoc="
          <div class='level-1'>Frame 1</div>
          <iframe id='frame2' srcdoc='
            <div class=&quot;level-2&quot;>Frame 2</div>
            <div class=&quot;level-2&quot;>Frame 2</div>
          '></iframe>
        "></iframe>
      `,
      800,
    );

    // Count at each nesting level.
    const mainCount = await page.mainFrame().locator(".level-0").count();
    expect(mainCount).toBe(1);

    const frame1Count = await page
      .frameLocator("#frame1")
      .locator(".level-1")
      .count();
    expect(frame1Count).toBe(1);

    const frame2Count = await page
      .frameLocator("#frame1")
      .frameLocator("#frame2")
      .locator(".level-2")
      .count();
    expect(frame2Count).toBe(2);
  });

  test("count() with same selector in multiple contexts", async () => {
    const page = await openWithFrames(
      `
        <span class="item">Main 1</span>
        <span class="item">Main 2</span>
        <iframe id="frame1" srcdoc="
          <span class='item'>Frame1 Item</span>
        "></iframe>
        <iframe id="frame2" srcdoc="
          <span class='item'>Frame2 Item 1</span>
          <span class='item'>Frame2 Item 2</span>
          <span class='item'>Frame2 Item 3</span>
        "></iframe>
      `,
      500,
    );

    // The same selector is counted separately in each context.
    const mainCount = await page.mainFrame().locator(".item").count();
    const frame1Count = await page
      .frameLocator("#frame1")
      .locator(".item")
      .count();
    const frame2Count = await page
      .frameLocator("#frame2")
      .locator(".item")
      .count();

    expect(mainCount).toBe(2); // Main frame items only
    expect(frame1Count).toBe(1); // Frame 1 items only
    expect(frame2Count).toBe(3); // Frame 2 items only
  });

  // NOTE: despite the title, the behavior asserted here is that counting
  // through a frameLocator for a missing iframe throws. The title is kept
  // unchanged so existing test filters and reports keep matching.
  test("count() returns 0 for non-existent iframe", async () => {
    const page = v3.context.pages()[0];

    await page.goto("data:text/html,<div>No iframes here</div>");

    // Capture the error and assert outside the try block. An assertion placed
    // inside the try would be swallowed by the catch and reported as a
    // confusing message mismatch instead of "did not throw".
    let caught: unknown;
    try {
      const frameLocator = page.frameLocator("#non-existent");
      await frameLocator.locator("button").count();
    } catch (error) {
      caught = error;
    }

    expect(
      caught,
      "expected count() through a missing iframe to throw",
    ).toBeDefined();
    const message = caught instanceof Error ? caught.message : String(caught);
    expect(message).toContain(
      "Could not find an element for the given xPath(s):",
    );
  });
});


================================================
FILE: packages/core/tests/integration/locator-count.spec.ts
================================================
import { expect, test } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import { v3DynamicTestConfig } from "./v3.dynamic.config.js";
import { closeV3 } from "./testUtils.js";

// Main-frame coverage for Locator.count(): CSS, XPath and text selectors,
// plus elements rendered inside an open shadow root.
test.describe("Locator count() method tests", () => {
  let v3: V3;

  // Each test runs against a freshly constructed and initialised V3 instance.
  test.beforeEach(async () => {
    v3 = new V3(v3DynamicTestConfig);
    await v3.init();
  });

  // Teardown is delegated to the shared closeV3 test utility.
  test.afterEach(async () => {
    await closeV3(v3);
  });

  test("count() returns correct number for CSS selectors", async () => {
    const page = v3.context.pages()[0];
    const url =
      "data:text/html,<div class='test'>1</div><div class='test'>2</div><div class='test'>3</div><span>4</span>";
    await page.goto(url);

    // Three divs carry class "test"; the trailing <span> does not.
    const matches = await page.mainFrame().locator(".test").count();
    expect(matches).toBe(3);
  });

  test("count() returns 0 for non-matching selectors", async () => {
    const page = v3.context.pages()[0];
    await page.goto("data:text/html,<div>Test</div>");

    // Nothing on the page has this class, so the count must be zero.
    const matches = await page.mainFrame().locator(".non-existent").count();
    expect(matches).toBe(0);
  });

  test("count() works with XPath selectors", async () => {
    const page = v3.context.pages()[0];
    const url =
      "data:text/html,<button>Button 1</button><button>Button 2</button><button>Button 3</button>";
    await page.goto(url);

    const matches = await page.mainFrame().locator("//button").count();
    expect(matches).toBe(3);
  });

  test("count() works with text selectors", async () => {
    const page = v3.context.pages()[0];
    const url =
      "data:text/html,<div>Click me</div><button>Click me</button><span>Don't click me</span>";
    await page.goto(url);

    const matches = await page.mainFrame().locator("text=Click me").count();

    // The text engine matches case-insensitive substrings, so the span
    // reading "Don't click me" is counted alongside the two exact matches.
    expect(matches).toBe(3);
  });

  test("count() handles shadow DOM elements", async () => {
    const page = v3.context.pages()[0];

    // Light DOM holds only the host; the inline script attaches an open
    // shadow root containing the two buttons.
    const hostWithShadowButtons =
      '<div id="host"></div>' +
      "<script>" +
      'const host = document.getElementById("host");' +
      'const shadow = host.attachShadow({mode: "open"});' +
      'shadow.innerHTML = "<button>1</button><button>2</button>";' +
      "</script>";

    await page.goto(
      "data:text/html," + encodeURIComponent(hostWithShadowButtons),
      { waitUntil: "load", timeoutMs: 30000 },
    );

    // Short fixed pause to let the shadow root get attached.
    await new Promise((done) => setTimeout(done, 100));

    const matches = await page.mainFrame().locator("button").count();
    expect(matches).toBe(2);
  });

  test("count() works with complex CSS selectors", async () => {
    const page = v3.context.pages()[0];
    const url =
      "data:text/html,<div class='container'><span class='item'>1</span><span class='item'>2</span></div><div><span class='item'>3</span></div>";
    await page.goto(url);

    // Only the two .item spans nested under .container qualify; the third
    // .item lives in a sibling div without that class.
    const matches = await page.mainFrame().locator(".container .item").count();
    expect(matches).toBe(2);
  });
});


================================================
FILE: packages/core/tests/integration/locator-fill.spec.ts
================================================
import { expect, test } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import { StagehandLocatorError } from "../../lib/v3/types/public/sdkErrors.js";
import { v3TestConfig } from "./v3.config.js";

// Locator.fill() integration tests: filling a date input on a page that
// blocks insertText, and the StagehandLocatorError raised when the target
// element misbehaves (for both xpath and CSS selectors).
test.describe("Locator.fill()", () => {
  let v3: V3;

  // Minimal page with a single date input, shared by the two failure tests.
  const plainDateInputPage = `<!doctype html><html><body>
            <input id="date" type="date" />
          </body></html>`;

  // Runs `action` and resolves with whatever it threw, or undefined when it
  // completed without throwing.
  const captureFailure = async (
    action: () => Promise<unknown>,
  ): Promise<unknown> => {
    try {
      await action();
    } catch (err) {
      return err;
    }
    return undefined;
  };

  // Shared contract for the failure tests: the error is a
  // StagehandLocatorError whose message names the operation, the selector
  // and the underlying cause.
  const expectFillFailure = (failure: unknown, selector: string): void => {
    expect(failure).toBeInstanceOf(StagehandLocatorError);
    if (failure instanceof Error) {
      const fragments = [
        "Error Filling Element",
        `selector: ${selector}`,
        "boom",
      ];
      for (const fragment of fragments) {
        expect(failure.message).toContain(fragment);
      }
    }
  };

  test.beforeEach(async () => {
    v3 = new V3(v3TestConfig);
    await v3.init();
  });

  // Best-effort teardown: a rejection from close() is deliberately ignored.
  test.afterEach(async () => {
    await v3?.close?.().catch(() => undefined);
  });

  test("fills date inputs via value setter even when beforeinput blocks insertText", async () => {
    const page = v3.context.pages()[0];

    // The page cancels every beforeinput event of type insertText on the
    // date input, so fill() only succeeds if it does not depend on that path.
    const blockingDatePage = `<!doctype html><html><body>
            <input id="date" type="date" />
            <script>
              const input = document.getElementById('date');
              input.addEventListener('beforeinput', (e) => {
                if (e && e.inputType === 'insertText') e.preventDefault();
              });
            </script>
          </body></html>`;
    await page.goto("data:text/html," + encodeURIComponent(blockingDatePage));

    const dateField = page.mainFrame().locator("xpath=/html/body/input");
    await dateField.fill("2026-01-01");

    expect(await dateField.inputValue()).toBe("2026-01-01");
  });

  test("xpath case: throws StagehandLocatorError when fill encounters an exception", async () => {
    const page = v3.context.pages()[0];
    const selector = "xpath=/html/body/input";

    await page.goto(
      "data:text/html," + encodeURIComponent(plainDateInputPage),
    );
    await page.waitForSelector(selector);

    // Booby-trap the element: any read of isConnected now throws "boom".
    await page.evaluate(() => {
      const target = document.querySelector("input");
      Object.defineProperty(target, "isConnected", {
        get() {
          throw new Error("boom");
        },
      });
    });

    const dateField = page.mainFrame().locator(selector);
    const failure = await captureFailure(() => dateField.fill("2026-01-01"));

    expectFillFailure(failure, selector);
  });

  test("css selector case: throws StagehandLocatorError when fill encounters an exception", async () => {
    const page = v3.context.pages()[0];
    const selector = "#date";

    await page.goto(
      "data:text/html," + encodeURIComponent(plainDateInputPage),
    );
    await page.waitForSelector(selector);

    // First trap: the element as seen from the page's main world.
    await page.evaluate(() => {
      const target = document.querySelector("input");
      Object.defineProperty(target, "isConnected", {
        get() {
          throw new Error("boom");
        },
        configurable: true,
      });
    });

    // Second trap: the same override inside the "v3-world" isolated world,
    // which is where CSS selectors are resolved.
    const isolatedWorld = await page.sendCDP<{
      executionContextId: number;
    }>("Page.createIsolatedWorld", {
      frameId: page.mainFrameId(),
      worldName: "v3-world",
    });

    await page.sendCDP("Runtime.evaluate", {
      expression: `(() => {
        const input = document.querySelector('input');
        if (input) {
          Object.defineProperty(input, 'isConnected', {
            get() { throw new Error("boom"); },
            configurable: true
          });
        }
      })()`,
      contextId: isolatedWorld.executionContextId,
    });

    const dateField = page.mainFrame().locator(selector);
    const failure = await captureFailure(() => dateField.fill("2026-01-01"));

    expectFillFailure(failure, selector);
  });
});


================================================
FILE: packages/core/tests/integration/locator-input-methods.spec.ts
================================================
import { expect, test } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import { v3TestConfig } from "./v3.config.js";

// Exercises the basic input-oriented Locator methods against small inline
// pages: fill, type, hover, isVisible and isChecked.
test.describe("Locator input methods (fill, type, hover, isVisible, isChecked)", () => {
  let v3: V3;

  // Wraps an HTML snippet in a URL-encoded data: URL the browser can load.
  const asDataUrl = (html: string): string =>
    "data:text/html," + encodeURIComponent(html);

  test.beforeEach(async () => {
    v3 = new V3(v3TestConfig);
    await v3.init();
  });

  // Best-effort teardown: a rejection from close() is deliberately ignored.
  test.afterEach(async () => {
    await v3?.close?.().catch(() => undefined);
  });

  test("Locator.fill() sets input value directly", async () => {
    const page = v3.context.pages()[0];

    await page.goto(
      asDataUrl(
        `<!doctype html><html><body>
            <input id="name" type="text" />
            <div id="out"></div>
          </body></html>`,
      ),
    );

    const nameField = page.mainFrame().locator("#name");
    await nameField.fill("Hello World");

    expect(await nameField.inputValue()).toBe("Hello World");
  });

  test("Locator.type() types text character by character", async () => {
    const page = v3.context.pages()[0];

    await page.goto(
      asDataUrl(
        `<!doctype html><html><body>
            <input id="search" type="text" />
          </body></html>`,
      ),
    );

    const searchField = page.mainFrame().locator("#search");
    await searchField.type("test123", { delay: 10 });

    expect(await searchField.inputValue()).toBe("test123");
  });

  test("Locator.hover() moves mouse to element center", async () => {
    const page = v3.context.pages()[0];

    // The button records hover state in data-hovered via its mouse handlers.
    await page.goto(
      asDataUrl(
        `<!doctype html><html><body>
            <button id="btn" onmouseover="this.dataset.hovered='true'" onmouseout="this.dataset.hovered='false'">Hover Me</button>
          </body></html>`,
      ),
    );

    await page.mainFrame().locator("#btn").hover();

    const wasHovered = await page.mainFrame().evaluate(() => {
      const button = document.getElementById("btn") as HTMLButtonElement | null;
      return button?.dataset.hovered === "true";
    });

    expect(wasHovered).toBe(true);
  });

  test("Locator.isVisible() returns true for visible elements", async () => {
    const page = v3.context.pages()[0];

    await page.goto(
      asDataUrl(
        `<!doctype html><html><body>
            <div id="visible">I am visible</div>
            <div id="hidden" style="display:none">I am hidden</div>
            <div id="invisible" style="visibility:hidden">I am invisible</div>
            <div id="transparent" style="opacity:0">I am transparent</div>
            <div id="zero-size" style="width:0;height:0">Zero size</div>
          </body></html>`,
      ),
    );

    // Selector -> expected visibility; only the unstyled div counts as visible.
    const cases: Array<[string, boolean]> = [
      ["#visible", true],
      ["#hidden", false],
      ["#invisible", false],
      ["#transparent", false],
      ["#zero-size", false],
    ];

    for (const [selector, expected] of cases) {
      const actual = await page.mainFrame().locator(selector).isVisible();
      expect(actual).toBe(expected);
    }
  });

  test("Locator.isChecked() detects checkbox state", async () => {
    const page = v3.context.pages()[0];

    await page.goto(
      asDataUrl(
        `<!doctype html><html><body>
            <input id="checked" type="checkbox" checked />
            <input id="unchecked" type="checkbox" />
            <input id="radio-selected" type="radio" name="opt" checked />
            <input id="radio-unselected" type="radio" name="opt" />
          </body></html>`,
      ),
    );

    // Selector -> expected checked state, for both checkboxes and radios.
    const cases: Array<[string, boolean]> = [
      ["#checked", true],
      ["#unchecked", false],
      ["#radio-selected", true],
      ["#radio-unselected", false],
    ];

    for (const [selector, expected] of cases) {
      const actual = await page.mainFrame().locator(selector).isChecked();
      expect(actual).toBe(expected);
    }
  });

  test("Locator.fill() on textarea", async () => {
    const page = v3.context.pages()[0];

    await page.goto(
      asDataUrl(
        `<!doctype html><html><body>
            <textarea id="ta"></textarea>
          </body></html>`,
      ),
    );

    const textArea = page.mainFrame().locator("#ta");
    await textArea.fill("Multi\nline\ntext");

    // Embedded newlines must round-trip unchanged.
    expect(await textArea.inputValue()).toBe("Multi\nline\ntext");
  });

  test("Locator.fill() clears and sets new value", async () => {
    const page = v3.context.pages()[0];

    await page.goto(
      asDataUrl(
        `<!doctype html><html><body>
            <input id="inp" type="text" value="initial" />
          </body></html>`,
      ),
    );

    const field = page.mainFrame().locator("#inp");

    // Precondition: the input starts with its HTML-provided value.
    const before = await field.inputValue();
    expect(before).toBe("initial");

    await field.fill("replaced");

    // The old value is replaced, not appended to.
    const after = await field.inputValue();
    expect(after).toBe("replaced");
  });
});


================================================
FILE: packages/core/tests/integration/locator-nth.spec.ts
================================================
import { expect, test } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import { v3DynamicTestConfig } from "./v3.dynamic.config.js";
import { closeV3 } from "./testUtils.js";

// Integration coverage for Locator.nth(): index-based selection on the main
// frame for CSS, XPath and text selectors, through open shadow roots, with
// out-of-range indexes, and in combination with other locator methods.
test.describe("Locator nth() method tests", () => {
  let v3: V3;

  // Wraps an HTML snippet in a URL-encoded data: URL the browser can load.
  const asDataUrl = (html: string): string =>
    "data:text/html," + encodeURIComponent(html);

  /**
   * Asserts that, on the first page's main frame, `locator(selector).nth(i)`
   * has text content `texts[i]` for every index of `texts`, checked in order.
   */
  const expectNthTexts = async (
    selector: string,
    texts: readonly string[],
  ): Promise<void> => {
    const page = v3.context.pages()[0];
    for (const [index, expected] of texts.entries()) {
      const actual = await page
        .mainFrame()
        .locator(selector)
        .nth(index)
        .textContent();
      expect(actual).toBe(expected);
    }
  };

  test.beforeEach(async () => {
    v3 = new V3(v3DynamicTestConfig);
    await v3.init();
  });

  test.afterEach(async () => {
    await closeV3(v3);
  });

  test("nth() returns correct element for CSS selectors", async () => {
    const page = v3.context.pages()[0];

    await page.goto(
      asDataUrl(
        '<div class="test" id="first">1</div>' +
          '<div class="test" id="second">2</div>' +
          '<div class="test" id="third">3</div>' +
          '<span id="other">4</span>',
      ),
    );

    await expectNthTexts(".test", ["1", "2", "3"]);
  });

  test("nth() returns correct element for XPath selectors", async () => {
    const page = v3.context.pages()[0];

    await page.goto(
      asDataUrl(
        '<button id="btn1">Button 1</button>' +
          '<button id="btn2">Button 2</button>' +
          '<button id="btn3">Button 3</button>',
      ),
    );

    await expectNthTexts("//button", ["Button 1", "Button 2", "Button 3"]);
  });

  test("nth() returns correct element for text selectors", async () => {
    const page = v3.context.pages()[0];

    // Each element gets a distinct text that still contains "Click me".
    // With identical texts every nth(i) assertion would pass even if the
    // index were ignored, so the test could not detect a broken nth().
    await page.goto(
      asDataUrl(
        '<div id="d1">Click me first</div>' +
          '<button id="b1">Click me second</button>' +
          '<span id="s1">Click me third</span>',
      ),
    );

    await expectNthTexts("text=Click me", [
      "Click me first",
      "Click me second",
      "Click me third",
    ]);
  });

  test("nth() with shadow DOM", async () => {
    const page = v3.context.pages()[0];

    // Light DOM holds only the host; the inline script attaches an open
    // shadow root containing the three buttons.
    await page.goto(
      asDataUrl(
        '<div id="host"></div>' +
          "<script>" +
          'const host = document.getElementById("host");' +
          'const shadow = host.attachShadow({mode: "open"});' +
          'shadow.innerHTML = "<button>Shadow Button 1</button><button>Shadow Button 2</button><button>Shadow Button 3</button>";' +
          "</script>",
      ),
      { waitUntil: "load", timeoutMs: 30000 },
    );

    // Short fixed pause to let the shadow root get attached.
    await new Promise((resolve) => setTimeout(resolve, 100));

    await expectNthTexts("button", [
      "Shadow Button 1",
      "Shadow Button 2",
      "Shadow Button 3",
    ]);
  });

  test("nth() with out of bounds index throws error", async () => {
    const page = v3.context.pages()[0];

    await page.goto(
      asDataUrl('<div class="test">1</div>' + '<div class="test">2</div>'),
    );

    // Only two elements match, so index 5 cannot resolve. Building the
    // locator is not expected to fail; acting on it is.
    const locator = page.mainFrame().locator(".test").nth(5);
    let error: unknown = null;
    try {
      await locator.textContent();
    } catch (e) {
      error = e;
    }

    expect(error).not.toBeNull();
  });

  test("nth() works with complex CSS selectors", async () => {
    const page = v3.context.pages()[0];

    await page.goto(
      asDataUrl(
        '<div class="container">' +
          '<span class="item">1</span>' +
          '<span class="item">2</span>' +
          "</div>" +
          "<div>" +
          '<span class="item">3</span>' +
          "</div>",
      ),
    );

    // Only the two .item spans nested under .container are addressable.
    await expectNthTexts(".container .item", ["1", "2"]);
  });

  test("nth() can be chained with other locator methods", async () => {
    const page = v3.context.pages()[0];

    await page.goto(
      asDataUrl(
        '<div class="test">First</div>' +
          '<div class="test">Second</div>' +
          '<div class="test">Third</div>',
      ),
    );

    // The locator returned by nth() must support further locator actions.
    const locator = page.mainFrame().locator(".test").nth(1);
    expect(await locator.textContent()).toBe("Second");
    expect(await locator.isVisible()).toBe(true);
  });

  test("nth(0) is equivalent to first()", async () => {
    const page = v3.context.pages()[0];

    await page.goto(
      asDataUrl(
        '<div class="test">First</div>' +
          '<div class="test">Second</div>' +
          '<div class="test">Third</div>',
      ),
    );

    const nthText = await page.mainFrame().locator(".test").nth(0).textContent();
    const firstText = await page
      .mainFrame()
      .locator(".test")
      .first()
      .textContent();

    expect(nthText).toBe(firstText);
    expect(nthText).toBe("First");
  });

  test("nth() works correctly with iframe selectors", async () => {
    const page = v3.context.pages()[0];

    // Two buttons in the main document plus an iframe whose document is
    // written by script and holds two more buttons.
    await page.goto(
      asDataUrl(
        '<button id="main1">Main Button 1</button>' +
          '<button id="main2">Main Button 2</button>' +
          '<iframe id="frame1"></iframe>' +
          "<script>" +
          'const frame = document.getElementById("frame1");' +
          "const doc = frame.contentDocument;" +
          "doc.open();" +
          'doc.write("<button>Frame Button 1</button><button>Frame Button 2</button>");' +
          "doc.close();" +
          "</script>",
      ),
    );

    // Short fixed pause to let the iframe content settle.
    await new Promise((resolve) => setTimeout(resolve, 100));

    // Only the main-frame buttons are asserted here.
    await expectNthTexts("button", ["Main Button 1", "Main Button 2"]);
  });
});


================================================
FILE: packages/core/tests/integration/locator-select-option.spec.ts
================================================
import { expect, test } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import { v3TestConfig } from "./v3.config.js";

// Integration coverage for Locator.selectOption(): selecting by value and by
// label, multi-selects, change events, optgroups, and edge-case values
// (empty string, numeric-looking strings, disabled options).
test.describe("Locator.selectOption() method", () => {
  let v3: V3;

  // Wraps an HTML snippet in a URL-encoded data: URL the browser can load.
  const asDataUrl = (html: string): string =>
    "data:text/html," + encodeURIComponent(html);

  test.beforeEach(async () => {
    v3 = new V3(v3TestConfig);
    await v3.init();
  });

  test.afterEach(async () => {
    await v3?.close?.().catch((e) => {
      void e; // ignore cleanup errors
    });
  });

  test("selectOption() selects single option by value", async () => {
    const page = v3.context.pages()[0];

    await page.goto(
      asDataUrl(
        `<!doctype html><html><body>
            <select id="fruit">
              <option value="">-- Choose --</option>
              <option value="apple">Apple</option>
              <option value="banana">Banana</option>
              <option value="cherry">Cherry</option>
            </select>
          </body></html>`,
      ),
    );

    const select = page.mainFrame().locator("#fruit");
    const selected = await select.selectOption("banana");

    // Both the return value and the live DOM must reflect the selection.
    expect(selected).toEqual(["banana"]);

    const value = await page.mainFrame().evaluate(() => {
      const s = document.getElementById("fruit") as HTMLSelectElement | null;
      return s?.value;
    });
    expect(value).toBe("banana");
  });

  test("selectOption() selects option by label/text", async () => {
    const page = v3.context.pages()[0];

    await page.goto(
      asDataUrl(
        `<!doctype html><html><body>
            <select id="country">
              <option value="us">United States</option>
              <option value="uk">United Kingdom</option>
              <option value="ca">Canada</option>
            </select>
          </body></html>`,
      ),
    );

    const select = page.mainFrame().locator("#country");
    const selected = await select.selectOption("United Kingdom");

    // Selecting by visible label still reports the option's value.
    expect(selected).toEqual(["uk"]);
  });

  test("selectOption() selects multiple options in multiple select", async () => {
    const page = v3.context.pages()[0];

    await page.goto(
      asDataUrl(
        `<!doctype html><html><body>
            <select id="colors" multiple>
              <option value="red">Red</option>
              <option value="green">Green</option>
              <option value="blue">Blue</option>
              <option value="yellow">Yellow</option>
            </select>
          </body></html>`,
      ),
    );

    const select = page.mainFrame().locator("#colors");
    const selected = await select.selectOption(["red", "blue"]);

    // Order is not part of the contract being checked, so compare sorted
    // copies; Array.prototype.sort would otherwise mutate the result in place.
    expect([...selected].sort()).toEqual(["blue", "red"]);

    const values = await page.mainFrame().evaluate(() => {
      const s = document.getElementById("colors") as HTMLSelectElement | null;
      return Array.from(s?.selectedOptions ?? []).map((o) => o.value);
    });
    expect([...values].sort()).toEqual(["blue", "red"]);
  });

  test("selectOption() deselects previous option on single select", async () => {
    const page = v3.context.pages()[0];

    await page.goto(
      asDataUrl(
        `<!doctype html><html><body>
            <select id="size">
              <option value="s">Small</option>
              <option value="m" selected>Medium</option>
              <option value="l">Large</option>
            </select>
          </body></html>`,
      ),
    );

    const select = page.mainFrame().locator("#size");

    // Precondition: the preselected option is "m".
    let value = await page.mainFrame().evaluate(() => {
      const s = document.getElementById("size") as HTMLSelectElement | null;
      return s?.value;
    });
    expect(value).toBe("m");

    await select.selectOption("l");

    value = await page.mainFrame().evaluate(() => {
      const s = document.getElementById("size") as HTMLSelectElement | null;
      return s?.value;
    });
    expect(value).toBe("l");
  });

  test("selectOption() triggers change event", async () => {
    const page = v3.context.pages()[0];

    // The page mirrors every change event into #out as "changed-<value>".
    await page.goto(
      asDataUrl(
        `<!doctype html><html><body>
            <select id="opt">
              <option value="a">Option A</option>
              <option value="b">Option B</option>
            </select>
            <div id="out"></div>
            <script>
              const select = document.getElementById('opt');
              const out = document.getElementById('out');
              select.addEventListener('change', () => {
                out.textContent = 'changed-' + select.value;
              });
            </script>
          </body></html>`,
      ),
    );

    const select = page.mainFrame().locator("#opt");
    await select.selectOption("b");

    const output = await page.mainFrame().evaluate(() => {
      const out = document.getElementById("out");
      return out?.textContent;
    });
    expect(output).toBe("changed-b");
  });

  test("selectOption() with optgroup structure", async () => {
    const page = v3.context.pages()[0];

    await page.goto(
      asDataUrl(
        `<!doctype html><html><body>
            <select id="grouped">
              <optgroup label="Fruits">
                <option value="apple">Apple</option>
                <option value="orange">Orange</option>
              </optgroup>
              <optgroup label="Vegetables">
                <option value="carrot">Carrot</option>
                <option value="celery">Celery</option>
              </optgroup>
            </select>
          </body></html>`,
      ),
    );

    const select = page.mainFrame().locator("#grouped");
    await select.selectOption("celery");

    const value = await page.mainFrame().evaluate(() => {
      const s = document.getElementById("grouped") as HTMLSelectElement | null;
      return s?.value;
    });
    expect(value).toBe("celery");
  });

  test("selectOption() returns array of selected values", async () => {
    const page = v3.context.pages()[0];

    await page.goto(
      asDataUrl(
        `<!doctype html><html><body>
            <select id="multi" multiple>
              <option value="1">One</option>
              <option value="2">Two</option>
              <option value="3">Three</option>
            </select>
          </body></html>`,
      ),
    );

    const select = page.mainFrame().locator("#multi");
    const selected = await select.selectOption(["1", "3"]);

    expect(selected).toContain("1");
    expect(selected).toContain("3");
    expect(selected.length).toBe(2);
  });

  test("selectOption() with empty string value", async () => {
    const page = v3.context.pages()[0];

    // "yes" is preselected so the empty-valued option is NOT the initial
    // selection. If "" were already selected, the final DOM assertion would
    // pass even when selectOption("") did nothing.
    await page.goto(
      asDataUrl(
        `<!doctype html><html><body>
            <select id="opt">
              <option value="">None</option>
              <option value="yes" selected>Yes</option>
              <option value="no">No</option>
            </select>
          </body></html>`,
      ),
    );

    const select = page.mainFrame().locator("#opt");

    // Precondition: the select starts on the non-empty option.
    let value = await page.mainFrame().evaluate(() => {
      const s = document.getElementById("opt") as HTMLSelectElement | null;
      return s?.value;
    });
    expect(value).toBe("yes");

    const selected = await select.selectOption("");

    expect(selected).toEqual([""]);

    value = await page.mainFrame().evaluate(() => {
      const s = document.getElementById("opt") as HTMLSelectElement | null;
      return s?.value;
    });
    expect(value).toBe("");
  });

  test("selectOption() with numeric values", async () => {
    const page = v3.context.pages()[0];

    await page.goto(
      asDataUrl(
        `<!doctype html><html><body>
            <select id="nums">
              <option value="1">One</option>
              <option value="2">Two</option>
              <option value="10">Ten</option>
              <option value="100">Hundred</option>
            </select>
          </body></html>`,
      ),
    );

    const select = page.mainFrame().locator("#nums");
    // "10" must match its own option exactly, not "1" or "100".
    await select.selectOption("10");

    const value = await page.mainFrame().evaluate(() => {
      const s = document.getElementById("nums") as HTMLSelectElement | null;
      return s?.value;
    });
    expect(value).toBe("10");
  });

  test("selectOption() with disabled option", async () => {
    const page = v3.context.pages()[0];

    await page.goto(
      asDataUrl(
        `<!doctype html><html><body>
            <select id="mixed">
              <option value="a">Available</option>
              <option value="b" disabled>Unavailable</option>
              <option value="c">Available</option>
            </select>
          </body></html>`,
      ),
    );

    const select = page.mainFrame().locator("#mixed");
    // Should still select disabled option if explicitly requested
    await select.selectOption("b");

    const value = await page.mainFrame().evaluate(() => {
      const s = document.getElementById("mixed") as HTMLSelectElement | null;
      return s?.value;
    });
    expect(value).toBe("b");
  });
});


================================================
FILE: packages/core/tests/integration/logger-initialization.spec.ts
================================================
import { test, expect } from "@playwright/test";
import {
  bindInstanceLogger,
  unbindInstanceLogger,
  withInstanceLogContext,
  v3Logger,
} from "../../lib/v3/logger.js";
import type { LogLine } from "../../lib/v3/types/public/logs.js";

test.describe("V3 Logger Instance Routing", () => {
  // Intentionally empty hook: there is no shared teardown in this suite.
  // Every test that binds an instance logger unbinds it itself (in a
  // `finally` block), and tests that patch `console.*` restore it themselves.
  test.afterEach(() => {
    // Clean up is handled by unbindInstanceLogger calls in tests
  });

  // A log emitted inside an instance context must reach that instance's
  // bound logger.
  test("bindInstanceLogger routes logs to correct instance", () => {
    const id = "test-instance-001";
    const received: LogLine[] = [];

    bindInstanceLogger(id, (entry) => {
      received.push(entry);
    });

    try {
      // Emit exactly one line while the instance context is active.
      withInstanceLogContext(id, () => {
        v3Logger({
          category: "test",
          message: "Test message for instance",
          level: 1,
        });
      });

      // The bound logger saw that single line.
      expect(received.length).toBe(1);
      expect(received[0].message).toBe("Test message for instance");
    } finally {
      unbindInstanceLogger(id);
    }
  });

  // After unbinding, logs for that instance id go to the console instead of
  // the previously bound logger.
  test("unbindInstanceLogger stops routing", () => {
    const id = "test-instance-002";
    const routed: LogLine[] = [];
    const printed: string[] = [];
    const savedLog = console.log;

    try {
      // Intercept console.log so the fallback path can be observed.
      console.log = (msg: string) => {
        printed.push(msg);
      };

      bindInstanceLogger(id, (entry) => {
        routed.push(entry);
      });
      // Remove the binding straight away, before anything is logged.
      unbindInstanceLogger(id);

      withInstanceLogContext(id, () => {
        v3Logger({
          category: "test",
          message: "After unbind",
          level: 1,
        });
      });

      // Nothing reached the (now unbound) instance logger...
      expect(routed.length).toBe(0);
      // ...but the console fallback printed something.
      expect(printed.length).toBeGreaterThan(0);
    } finally {
      console.log = savedLog;
      unbindInstanceLogger(id);
    }
  });

  // Two bound instances each receive only the line logged in their context.
  test("multiple instances have isolated log routing", () => {
    const firstId = "test-instance-1";
    const secondId = "test-instance-2";
    const firstLogs: LogLine[] = [];
    const secondLogs: LogLine[] = [];

    bindInstanceLogger(firstId, (line) => firstLogs.push(line));
    bindInstanceLogger(secondId, (line) => secondLogs.push(line));

    // Emits one level-1 "test" line inside the given instance's context.
    const logAs = (id: string, message: string) => {
      withInstanceLogContext(id, () => {
        v3Logger({ category: "test", message, level: 1 });
      });
    };

    try {
      logAs(firstId, "From instance 1");
      logAs(secondId, "From instance 2");

      // Exactly one line each, and it is the instance's own.
      expect(firstLogs.length).toBe(1);
      expect(secondLogs.length).toBe(1);
      expect(firstLogs[0].message).toBe("From instance 1");
      expect(secondLogs[0].message).toBe("From instance 2");
    } finally {
      unbindInstanceLogger(firstId);
      unbindInstanceLogger(secondId);
    }
  });

  // With no instance context active, v3Logger writes through console.log.
  test("v3Logger falls back to console when no instance context", () => {
    const printed: string[] = [];
    const savedLog = console.log;

    try {
      console.log = (msg: string) => {
        printed.push(msg);
      };

      // Emitted outside of any withInstanceLogContext call.
      v3Logger({
        category: "test",
        message: "Console fallback log",
        level: 1,
      });

      expect(printed.length).toBeGreaterThan(0);
      expect(printed.join("\n")).toContain("Console fallback log");
    } finally {
      console.log = savedLog;
    }
  });

  // A throwing instance logger must not propagate; the line is printed via
  // the console fallback instead.
  test("v3Logger falls back to console when instance logger throws", () => {
    const id = "failing-instance";
    const printed: string[] = [];
    const savedLog = console.log;

    try {
      console.log = (msg: string) => {
        printed.push(msg);
      };

      // The bound logger always fails.
      bindInstanceLogger(id, () => {
        throw new Error("Instance logger failed");
      });

      withInstanceLogContext(id, () => {
        const emit = () => {
          v3Logger({
            category: "test",
            message: "Test with failing instance logger",
            level: 1,
          });
        };
        // The failure is swallowed by v3Logger rather than surfacing here.
        expect(emit).not.toThrow();
      });

      // The message still made it out through console.log.
      expect(printed.length).toBeGreaterThan(0);
      expect(printed.join("\n")).toContain("Test with failing instance logger");
    } finally {
      console.log = savedLog;
      unbindInstanceLogger(id);
    }
  });

  // An inner context overrides the outer one only for its own duration.
  test("withInstanceLogContext nests properly", () => {
    const outerId = "outer-instance";
    const innerId = "inner-instance";
    const outerSeen: LogLine[] = [];
    const innerSeen: LogLine[] = [];

    bindInstanceLogger(outerId, (line) => outerSeen.push(line));
    bindInstanceLogger(innerId, (line) => innerSeen.push(line));

    // Emits a level-1 "test" line in whatever context is currently active.
    const emit = (message: string) => {
      v3Logger({ category: "test", message, level: 1 });
    };

    try {
      withInstanceLogContext(outerId, () => {
        emit("Outer context");

        withInstanceLogContext(innerId, () => {
          emit("Inner context");
        });

        // Once the inner call returns, the outer context is active again.
        emit("Back to outer context");
      });

      // Outer logger: the two lines emitted around the nested call.
      expect(outerSeen.length).toBe(2);
      expect(outerSeen[0].message).toBe("Outer context");
      expect(outerSeen[1].message).toBe("Back to outer context");

      // Inner logger: only the nested line.
      expect(innerSeen.length).toBe(1);
      expect(innerSeen[0].message).toBe("Inner context");
    } finally {
      unbindInstanceLogger(outerId);
      unbindInstanceLogger(innerId);
    }
  });

  // The callback's return value is passed through to the caller.
  test("withInstanceLogContext returns function result", () => {
    const id = "return-test-instance";
    bindInstanceLogger(id, () => {});

    try {
      const produce = () => ({ success: true, value: 42 });
      const outcome = withInstanceLogContext(id, () => {
        return produce();
      });

      expect(outcome).toEqual({ success: true, value: 42 });
    } finally {
      unbindInstanceLogger(id);
    }
  });

  // The instance context must survive an `await` inside an async callback.
  test("withInstanceLogContext works with async functions", async () => {
    const id = "async-test-instance";
    const received: LogLine[] = [];

    bindInstanceLogger(id, (line) => received.push(line));

    // Emits a level-1 "test" line in the currently active context.
    const emit = (message: string) => {
      v3Logger({ category: "test", message, level: 1 });
    };

    try {
      const outcome = await withInstanceLogContext(id, async () => {
        emit("Log from async context");

        // Yield to the event loop via a timer before logging again.
        await new Promise((resolve) => setTimeout(resolve, 10));

        emit("Log after await");

        return "async result";
      });

      expect(outcome).toBe("async result");
      expect(received.length).toBe(2);
      expect(received[0].message).toBe("Log from async context");
      expect(received[1].message).toBe("Log after await");
    } finally {
      unbindInstanceLogger(id);
    }
  });

  // Levels 0/1/2 go to console.error/log/debug and carry ERROR/INFO/DEBUG
  // in the formatted output.
  test("console fallback formats different log levels correctly", () => {
    const consoleOutput: { level: string; msg: string }[] = [];
    const saved = {
      log: console.log,
      error: console.error,
      debug: console.debug,
    };

    // Builds a console stub that records which channel was used.
    const recordAs = (level: string) => (msg: string) => {
      consoleOutput.push({ level, msg });
    };

    try {
      console.log = recordAs("log");
      console.error = recordAs("error");
      console.debug = recordAs("debug");

      // One line per level, emitted without any instance context:
      // error (0), info (1), debug (2).
      const emitted = [
        { message: "Error message", level: 0 },
        { message: "Info message", level: 1 },
        { message: "Debug message", level: 2 },
      ] as const;
      for (const { message, level } of emitted) {
        v3Logger({ category: "test", message, level });
      }

      // Expected console channel, level tag and message text, in order.
      const expected = [
        { channel: "error", tag: "ERROR", text: "Error message" },
        { channel: "log", tag: "INFO", text: "Info message" },
        { channel: "debug", tag: "DEBUG", text: "Debug message" },
      ];

      expect(consoleOutput.length).toBe(3);
      expected.forEach(({ channel, tag, text }, i) => {
        expect(consoleOutput[i].level).toBe(channel);
        expect(consoleOutput[i].msg).toContain(tag);
        expect(consoleOutput[i].msg).toContain(text);
      });
    } finally {
      console.log = saved.log;
      console.error = saved.error;
      console.debug = saved.debug;
    }
  });

  // The console fallback includes the message and every auxiliary key in a
  // single printed line.
  test("console fallback formats auxiliary data", () => {
    const printed: string[] = [];
    const savedLog = console.log;

    try {
      console.log = (msg: string) => {
        printed.push(msg);
      };

      v3Logger({
        category: "test",
        message: "Message with auxiliary",
        level: 1,
        auxiliary: {
          stringValue: { value: "test", type: "string" },
          integerValue: { value: "42", type: "integer" },
          objectValue: {
            value: JSON.stringify({ nested: "data" }),
            type: "object",
          },
        },
      });

      expect(printed.length).toBe(1);
      const [line] = printed;
      const fragments = [
        "Message with auxiliary",
        "stringValue",
        "integerValue",
        "objectValue",
      ];
      for (const fragment of fragments) {
        expect(line).toContain(fragment);
      }
    } finally {
      console.log = savedLog;
    }
  });

  // Ten bound instances log once each (sequentially, each in its own
  // context); every logger must end up with only its own line.
  test("concurrent instances don't interfere", () => {
    const ids = Array.from({ length: 10 }, (_, n) => `instance-${n}`);
    const captured = new Map<string, LogLine[]>();

    // Give every instance its own sink and bind it.
    for (const id of ids) {
      const sink: LogLine[] = [];
      captured.set(id, sink);
      bindInstanceLogger(id, (line) => sink.push(line));
    }

    try {
      // One line per instance, tagged with the instance's position.
      ids.forEach((id, position) => {
        withInstanceLogContext(id, () => {
          v3Logger({
            category: "test",
            message: `Message from ${id}`,
            level: 1,
            auxiliary: {
              index: { value: String(position), type: "integer" },
            },
          });
        });
      });

      // Each sink holds exactly the line emitted in its own context.
      for (const id of ids) {
        const sink = captured.get(id)!;
        expect(sink.length).toBe(1);
        expect(sink[0].message).toBe(`Message from ${id}`);
      }
    } finally {
      for (const id of ids) {
        unbindInstanceLogger(id);
      }
    }
  });
});

test.describe("V3 Logger with External Logger (Production Pattern)", () => {
  // Intentionally empty hook: it performs no cleanup itself. Each test in
  // this suite unbinds its own instance logger in a `finally` block.
  test.afterEach(() => {
    // No-op: instance loggers are unbound by the individual tests
  });

  // An externally supplied logger bound to an instance receives every line
  // at every level, in emission order.
  test("external logger receives all logs from v3Logger", () => {
    const id = "v3-instance-with-external";
    const collected: LogLine[] = [];

    // Stand-in for a user-provided logger handed to the V3 constructor.
    function externalLogger(line: LogLine) {
      collected.push(line);
    }

    bindInstanceLogger(id, externalLogger);

    try {
      withInstanceLogContext(id, () => {
        v3Logger({
          category: "a11y/snapshot",
          message: "Capturing hybrid snapshot",
          level: 0,
        });

        v3Logger({
          category: "handlers/act",
          message: "Executing action",
          level: 1,
          auxiliary: {
            action: { value: "click", type: "string" },
          },
        });

        v3Logger({
          category: "debug",
          message: "Debug details",
          level: 2,
        });
      });

      // Three lines in, three lines out, same order.
      expect(collected.length).toBe(3);
      const expectedMessages = [
        "Capturing hybrid snapshot",
        "Executing action",
        "Debug details",
      ];
      expectedMessages.forEach((message, i) => {
        expect(collected[i].message).toBe(message);
      });
    } finally {
      unbindInstanceLogger(id);
    }
  });

  // Binding a closure that delegates to a wrapper object's `log` method
  // still delivers the line to the underlying sink.
  test("StagehandLogger wrapper forwards to external logger", () => {
    const id = "v3-with-stagehand-wrapper";
    const collected: LogLine[] = [];

    // Minimal stand-in for the StagehandLogger wrapper: `log` hands the line
    // to the external sink.
    const wrapper = {
      log(line: LogLine) {
        collected.push(line);
      },
    };

    bindInstanceLogger(id, (line) => wrapper.log(line));

    try {
      withInstanceLogContext(id, () => {
        v3Logger({
          category: "test",
          message: "Log through StagehandLogger wrapper",
          level: 1,
        });
      });

      expect(collected.length).toBe(1);
      const [only] = collected;
      expect(only.message).toBe("Log through StagehandLogger wrapper");
    } finally {
      unbindInstanceLogger(id);
    }
  });

  // Two instances with separate external loggers: each logger only sees the
  // activity of its own instance.
  test("multiple V3 instances with different external loggers", () => {
    // One fixture per simulated V3 instance.
    const fixtures = [
      {
        id: "v3-instance-1",
        category: "instance1",
        message: "Instance 1 activity",
        sink: [] as LogLine[],
      },
      {
        id: "v3-instance-2",
        category: "instance2",
        message: "Instance 2 activity",
        sink: [] as LogLine[],
      },
    ];

    for (const { id, sink } of fixtures) {
      bindInstanceLogger(id, (line) => sink.push(line));
    }

    try {
      // Each instance logs once inside its own context.
      for (const { id, category, message } of fixtures) {
        withInstanceLogContext(id, () => {
          v3Logger({ category, message, level: 1 });
        });
      }

      // One line per sink, and it is that instance's message.
      for (const { sink } of fixtures) {
        expect(sink.length).toBe(1);
      }
      for (const { sink, message } of fixtures) {
        expect(sink[0].message).toBe(message);
      }
    } finally {
      for (const { id } of fixtures) {
        unbindInstanceLogger(id);
      }
    }
  });

  // Auxiliary fields attached to a log line arrive at the external logger
  // unchanged.
  test("external logger receives logs with auxiliary data preserved", () => {
    const id = "v3-with-auxiliary";
    const collected: LogLine[] = [];

    bindInstanceLogger(id, (line) => collected.push(line));

    try {
      withInstanceLogContext(id, () => {
        v3Logger({
          category: "extract",
          message: "Extracting data",
          level: 1,
          auxiliary: {
            selector: { value: "xpath=/html/body", type: "string" },
            timeout: { value: "5000", type: "integer" },
            retries: { value: "3", type: "integer" },
            metadata: {
              value: JSON.stringify({ key: "value" }),
              type: "object",
            },
          },
        });
      });

      expect(collected.length).toBe(1);
      const aux = collected[0].auxiliary;
      expect(aux).toBeDefined();
      expect(aux?.selector?.value).toBe("xpath=/html/body");
      expect(aux?.timeout?.value).toBe("5000");
      expect(aux?.retries?.value).toBe("3");
      expect(aux?.metadata?.type).toBe("object");
    } finally {
      unbindInstanceLogger(id);
    }
  });

  // Fifty back-to-back (synchronous) log calls are all delivered, in order.
  test("external logger handles rapid concurrent logs", () => {
    const id = "v3-rapid-logs";
    const collected: LogLine[] = [];
    const total = 50;

    bindInstanceLogger(id, (line) => collected.push(line));

    try {
      withInstanceLogContext(id, () => {
        // Burst of debug lines, like the ones produced during snapshot capture.
        let n = 0;
        while (n < total) {
          v3Logger({
            category: "perf",
            message: `Operation ${n}`,
            level: 2,
            auxiliary: {
              iteration: { value: String(n), type: "integer" },
            },
          });
          n += 1;
        }
      });

      // Nothing dropped; first and last lines are where they should be.
      expect(collected.length).toBe(total);
      expect(collected[0].message).toBe("Operation 0");
      expect(collected[total - 1].message).toBe("Operation 49");
    } finally {
      unbindInstanceLogger(id);
    }
  });

  // An external logger is free to drop lines; here it keeps level 0 only.
  test("external logger can filter by log level", () => {
    const id = "v3-with-filtering";
    const errorsOnly: LogLine[] = [];

    // Keep a line only when it is an error (level 0).
    bindInstanceLogger(id, (line: LogLine) => {
      if (line.level !== 0) {
        return;
      }
      errorsOnly.push(line);
    });

    try {
      withInstanceLogContext(id, () => {
        // Mixed levels, with two errors among them.
        const lines = [
          { message: "Info message", level: 1 },
          { message: "Error message", level: 0 },
          { message: "Debug message", level: 2 },
          { message: "Another error", level: 0 },
        ] as const;
        for (const { message, level } of lines) {
          v3Logger({ category: "test", message, level });
        }
      });

      // Only the two level-0 lines were kept, in emission order.
      expect(errorsOnly.length).toBe(2);
      expect(errorsOnly[0].message).toBe("Error message");
      expect(errorsOnly[1].message).toBe("Another error");
    } finally {
      unbindInstanceLogger(id);
    }
  });

  // Routing to the bound logger holds across a timer await and across
  // promise continuations started inside the context.
  test("external logger persists across async operations", async () => {
    const id = "v3-async-ops";
    const collected: LogLine[] = [];

    bindInstanceLogger(id, (line) => collected.push(line));

    // Emits a level-1 "async" line in the currently active context.
    const emit = (message: string) =>
      v3Logger({
        category: "async",
        message,
        level: 1,
      });

    try {
      await withInstanceLogContext(id, async () => {
        emit("Before async operation");

        await new Promise((resolve) => setTimeout(resolve, 50));

        emit("After async operation");

        // Two continuations scheduled side by side.
        const first = Promise.resolve().then(() => emit("Parallel operation 1"));
        const second = Promise.resolve().then(() =>
          emit("Parallel operation 2"),
        );
        await Promise.all([first, second]);
      });

      // Four lines in total; the first two are checked by content.
      expect(collected.length).toBe(4);
      expect(collected[0].message).toBe("Before async operation");
      expect(collected[1].message).toBe("After async operation");
    } finally {
      unbindInstanceLogger(id);
    }
  });
});


================================================
FILE: packages/core/tests/integration/multi-instance-logger.spec.ts
================================================
import { test, expect } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import { getV3DynamicTestConfig } from "./v3.dynamic.config.js";
import type { LogLine } from "../../lib/v3/types/public/logs.js";
import { closeV3 } from "./testUtils.js";

test.describe("V3 Multi-Instance Logger Isolation", () => {
  // Run tests serially to avoid resource exhaustion from creating many Chrome instances
  test.describe.configure({ mode: "serial" });
  // Increase timeout for stress tests that create/destroy multiple instances
  test.setTimeout(120_000);

  // Starts five V3 instances in parallel, each with its own logger, and
  // checks that every logger captured something.
  test("multiple V3 instances can be created concurrently without logger conflicts", async () => {
    const instanceCount = 5;
    const instances: V3[] = [];
    const logsByIndex: Map<number, LogLine[]> = new Map();

    try {
      // Construct every instance first and collect the pending init promises.
      const pendingInits: Promise<unknown>[] = [];
      for (let i = 0; i < instanceCount; i++) {
        const sink: LogLine[] = [];
        logsByIndex.set(i, sink);

        const config = getV3DynamicTestConfig({
          verbose: 2,
          disablePino: true,
          // Stamp every captured line with the owning instance's index.
          logger: (line: LogLine) => {
            sink.push({
              ...line,
              auxiliary: {
                ...line.auxiliary,
                index: { value: String(i), type: "integer" },
              },
            });
          },
        });

        const v3 = new V3(config);
        instances.push(v3);
        pendingInits.push(v3.init());
      }

      // Every init must succeed.
      await Promise.all(pendingInits);

      expect(instances.length).toBe(instanceCount);
      for (const instance of instances) {
        expect(instance.context).toBeDefined();
      }

      // Drive a navigation on every instance in parallel.
      await Promise.all(
        instances.map(async (instance) => {
          const page = await instance.context.awaitActivePage();
          await page.goto("about:blank");
        }),
      );

      for (let i = 0; i < instanceCount; i++) {
        const sink = logsByIndex.get(i)!;
        // Each instance's logger captured at least one line.
        expect(sink.length).toBeGreaterThan(0);

        // NOTE(review): the logger above stamps `index` on every line it
        // stores, so this predicate holds for any non-empty sink and does not
        // by itself detect lines leaked from another instance.
        const hasOwnLogs = sink.some(
          (entry) =>
            entry.auxiliary?.index?.value === String(i) ||
            entry.category === "init",
        );
        expect(hasOwnLogs).toBe(true);
      }
    } finally {
      // Tear down whatever was constructed, even if an init failed.
      await Promise.all(instances.map((instance) => closeV3(instance)));
    }
  });

  // Smoke test: two instances with separate external loggers both capture
  // log lines while operating.
  test("V3 instances with external loggers don't leak logs to each other", async () => {
    const firstLogs: LogLine[] = [];
    const secondLogs: LogLine[] = [];

    // Builds a verbose, Pino-less instance that appends its lines to `sink`.
    const makeInstance = (sink: LogLine[]) =>
      new V3(
        getV3DynamicTestConfig({
          verbose: 2,
          disablePino: true,
          logger: (line: LogLine) => sink.push(line),
        }),
      );

    const first = makeInstance(firstLogs);
    const second = makeInstance(secondLogs);

    try {
      await Promise.all([first.init(), second.init()]);

      // Give each instance something to do.
      const firstPage = await first.context.awaitActivePage();
      await firstPage.goto("about:blank");

      const secondPage = await second.context.awaitActivePage();
      await secondPage.goto("data:text/html,<h1>Instance 2</h1>");

      // Both loggers received output.
      expect(firstLogs.length).toBeGreaterThan(0);
      expect(secondLogs.length).toBeGreaterThan(0);

      const firstMessages = new Set(firstLogs.map((entry) => entry.message));
      const secondMessages = new Set(secondLogs.map((entry) => entry.message));

      // NOTE(review): the union of two sets is never smaller than either set,
      // so this assertion always passes. It is kept as-is; it does not
      // actually prove isolation between the two loggers.
      const union = new Set([...firstMessages, ...secondMessages]);
      const largest = Math.max(firstMessages.size, secondMessages.size);
      expect(union.size).toBeGreaterThanOrEqual(largest);
    } finally {
      await Promise.all([closeV3(first), closeV3(second)]);
    }
  });

  // Two instances configured without a `logger` option initialise and
  // navigate concurrently without errors.
  test("V3 instances without external loggers use shared global logger", async () => {
    // No `logger` option is passed for either instance.
    const makeInstance = () =>
      new V3(
        getV3DynamicTestConfig({
          verbose: 1,
          disablePino: true,
        }),
      );

    const first = makeInstance();
    const second = makeInstance();

    try {
      await Promise.all([first.init(), second.init()]);

      expect(first.context).toBeDefined();
      expect(second.context).toBeDefined();

      // Exercise both at once to make sure logging does not get in the way.
      const firstPage = await first.context.awaitActivePage();
      const secondPage = await second.context.awaitActivePage();

      await Promise.all([
        firstPage.goto("about:blank"),
        secondPage.goto("about:blank"),
      ]);

      // Both pages ended up where they were sent.
      expect(firstPage.url()).toContain("about:blank");
      expect(secondPage.url()).toContain("about:blank");
    } finally {
      await Promise.all([closeV3(first), closeV3(second)]);
    }
  });

  // Create, use and close an instance five times in a row; each round must
  // capture logs and finish cleanly.
  test("rapidly creating and destroying instances doesn't cause logger issues", async () => {
    const iterations = 5;
    const outcomes: boolean[] = [];

    let round = 0;
    while (round < iterations) {
      const captured: LogLine[] = [];
      const config = getV3DynamicTestConfig({
        verbose: 1, // INFO level, so there is something to verify
        disablePino: true,
        logger: (line: LogLine) => captured.push(line),
      });
      const v3 = new V3(config);

      try {
        await v3.init();
        const page = await v3.context.awaitActivePage();
        await page.goto("about:blank");
        outcomes.push(true);

        // This round's logger saw at least one line.
        expect(captured.length).toBeGreaterThan(0);
      } finally {
        await closeV3(v3);
      }
      round += 1;
    }

    // Every round got as far as recording success.
    expect(outcomes.length).toBe(iterations);
    expect(outcomes.every((ok) => ok === true)).toBe(true);
  });

  // Instances with differing verbosity / logger settings can be initialised
  // and used side by side.
  test("concurrent instance creation with mixed logger configurations", async () => {
    const instances: V3[] = [];

    // Pino disabled, no external logger, verbosity 1.
    const plain = getV3DynamicTestConfig({ verbose: 1, disablePino: true });
    // External logger that discards everything.
    const withExternal = getV3DynamicTestConfig({
      verbose: 2,
      disablePino: true,
      logger: () => {
        // External logger
      },
    });
    // No external logger, verbosity 0.
    const quiet = getV3DynamicTestConfig({ verbose: 0, disablePino: true });
    // No external logger, verbosity 2.
    const chatty = getV3DynamicTestConfig({ verbose: 2, disablePino: true });

    const configs = [plain, withExternal, quiet, chatty];

    try {
      // Construct all instances, then wait for every init together.
      const pendingInits: Promise<unknown>[] = [];
      for (const config of configs) {
        const v3 = new V3(config);
        instances.push(v3);
        pendingInits.push(v3.init());
      }
      await Promise.all(pendingInits);

      expect(instances.length).toBe(configs.length);
      for (const instance of instances) {
        expect(instance.context).toBeDefined();
      }

      // Each instance can navigate regardless of its logger configuration.
      const navigate = async (instance: V3) => {
        const page = await instance.context.awaitActivePage();
        await page.goto("about:blank");
        expect(page.url()).toContain("about:blank");
      };
      await Promise.all(instances.map(navigate));
    } finally {
      await Promise.all(instances.map((instance) => closeV3(instance)));
    }
  });

  // Verifies that an instance which logged during init ends up in the
  // UNINITIALIZED state after being closed.
  //
  // The body is wrapped in try/finally so the browser instance is still shut
  // down when init or an early assertion fails; previously such a failure
  // skipped `closeV3` entirely and leaked the instance.
  test("V3 instance logger is properly cleaned up on close", async () => {
    const logs: LogLine[] = [];
    const v3 = new V3(
      getV3DynamicTestConfig({
        verbose: 2,
        disablePino: true,
        logger: (line: LogLine) => logs.push(line),
      }),
    );

    // Tracks whether the explicit close below was attempted, so the
    // `finally` block never closes the same instance twice.
    let closeAttempted = false;

    try {
      await v3.init();
      const initialLogCount = logs.length;
      expect(initialLogCount).toBeGreaterThan(0);

      closeAttempted = true;
      await closeV3(v3);

      // After close, the instance should not generate new logs
      // (This is hard to test directly, but we can verify the instance is closed)
      expect(v3["state"].kind).toBe("UNINITIALIZED");
    } finally {
      if (!closeAttempted) {
        await closeV3(v3);
      }
    }
  });

  // Follows one instance through construct -> init -> navigate and checks
  // the captured log lines at each stage.
  test("logger works correctly across instance lifecycle", async () => {
    const captured: LogLine[] = [];
    const config = getV3DynamicTestConfig({
      verbose: 2,
      disablePino: true,
      logger: (line: LogLine) => captured.push(line),
    });
    const v3 = new V3(config);

    try {
      // Constructing the instance alone must not log anything.
      expect(captured.length).toBe(0);

      // Init produces at least one line.
      await v3.init();
      const countAfterInit = captured.length;
      expect(countAfterInit).toBeGreaterThan(0);

      // Navigation never reduces the number of captured lines.
      const page = await v3.context.awaitActivePage();
      await page.goto("data:text/html,<h1>Test</h1>");
      const countAfterNavigation = captured.length;
      expect(countAfterNavigation).toBeGreaterThanOrEqual(countAfterInit);

      // At least one line belongs to the "init" category.
      const initCount = captured.filter(
        (entry) => entry.category === "init",
      ).length;
      expect(initCount).toBeGreaterThan(0);

      // Every line carries the required fields.
      captured.forEach((entry) => {
        expect(entry.category).toBeDefined();
        expect(entry.message).toBeDefined();
        expect(typeof entry.level).toBe("number");
      });
    } finally {
      await closeV3(v3);
    }
  });

  // Initialises several instances one after another, navigates them all in
  // parallel to distinct data: URLs, then checks that each page landed on
  // its own URL and each logger captured output.
  //
  // The target URLs are derived from `instanceCount` rather than hard-coded,
  // so changing the count can no longer leave `urls[i]` undefined.
  test("multiple instances can navigate concurrently without logger interference", async () => {
    const instanceCount = 3;
    const instances: V3[] = [];
    const instanceLogs: Map<number, LogLine[]> = new Map();

    try {
      // Create instances (sequentially; only the navigation is concurrent)
      for (let i = 0; i < instanceCount; i++) {
        const logs: LogLine[] = [];
        instanceLogs.set(i, logs);

        const v3 = new V3(
          getV3DynamicTestConfig({
            verbose: 1,
            disablePino: true,
            logger: (line: LogLine) => logs.push(line),
          }),
        );

        // Register before init so the instance is closed even if init fails.
        instances.push(v3);
        await v3.init();
      }

      // One distinct URL per instance: "Page 1", "Page 2", ...
      const urls = Array.from(
        { length: instanceCount },
        (_, i) => `data:text/html,<h1>Page ${i + 1}</h1>`,
      );

      // Navigate all instances concurrently to different URLs
      await Promise.all(
        instances.map(async (instance, i) => {
          const page = await instance.context.awaitActivePage();
          await page.goto(urls[i]);
        }),
      );

      // Verify each instance navigated to the correct URL
      for (let i = 0; i < instanceCount; i++) {
        const page = await instances[i].context.awaitActivePage();
        expect(page.url()).toContain(`Page ${i + 1}`);
      }

      // Each instance should have its own logs
      for (let i = 0; i < instanceCount; i++) {
        const logs = instanceLogs.get(i)!;
        expect(logs.length).toBeGreaterThan(0);
      }
    } finally {
      await Promise.all(instances.map((instance) => closeV3(instance)));
    }
  });
});


================================================
FILE: packages/core/tests/integration/nested-div.spec.ts
================================================
import { test, expect } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import { captureHybridSnapshot } from "../../lib/v3/understudy/a11y/snapshot/index.js";
import { v3TestConfig } from "./v3.config.js";

// Regression suite: captureHybridSnapshot() must resolve on the nested-div
// eval site (see the CDP error quoted in the suite title).
test.describe("tests captureHybridSnapshot() does not break due to -32000 Failed to convert response to JSON: CBOR: stack limit exceeded", () => {
  let v3: V3;

  // A fresh, initialised V3 instance for every test.
  test.beforeEach(async () => {
    v3 = new V3(v3TestConfig);
    await v3.init();
  });

  // Best-effort teardown: a rejected close() is ignored.
  test.afterEach(async () => {
    await v3?.close?.().catch(() => {});
  });

  test("captureHybridSnapshot does not throw", async () => {
    const [firstPage] = v3.context.pages();
    const nestedDivUrl =
      "https://browserbase.github.io/stagehand-eval-sites/sites/nested-div/";

    await firstPage.goto(nestedDivUrl);

    // The snapshot promise must settle successfully with a defined value.
    const snapshot = captureHybridSnapshot(firstPage);
    await expect(snapshot).resolves.toBeDefined();
  });
});


================================================
FILE: packages/core/tests/integration/page-addInitScript.spec.ts
================================================
import { test, expect } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import { v3TestConfig } from "./v3.config.js";
import { V3Context } from "../../lib/v3/understudy/context.js";

const EXAMPLE_URL = "https://example.com";

// Exercises page.addInitScript with function sources, string sources, and
// function sources that receive an argument.
test.describe("page.addInitScript", () => {
  let v3: V3;
  let ctx: V3Context;

  // A fresh V3 instance (and its context) for every test.
  test.beforeEach(async () => {
    v3 = new V3(v3TestConfig);
    await v3.init();
    ctx = v3.context;
  });

  // Best-effort teardown: a rejected close() is ignored.
  test.afterEach(async () => {
    await v3?.close?.().catch(() => {});
  });

  test("runs scripts on real network navigations", async () => {
    type InitWindow = { __fromPageInit?: string };
    const activePage = await ctx.awaitActivePage();

    // Registered before navigating; the script leaves a marker on window.
    await activePage.addInitScript(() => {
      const win = window as unknown as InitWindow;
      win.__fromPageInit = "page-level";
    });

    await activePage.goto(EXAMPLE_URL, { waitUntil: "domcontentloaded" });

    const marker = await activePage.evaluate(
      () => (window as unknown as InitWindow).__fromPageInit,
    );

    expect(marker).toBe("page-level");
  });

  test("scopes scripts to the page only", async () => {
    const pageOne = await ctx.awaitActivePage();

    // String source: tags <html> with a data attribute once the DOM exists.
    const scopeScript = `
      (function () {
        function markScope() {
          var root = document.documentElement;
          if (!root) return;
          root.dataset.scopeWitness = "page-one";
        }
        if (document.readyState === "loading") {
          document.addEventListener("DOMContentLoaded", markScope, {
            once: true,
          });
        } else {
          markScope();
        }
      })();
    `;
    await pageOne.addInitScript(scopeScript);

    const navOptions = { waitUntil: "domcontentloaded" } as const;
    await pageOne.goto(`${EXAMPLE_URL}/?page=one`, navOptions);

    // The second page never had the script registered on it.
    const pageTwo = await ctx.newPage();
    await pageTwo.goto(`${EXAMPLE_URL}/?page=two`, navOptions);

    const readWitness = () =>
      document.documentElement.dataset.scopeWitness ?? "missing";
    const witnessOne = await pageOne.evaluate(readWitness);
    const witnessTwo = await pageTwo.evaluate(readWitness);

    expect(witnessOne).toBe("page-one");
    expect(witnessTwo).toBe("missing");
  });

  test("supports passing arguments to function sources", async () => {
    const activePage = await ctx.awaitActivePage();
    const payload = { greeting: "hi", nested: { count: 1 } };

    // Function source with one argument: stores the argument, JSON-encoded,
    // on <html> once the DOM exists.
    const writePayload = ((received) => {
      const store = () => {
        const html = document.documentElement;
        if (!html) return;
        html.dataset.pageInitPayload = JSON.stringify(received);
      };
      if (document.readyState !== "loading") {
        store();
      } else {
        document.addEventListener("DOMContentLoaded", store, {
          once: true,
        });
      }
    }) as (arg: typeof payload) => void;
    await activePage.addInitScript(writePayload, payload);

    await activePage.goto(`${EXAMPLE_URL}/?page=payload`, {
      waitUntil: "domcontentloaded",
    });

    const roundTripped = await activePage.evaluate(() => {
      const serialized = document.documentElement.dataset.pageInitPayload;
      return serialized ? JSON.parse(serialized) : undefined;
    });

    expect(roundTripped).toEqual(payload);
  });
});


================================================
FILE: packages/core/tests/integration/page-console.spec.ts
================================================
import { test, expect } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import { v3TestConfig } from "./v3.config.js";

// Checks that console output produced inside the page is surfaced through
// the page's "console" event.
test.describe("Page console events", () => {
  let v3: V3;

  // A fresh, initialised V3 instance for every test.
  test.beforeEach(async () => {
    v3 = new V3(v3TestConfig);
    await v3.init();
  });

  // Best-effort teardown: a rejected close() is ignored.
  test.afterEach(async () => {
    await v3?.close?.().catch(() => {});
  });

  test("captures console messages emitted by the page", async () => {
    // Skipped when STAGEHAND_BROWSER_TARGET selects Browserbase (see TODO).
    const target = (
      process.env.STAGEHAND_BROWSER_TARGET ?? "local"
    ).toLowerCase();
    if (target === "browserbase") {
      console.warn(
        "[page-console] TODO: re-enable once BB cloud browsers support Runtime.consoleAPICalled events again. See https://browserbase.slack.com/archives/C06U6CM7YS1/p1769483322836589",
      );
      test.skip(
        true,
        "TODO: re-enable once BB cloud browsers support Runtime.consoleAPICalled events again.",
      );
    }

    const [page] = v3.context.pages();
    const seen: Array<{ type: string; text: string }> = [];

    // Record every console message as a plain { type, text } pair.
    page.on("console", (msg) => {
      seen.push({ type: msg.type(), text: msg.text() });
    });

    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/iframe-hn/",
    );

    // Emit one log and one error from inside the page.
    await page.evaluate(() => {
      console.log("stagehand console", { ok: true });
      console.error("stagehand console error");
    });

    const sawLog = () => seen.some((entry) => entry.type === "log");
    const sawError = () =>
      seen.some(
        (entry) => entry.type === "error" && entry.text.includes("error"),
      );

    // Poll every 50 ms, for at most 5 s, until both messages have arrived.
    // Running out of time is not an error here; the assertions below decide.
    const deadline = Date.now() + 5000;
    while (Date.now() < deadline && !(sawLog() && sawError())) {
      await new Promise((resolve) => setTimeout(resolve, 50));
    }

    expect(seen.length).toBeGreaterThanOrEqual(2);
    expect(sawLog()).toBeTruthy();
    expect(sawError()).toBeTruthy();
  });
});


================================================
FILE: packages/core/tests/integration/page-drag-and-drop.spec.ts
================================================
import { test, expect } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import { v3TestConfig } from "./v3.config.js";

// Exercises Page.dragAndDrop() against small inline HTML fixtures: plain
// drops, the steps/delay/button options, the returned xpaths, and repeated
// drags on one page.
test.describe("Page.dragAndDrop() - dragging elements", () => {
  let v3: V3;

  /** The fields these tests read from a getLocationForSelector() result. */
  type Box = { x: number; y: number; width: number; height: number };

  /** Returns the midpoint of a bounding box. */
  const centerOf = (box: Box) => ({
    x: box.x + box.width / 2,
    y: box.y + box.height / 2,
  });

  /** Wraps an HTML document in a percent-encoded data: URL. */
  const toDataUrl = (html: string) =>
    "data:text/html," + encodeURIComponent(html);

  // A fresh, initialised V3 instance for every test.
  test.beforeEach(async () => {
    v3 = new V3(v3TestConfig);
    await v3.init();
  });

  // Best-effort teardown: a rejected close() is ignored.
  test.afterEach(async () => {
    await v3?.close?.().catch(() => {});
  });

  test("drags and drops element to target zone", async () => {
    const page = v3.context.pages()[0];

    await page.goto(
      toDataUrl(`
          <!doctype html>
          <html>
          <head>
            <style>
              body { font-family: Arial; margin: 0; padding: 20px; }
              .container { display: flex; gap: 20px; }
              .source-box {
                width: 150px;
                height: 100px;
                background: lightblue;
                border: 2px solid blue;
                display: flex;
                align-items: center;
                justify-content: center;
                cursor: move;
                user-select: none;
              }
              .drop-zone {
                width: 200px;
                height: 150px;
                background: lightyellow;
                border: 2px dashed orange;
                display: flex;
                align-items: center;
                justify-content: center;
              }
              .result { margin-top: 20px; font-weight: bold; }
            </style>
          </head>
          <body>
            <div class="container">
              <div id="source" class="source-box" draggable="true">Drag Me</div>
              <div id="dropZone" class="drop-zone">Drop Here</div>
            </div>
            <div id="result" class="result">Status: Waiting</div>
            <script>
              const source = document.getElementById('source');
              const dropZone = document.getElementById('dropZone');
              const result = document.getElementById('result');
              
              source.addEventListener('dragstart', (e) => {
                e.dataTransfer.effectAllowed = 'move';
                e.dataTransfer.setData('text/plain', 'Dragged Element');
              });
              
              dropZone.addEventListener('dragover', (e) => {
                e.preventDefault();
                e.dataTransfer.dropEffect = 'move';
                dropZone.style.background = 'lightgreen';
              });
              
              dropZone.addEventListener('dragleave', () => {
                dropZone.style.background = 'lightyellow';
              });
              
              dropZone.addEventListener('drop', (e) => {
                e.preventDefault();
                result.textContent = 'Status: DROP SUCCESSFUL';
                result.style.color = 'green';
                dropZone.style.background = 'lightgreen';
              });
            </script>
          </body>
          </html>
        `),
    );

    // Drag from the centre of the source to the centre of the drop zone.
    const frame = page.frames()[0];
    const from = centerOf(await frame.getLocationForSelector("#source"));
    const to = centerOf(await frame.getLocationForSelector("#dropZone"));

    await page.dragAndDrop(from.x, from.y, to.x, to.y);

    // Give the page 100 ms to run its drop handlers.
    await page.evaluate(() => new Promise((r) => setTimeout(r, 100)));

    // The drop handler rewrites the status line.
    const resultText = await page.evaluate(
      () => document.getElementById("result")?.textContent,
    );
    expect(resultText).toContain("DROP SUCCESSFUL");
  });

  test("drag and drop with steps parameter", async () => {
    const page = v3.context.pages()[0];

    await page.goto(
      toDataUrl(`
          <!doctype html>
          <html>
          <head>
            <style>
              body { margin: 0; padding: 20px; }
              .box {
                width: 100px;
                height: 100px;
                background: lightblue;
                margin: 20px;
                cursor: move;
              }
              .target {
                width: 200px;
                height: 200px;
                background: lightyellow;
                margin: 20px;
                border: 2px dashed orange;
              }
            </style>
          </head>
          <body>
            <div id="box" class="box" draggable="true"></div>
            <div id="target" class="target"></div>
            <div id="status">Not dropped</div>
            <script>
              document.getElementById('box').addEventListener('dragstart', (e) => {
                e.dataTransfer.effectAllowed = 'move';
              });
              document.getElementById('target').addEventListener('drop', (e) => {
                e.preventDefault();
                document.getElementById('status').textContent = 'Dropped with steps';
              });
              document.getElementById('target').addEventListener('dragover', (e) => {
                e.preventDefault();
              });
            </script>
          </body>
          </html>
        `),
    );

    const frame = page.frames()[0];
    const from = centerOf(await frame.getLocationForSelector("#box"));
    const to = centerOf(await frame.getLocationForSelector("#target"));

    // Same drag, requested with steps: 5.
    await page.dragAndDrop(from.x, from.y, to.x, to.y, { steps: 5 });

    // Give the page 100 ms to run its drop handlers.
    await page.evaluate(() => new Promise((r) => setTimeout(r, 100)));

    const status = await page.evaluate(
      () => document.getElementById("status")?.textContent,
    );
    expect(status).toContain("Dropped");
  });

  test("drag and drop with delay between steps", async () => {
    const page = v3.context.pages()[0];

    await page.goto(
      toDataUrl(`
          <!doctype html>
          <html>
          <head>
            <style>
              body { margin: 0; padding: 20px; }
              #dragItem { width: 80px; height: 80px; background: lightcoral; cursor: move; }
              #dropArea { width: 150px; height: 150px; background: lightgray; margin-top: 20px; }
            </style>
          </head>
          <body>
            <div id="dragItem" draggable="true"></div>
            <div id="dropArea"></div>
            <div id="complete">false</div>
            <script>
              const item = document.getElementById('dragItem');
              const area = document.getElementById('dropArea');
              const complete = document.getElementById('complete');
              
              item.addEventListener('dragstart', (e) => {
                e.dataTransfer.effectAllowed = 'move';
              });
              
              area.addEventListener('drop', (e) => {
                e.preventDefault();
                complete.textContent = 'true';
              });
              
              area.addEventListener('dragover', (e) => {
                e.preventDefault();
              });
            </script>
          </body>
          </html>
        `),
    );

    const frame = page.frames()[0];
    const from = centerOf(await frame.getLocationForSelector("#dragItem"));
    const to = centerOf(await frame.getLocationForSelector("#dropArea"));

    // Same drag, requested with steps: 3 and delay: 50.
    await page.dragAndDrop(from.x, from.y, to.x, to.y, {
      steps: 3,
      delay: 50,
    });

    // Give the page 100 ms to run its drop handlers.
    await page.evaluate(() => new Promise((r) => setTimeout(r, 100)));

    const isComplete = await page.evaluate(
      () => document.getElementById("complete")?.textContent === "true",
    );
    expect(isComplete).toBe(true);
  });

  test("drag and drop returns xpath when requested", async () => {
    const page = v3.context.pages()[0];

    await page.goto(
      toDataUrl(`
          <!doctype html>
          <html>
          <head>
            <style>
              body { margin: 20px; }
              #source { width: 100px; height: 100px; background: blue; cursor: move; }
              #target { width: 150px; height: 150px; background: green; margin-top: 20px; }
            </style>
          </head>
          <body>
            <div id="source" draggable="true"></div>
            <div id="target"></div>
            <script>
              document.getElementById('source').addEventListener('dragstart', (e) => {
                e.dataTransfer.effectAllowed = 'move';
              });
              document.getElementById('target').addEventListener('drop', (e) => {
                e.preventDefault();
              });
              document.getElementById('target').addEventListener('dragover', (e) => {
                e.preventDefault();
              });
            </script>
          </body>
          </html>
        `),
    );

    const frame = page.frames()[0];
    const from = centerOf(await frame.getLocationForSelector("#source"));
    const to = centerOf(await frame.getLocationForSelector("#target"));

    const [fromXpath, toXpath] = await page.dragAndDrop(
      from.x,
      from.y,
      to.x,
      to.y,
      { returnXpath: true },
    );

    // Both ends of the drag must come back as non-empty xpath strings.
    expect(typeof fromXpath).toBe("string");
    expect(typeof toXpath).toBe("string");
    expect(fromXpath.length).toBeGreaterThan(0);
    expect(toXpath.length).toBeGreaterThan(0);
  });

  test("drag and drop without returnXpath returns empty strings", async () => {
    const page = v3.context.pages()[0];

    await page.goto(
      toDataUrl(`
          <!doctype html>
          <html>
          <head>
            <style>
              body { margin: 20px; }
              #item1 { width: 80px; height: 80px; background: red; cursor: move; }
              #item2 { width: 100px; height: 100px; background: yellow; margin-top: 20px; }
            </style>
          </head>
          <body>
            <div id="item1" draggable="true"></div>
            <div id="item2"></div>
            <script>
              document.getElementById('item1').addEventListener('dragstart', (e) => {
                e.dataTransfer.effectAllowed = 'move';
              });
              document.getElementById('item2').addEventListener('drop', (e) => {
                e.preventDefault();
              });
              document.getElementById('item2').addEventListener('dragover', (e) => {
                e.preventDefault();
              });
            </script>
          </body>
          </html>
        `),
    );

    const frame = page.frames()[0];
    const from = centerOf(await frame.getLocationForSelector("#item1"));
    const to = centerOf(await frame.getLocationForSelector("#item2"));

    const [fromXpath, toXpath] = await page.dragAndDrop(
      from.x,
      from.y,
      to.x,
      to.y,
    );

    // With no returnXpath option both entries are expected to be empty.
    expect(fromXpath).toBe("");
    expect(toXpath).toBe("");
  });

  // NOTE: despite the title, only the left button is exercised here, and the
  // fixture's drop handler writes "left" regardless of the button used.
  test("drag and drop with different mouse buttons", async () => {
    const page = v3.context.pages()[0];

    await page.goto(
      toDataUrl(`
          <!doctype html>
          <html>
          <head>
            <style>
              body { margin: 20px; }
              .draggable { width: 100px; height: 100px; background: lightblue; cursor: move; }
              .drop-area { width: 200px; height: 200px; background: lightgray; margin-top: 20px; }
            </style>
          </head>
          <body>
            <div id="source" class="draggable" draggable="true"></div>
            <div id="target" class="drop-area"></div>
            <div id="buttonUsed">none</div>
            <script>
              document.getElementById('source').addEventListener('dragstart', (e) => {
                e.dataTransfer.effectAllowed = 'move';
              });
              document.getElementById('target').addEventListener('drop', (e) => {
                e.preventDefault();
                document.getElementById('buttonUsed').textContent = 'left';
              });
              document.getElementById('target').addEventListener('dragover', (e) => {
                e.preventDefault();
              });
            </script>
          </body>
          </html>
        `),
    );

    const frame = page.frames()[0];
    const from = centerOf(await frame.getLocationForSelector("#source"));
    const to = centerOf(await frame.getLocationForSelector("#target"));

    // Explicitly request the left button.
    await page.dragAndDrop(from.x, from.y, to.x, to.y, { button: "left" });

    // Give the page 100 ms to run its drop handlers.
    await page.evaluate(() => new Promise((r) => setTimeout(r, 100)));

    const buttonUsed = await page.evaluate(
      () => document.getElementById("buttonUsed")?.textContent,
    );
    expect(buttonUsed).toBe("left");
  });

  test("multiple sequential drag and drops", async () => {
    const page = v3.context.pages()[0];

    await page.goto(
      toDataUrl(`
          <!doctype html>
          <html>
          <head>
            <style>
              body { margin: 20px; font-family: Arial; }
              .item { width: 80px; height: 80px; background: lightblue; margin: 10px; cursor: move; display: inline-block; }
              .zone { width: 150px; height: 150px; background: lightyellow; margin: 10px; display: inline-block; border: 2px dashed orange; }
              #log { margin-top: 20px; }
            </style>
          </head>
          <body>
            <div id="item1" class="item" draggable="true">Item 1</div>
            <div id="zone1" class="zone"></div>
            <div id="item2" class="item" draggable="true">Item 2</div>
            <div id="zone2" class="zone"></div>
            <div id="log">Drops: 0</div>
            <script>
              let dropCount = 0;
              const items = ['item1', 'item2'];
              const zones = ['zone1', 'zone2'];
              
              items.forEach(id => {
                document.getElementById(id).addEventListener('dragstart', (e) => {
                  e.dataTransfer.effectAllowed = 'move';
                });
              });
              
              zones.forEach(id => {
                const zone = document.getElementById(id);
                zone.addEventListener('drop', (e) => {
                  e.preventDefault();
                  dropCount++;
                  document.getElementById('log').textContent = 'Drops: ' + dropCount;
                });
                zone.addEventListener('dragover', (e) => {
                  e.preventDefault();
                });
              });
            </script>
          </body>
          </html>
        `),
    );

    const frame = page.frames()[0];

    // First drag: item1 -> zone1.
    const from1 = centerOf(await frame.getLocationForSelector("#item1"));
    const to1 = centerOf(await frame.getLocationForSelector("#zone1"));

    await page.dragAndDrop(from1.x, from1.y, to1.x, to1.y);

    await page.evaluate(() => new Promise((r) => setTimeout(r, 100)));

    let dropCountText = await page.evaluate(
      () => document.getElementById("log")?.textContent,
    );
    expect(dropCountText).toContain("Drops: 1");

    // Second drag: item2 -> zone2. Locations are read only now, after the
    // first drag has finished.
    const from2 = centerOf(await frame.getLocationForSelector("#item2"));
    const to2 = centerOf(await frame.getLocationForSelector("#zone2"));

    await page.dragAndDrop(from2.x, from2.y, to2.x, to2.y);

    // Give the page 100 ms to run its drop handlers.
    await page.evaluate(() => new Promise((r) => setTimeout(r, 100)));

    dropCountText = await page.evaluate(
      () => document.getElementById("log")?.textContent,
    );
    expect(dropCountText).toContain("Drops: 2");
  });
});


================================================
FILE: packages/core/tests/integration/page-extra-http-headers.spec.ts
================================================
import { test, expect } from "@playwright/test";
import type { Protocol } from "devtools-protocol";
import { V3 } from "../../lib/v3/v3.js";
import { v3TestConfig } from "./v3.config.js";
import { closeV3 } from "./testUtils.js";

const TEST_URL =
  "https://browserbase.github.io/stagehand-eval-sites/sites/example/";

// Verifies page.setExtraHTTPHeaders() by observing the headers carried on the
// Document request that the next navigation to TEST_URL sends.
test.describe("page.setExtraHTTPHeaders", () => {
  let v3: V3;

  /** Subset of the page's main CDP session that these tests drive directly. */
  type MainSession = {
    send: (method: string, params?: unknown) => Promise<unknown>;
    on: (event: string, handler: (params: unknown) => void) => void;
    off: (event: string, handler: (params: unknown) => void) => void;
  };

  /** Reaches through the page object to its `mainSession` member. */
  const mainSessionOf = (page: unknown): MainSession =>
    (page as { mainSession: MainSession }).mainSession;

  /**
   * Resolves with the first `Network.requestWillBeSent` event of type
   * "Document" whose URL starts with TEST_URL, and rejects once `timeoutMs`
   * elapses without one. The listener is detached on both outcomes.
   * The listener is attached synchronously, so call this before navigating.
   */
  const waitForDocumentRequest = (session: MainSession, timeoutMs = 5000) =>
    new Promise<Protocol.Network.RequestWillBeSentEvent>((resolve, reject) => {
      const handler = (params: unknown) => {
        const evt = params as Protocol.Network.RequestWillBeSentEvent;
        if (evt.type !== "Document") return;
        const url = String(evt.request?.url ?? "");
        if (!url.startsWith(TEST_URL)) return;
        clearTimeout(timeout);
        session.off("Network.requestWillBeSent", handler);
        resolve(evt);
      };

      const timeout = setTimeout(() => {
        session.off("Network.requestWillBeSent", handler);
        reject(new Error("Timed out waiting for request"));
      }, timeoutMs);

      session.on("Network.requestWillBeSent", handler);
    });

  /** Returns the request's headers with lower-cased names and string values. */
  const lowerCasedHeaders = (
    evt: Protocol.Network.RequestWillBeSentEvent,
  ): Record<string, string> =>
    Object.fromEntries(
      Object.entries(evt.request.headers ?? {}).map(([key, value]) => [
        key.toLowerCase(),
        String(value),
      ]),
    );

  // A fresh, initialised V3 instance for every test.
  test.beforeEach(async () => {
    v3 = new V3(v3TestConfig);
    await v3.init();
  });

  test.afterEach(async () => {
    await closeV3(v3);
  });

  test("applies headers to navigation requests", async () => {
    const ctx = v3.context;
    const page = await ctx.awaitActivePage();

    await page.setExtraHTTPHeaders({ "x-page-header": "from-page" });

    const session = mainSessionOf(page);
    await session.send("Network.enable");

    // Awaiting both together means a failed navigation cannot leave the
    // capture promise to reject, unhandled, when its timeout fires later.
    const [request] = await Promise.all([
      waitForDocumentRequest(session),
      page.goto(TEST_URL, { waitUntil: "domcontentloaded" }),
    ]);

    const headers = lowerCasedHeaders(request);
    expect(headers["x-page-header"]).toBe("from-page");
  });

  test("updated headers replace previous ones", async () => {
    const ctx = v3.context;
    const page = await ctx.awaitActivePage();

    const session = mainSessionOf(page);
    await session.send("Network.enable");

    // First navigation is sent with the initial header set.
    await page.setExtraHTTPHeaders({ "x-first": "yes" });
    await page.goto(TEST_URL, { waitUntil: "domcontentloaded" });

    // Swap in a different header set, then capture the next navigation.
    await page.setExtraHTTPHeaders({ "x-second": "yes" });

    const [request] = await Promise.all([
      waitForDocumentRequest(session),
      page.goto(TEST_URL, { waitUntil: "domcontentloaded" }),
    ]);

    const headers = lowerCasedHeaders(request);
    expect(headers["x-second"]).toBe("yes");
    expect(headers["x-first"]).toBeUndefined();
  });
});


================================================
FILE: packages/core/tests/integration/page-goto-response.spec.ts
================================================
import { test, expect } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import { v3TestConfig } from "./v3.config.js";

// Checks what Page.goto() returns: a response object for a network
// navigation, and null for a data: URL.
test.describe("Page.goto() response surface", () => {
  let v3: V3;

  // A fresh, initialised V3 instance for every test.
  test.beforeEach(async () => {
    v3 = new V3(v3TestConfig);
    await v3.init();
  });

  // Best-effort teardown: a rejected close() is ignored.
  test.afterEach(async () => {
    await v3?.close?.().catch(() => {});
  });

  test("returns a response object for network navigations", async () => {
    const page = v3.context.pages()[0];

    const response = await page.goto("https://example.com");

    expect(response).not.toBeNull();
    // expect() does not narrow the type, so guard once here instead of
    // mixing `response!` and unguarded `response` in the lines below.
    if (response == null) {
      throw new Error(
        "page.goto() returned no response for a network navigation",
      );
    }

    expect(response.status()).toBe(200);
    expect(response.ok()).toBeTruthy();

    const headers = await response.headersArray();
    expect(headers.length).toBeGreaterThan(0);

    const body = await response.text();
    expect(body).toContain("Example Domain");

    // This test expects finished() to resolve to null.
    const finished = await response.finished();
    expect(finished).toBeNull();
  });

  test("falls back to null for data URLs", async () => {
    const page = v3.context.pages()[0];

    const response = await page.goto(
      "data:text/html,<html><body data-testid='fallback'>inline</body></html>",
    );

    expect(response).toBeNull();
  });
});


================================================
FILE: packages/core/tests/integration/page-hover.spec.ts
================================================
import { test, expect } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import { v3TestConfig } from "./v3.config.js";

test.describe("Page.hover() - mouse hover at coordinates", () => {
  let v3: V3;

  // Build and initialise a new V3 instance ahead of every test.
  test.beforeEach(async () => {
    const instance = new V3(v3TestConfig);
    v3 = instance;
    await instance.init();
  });

  // Best-effort teardown: tolerates a missing instance and ignores close() rejections.
  test.afterEach(async () => {
    const ignoreFailure = (): void => {};
    await v3?.close?.().catch(ignoreFailure);
  });

  // A hover inside the target's bounds should fire its inline onmouseover handler.
  test("hover triggers mouseover event at coordinates", async () => {
    const markup = `<!doctype html><html><body style="margin: 0; padding: 0;">
            <div id="target" 
                 style="position: absolute; top: 100px; left: 100px; width: 200px; height: 200px; background: lightblue;"
                 onmouseover="this.dataset.hovered='true'"
                 onmouseout="this.dataset.hovered='false'">
              Hover Me
            </div>
          </body></html>`;
    const page = v3.context.pages()[0];
    await page.goto("data:text/html," + encodeURIComponent(markup));

    // Reads the flag that the inline handlers write onto the target's dataset.
    const isTargetHovered = () =>
      page.evaluate(
        () => document.getElementById("target")?.dataset.hovered === "true",
      );

    // Before any hover the flag must not be set.
    expect(await isTargetHovered()).toBe(false);

    // (200, 200) is the centre of the 200x200 box placed at (100, 100).
    await page.hover(200, 200);

    // The mouseover handler should now have flipped the flag.
    expect(await isTargetHovered()).toBe(true);
  });

  // Hovering should trigger mouseover on the button but never its onclick handler.
  test("hover moves mouse without clicking", async () => {
    const markup = `<!doctype html><html><body style="margin: 0; padding: 0;">
            <button id="btn" 
                    style="position: absolute; top: 100px; left: 100px; width: 200px; height: 100px;"
                    onclick="this.dataset.clicked='true'"
                    onmouseover="this.dataset.hovered='true'">
              Click Me
            </button>
          </body></html>`;
    const page = v3.context.pages()[0];
    await page.goto("data:text/html," + encodeURIComponent(markup));

    // (200, 150) lies inside the button, which spans x 100-300 and y 100-200.
    await page.hover(200, 150);

    // Both inline handlers record themselves on the button's dataset.
    const { hovered, clicked } = await page.evaluate(() => {
      const flags = document.getElementById("btn")?.dataset;
      return {
        hovered: flags?.hovered === "true",
        clicked: flags?.clicked === "true",
      };
    });

    expect(hovered).toBe(true);
    expect(clicked).toBe(false);
  });

  // With returnXpath enabled, hover() should report the element under the pointer.
  test("hover returns xpath when requested", async () => {
    const markup = `<!doctype html><html><body style="margin: 0; padding: 0;">
            <div id="target" style="position: absolute; top: 0px; left: 400px; width: 300px; height: 100px; background: blue;">
              Target element
            </div>
            <p style="position: absolute; top: 200px; left: 0px;">Content below</p>
          </body></html>`;
    const page = v3.context.pages()[0];
    await page.goto("data:text/html," + encodeURIComponent(markup));

    // (550, 50) falls inside the div, which spans x 400-700 and y 0-100.
    const hoveredXpath = await page.hover(550, 50, { returnXpath: true });

    // Expect a non-empty string back...
    expect(typeof hoveredXpath).toBe("string");
    expect(hoveredXpath.length).toBeGreaterThan(0);
    // ...that mentions the div (or its id).
    const normalised = hoveredXpath.toLowerCase();
    expect(normalised).toMatch(/div|target/);
  });

  // When no xpath is requested, hover() is expected to return "".
  test("hover without returnXpath returns empty string", async () => {
    const markup = `<!doctype html><html><body style="margin: 0; padding: 0;">
            <div style="width: 100px; height: 100px; background: lightblue;">Content</div>
          </body></html>`;
    const page = v3.context.pages()[0];
    await page.goto("data:text/html," + encodeURIComponent(markup));

    // No options object is passed, so returnXpath is not set.
    const returned = await page.hover(50, 50);

    expect(returned).toBe("");
  });

  // The element's :hover rule swaps red for green; a hover should activate it.
  test("hover triggers CSS :hover styles", async () => {
    const markup = `<!doctype html><html>
          <head>
            <style>
              #hoverable {
                position: absolute;
                top: 100px;
                left: 100px;
                width: 200px;
                height: 200px;
                background: red;
              }
              #hoverable:hover {
                background: green;
              }
            </style>
          </head>
          <body style="margin: 0; padding: 0;">
            <div id="hoverable">Hover to change color</div>
          </body></html>`;
    const page = v3.context.pages()[0];
    await page.goto("data:text/html," + encodeURIComponent(markup));

    // Returns the computed background colour of the #hoverable box.
    const readBackground = () =>
      page.evaluate(() => {
        const box = document.getElementById("hoverable");
        return getComputedStyle(box!).backgroundColor;
      });

    // Unhovered: the base rule applies (red).
    expect(await readBackground()).toBe("rgb(255, 0, 0)");

    // (200, 200) is inside the box at (100, 100) sized 200x200.
    await page.hover(200, 200);

    // Hovered: the :hover rule applies (green).
    expect(await readBackground()).toBe("rgb(0, 128, 0)");
  });

  // Moving the hover from one box to another should fire mouseout on the first
  // and mouseover on the second.
  test("multiple hovers move the mouse correctly", async () => {
    const markup = `<!doctype html><html><body style="margin: 0; padding: 0;">
            <div id="box1" 
                 style="position: absolute; top: 0; left: 0; width: 100px; height: 100px; background: red;"
                 onmouseover="this.dataset.hovered='true'"
                 onmouseout="this.dataset.hovered='false'">
              Box 1
            </div>
            <div id="box2" 
                 style="position: absolute; top: 0; left: 200px; width: 100px; height: 100px; background: blue;"
                 onmouseover="this.dataset.hovered='true'"
                 onmouseout="this.dataset.hovered='false'">
              Box 2
            </div>
          </body></html>`;
    const page = v3.context.pages()[0];
    await page.goto("data:text/html," + encodeURIComponent(markup));

    // Snapshot of the hovered flag each box keeps on its dataset.
    const readHoverFlags = () =>
      page.evaluate(() => ({
        box1: document.getElementById("box1")?.dataset.hovered === "true",
        box2: document.getElementById("box2")?.dataset.hovered === "true",
      }));

    // (50, 50) is inside box1 only.
    await page.hover(50, 50);
    const afterFirstHover = await readHoverFlags();

    expect(afterFirstHover.box1).toBe(true);
    expect(afterFirstHover.box2).toBe(false);

    // (250, 50) is inside box2, which starts at x = 200.
    await page.hover(250, 50);
    const afterSecondHover = await readHoverFlags();

    expect(afterSecondHover.box1).toBe(false);
    expect(afterSecondHover.box2).toBe(true);
  });
});


================================================
FILE: packages/core/tests/integration/page-screenshot.spec.ts
================================================
import { test, expect } from "@playwright/test";
import { promises as fs } from "fs";
import * as os from "os";
import * as path from "path";
import { V3 } from "../../lib/v3/v3.js";
import { v3TestConfig } from "./v3.config.js";
import { Frame } from "../../lib/v3/understudy/frame.js";

// Promise-based sleep: the returned promise settles once `ms` milliseconds have elapsed.
const wait = (ms: number) =>
  new Promise((done) => {
    setTimeout(done, ms);
  });

test.describe("Page.screenshot options", () => {
  let v3: V3;

  // Build and initialise a new V3 instance ahead of every test.
  test.beforeEach(async () => {
    const instance = new V3(v3TestConfig);
    v3 = instance;
    await instance.init();
  });

  // Best-effort teardown: tolerates a missing instance and ignores close() rejections.
  test.afterEach(async () => {
    const ignoreFailure = (): void => {};
    await v3?.close?.().catch(ignoreFailure);
  });

  // clip and fullPage are mutually exclusive; asking for both must reject.
  test("rejects clip combined with fullPage", async () => {
    const page = v3.context.pages()[0];
    await page.goto("data:text/html,<html><body>test</body></html>");

    const attempt = page.screenshot({
      fullPage: true,
      clip: { x: 0, y: 0, width: 100, height: 100 },
    });

    await expect(attempt).rejects.toThrow(/clip and fullPage/);
  });

  // An image type outside the typed union must be rejected at runtime as well.
  test("rejects unsupported image type", async () => {
    const page = v3.context.pages()[0];
    await page.goto("data:text/html,<html><body>noop</body></html>");

    const attempt = page.screenshot({
      // @ts-expect-error intentional invalid type for runtime validation
      type: "webp",
    });

    await expect(attempt).rejects.toThrow(/unsupported image type/);
  });

  // Passing `quality` together with type "png" must reject.
  test("rejects jpeg quality for png screenshots", async () => {
    const page = v3.context.pages()[0];
    await page.goto("data:text/html,<html><body>noop</body></html>");

    const attempt = page.screenshot({ type: "png", quality: 50 });

    await expect(attempt).rejects.toThrow(/quality option is only valid/);
  });

  // A main-frame screenshot that takes 50ms must trip a 10ms timeout.
  test("honours timeout option", async () => {
    const page = v3.context.pages()[0];
    await page.goto("data:text/html,<html><body>noop</body></html>");

    const mainFrame = page.mainFrame();
    // View of the frame whose screenshot member can be reassigned.
    type PatchableFrame = typeof mainFrame & {
      screenshot: typeof mainFrame.screenshot;
    };
    const patchable = mainFrame as PatchableFrame;
    const originalScreenshot = mainFrame.screenshot.bind(mainFrame);

    // Swap in a deliberately slow stub for the duration of the assertion.
    patchable.screenshot = async () => {
      await wait(50);
      return Buffer.from("late");
    };

    try {
      const attempt = page.screenshot({ timeout: 10 });
      await expect(attempt).rejects.toThrow(/timed out|timeout/i);
    } finally {
      // Always put the (bound) original back, even if the expectation fails.
      patchable.screenshot = originalScreenshot;
    }
  });

  // Exercises the richer screenshot options in one call. Frame.screenshot,
  // Frame.evaluate and the main session's send() are wrapped with spies so the
  // test can assert on what reaches them, and it then checks that the temporary
  // mask/style nodes are gone from the page afterwards.
  test("applies advanced options and cleans up overlays", async () => {
    const page = v3.context.pages()[0];
    const screenshotTimeout = process.env.CI ? 15000 : 5000;
    const testStart = Date.now();
    console.log(
      `[screenshot-test] start ${new Date(testStart).toISOString()} timeout=${screenshotTimeout}`,
    );

    const html = `
      <!doctype html>
      <html>
        <head>
          <meta charset="utf-8" />
          <style>
            body { background: #aaccee; margin: 0; height: 100vh; display: flex; flex-direction: column; align-items: flex-start; }
            .mask-target { width: 80px; height: 80px; margin: 40px; background: rgb(0, 180, 60); animation: pulse 1s infinite alternate; }
            @keyframes pulse { from { transform: scale(1); } to { transform: scale(1.2); } }
          </style>
        </head>
        <body>
          <div class="mask-target"></div>
          <div class="mask-target"></div>
          <input id="focus-me" value="focus" />
          <script>document.getElementById('focus-me').focus();</script>
        </body>
      </html>
    `;

    await page.goto("data:text/html," + encodeURIComponent(html));
    console.log(`[screenshot-test] page loaded in ${Date.now() - testStart}ms`);

    const maskLocator = page.locator(".mask-target");
    const tempPath = path.join(
      os.tmpdir(),
      `stagehand-screenshot-${Date.now()}-${Math.random().toString(36).slice(2)}.jpeg`,
    );
    console.log(`[screenshot-test] tempPath=${tempPath}`);

    const targetId = page.targetId();
    const screenshotCalls: Array<{
      frameId: string;
      options: Parameters<Frame["screenshot"]>[0];
    }> = [];
    const evaluateCalls: Array<{ frameId: string; arg: unknown }> = [];
    const sendCalls: Array<{ method: string; params: unknown }> = [];

    // Capture every original BEFORE anything is patched. If one of these
    // lookups throws, no global (prototype-level) patch has been installed yet,
    // so nothing can leak into other tests.
    const originalScreenshot = Frame.prototype.screenshot;
    const originalEvaluate = Frame.prototype.evaluate;
    const internalPage = page as unknown as {
      mainSession: {
        send: (method: string, params?: unknown) => Promise<unknown>;
      };
    };
    const originalSend = internalPage.mainSession.send.bind(
      internalPage.mainSession,
    ) as (method: string, params?: unknown) => Promise<unknown>;

    try {
      // All patches are installed inside the try so the finally block below is
      // guaranteed to undo them.

      // Hook Frame.screenshot so we can assert which options reach CDP without writing real data.
      Frame.prototype.screenshot = async function screenshotSpy(options) {
        const frame = this as Frame;
        if (frame.pageId === targetId) {
          screenshotCalls.push({ frameId: frame.frameId, options });
          return Buffer.from("stub-image");
        }
        return originalScreenshot.call(this, options);
      };

      // Spy on Frame.evaluate to capture the arguments used to inject CSS/masks.
      Frame.prototype.evaluate = async function evaluateSpy(expression, arg?) {
        const frame = this as Frame;
        if (frame.pageId === targetId) {
          evaluateCalls.push({ frameId: frame.frameId, arg });
        }
        return originalEvaluate.call(this, expression as never, arg);
      } as Frame["evaluate"];

      // Capture background overrides so we can confirm omitBackground toggles on/off.
      internalPage.mainSession.send = async (
        method: string,
        params?: unknown,
      ) => {
        sendCalls.push({ method, params });
        return originalSend(method, params);
      };

      const maskCount = await maskLocator.count();
      console.log(`[screenshot-test] maskLocator.count=${maskCount}`);

      const buffer = await page.screenshot({
        animations: "disabled",
        caret: "hide",
        clip: { x: 0, y: 0, width: 200, height: 200 },
        mask: [maskLocator],
        maskColor: "rgba(255, 0, 0, 0.4)",
        omitBackground: true,
        path: tempPath,
        quality: 80,
        scale: "css",
        style: "body { border: 3px solid black; }",
        timeout: screenshotTimeout,
        type: "jpeg",
      });
      console.log(
        `[screenshot-test] screenshot returned bytes=${buffer.length} elapsed=${Date.now() - testStart}ms`,
      );

      expect(Buffer.isBuffer(buffer)).toBeTruthy();
      expect(screenshotCalls.length).toBeGreaterThanOrEqual(1);
      console.log(
        `[screenshot-test] screenshotCalls=${screenshotCalls.length} evaluateCalls=${evaluateCalls.length} sendCalls=${sendCalls.length}`,
      );
      const recorded = screenshotCalls[0]?.options ?? {};
      expect(recorded).toMatchObject({ type: "jpeg", quality: 80 });
      expect(recorded?.clip).toMatchObject({
        x: 0,
        y: 0,
        width: 200,
        height: 200,
      });
      // Only sanity-check the scale when a numeric value was forwarded.
      if (typeof recorded?.scale === "number") {
        expect(recorded.scale).toBeGreaterThan(0);
        expect(recorded.scale).toBeLessThanOrEqual(2);
      }

      // stat() throws if the file is missing, so this asserts `path` was written.
      await fs.stat(tempPath);

      // No mask overlay nodes may remain in the document after the screenshot.
      const maskNodes = await page.evaluate(
        () => document.querySelectorAll("[data-stagehand-mask]").length,
      );
      expect(maskNodes).toBe(0);

      // Likewise for injected style nodes.
      const styleNodes = await page.evaluate(
        () => document.querySelectorAll("[data-stagehand-style]").length,
      );
      expect(styleNodes).toBe(0);

      // Expect at least two background override calls: one carrying a colour
      // and one with empty/absent params.
      const backgroundCalls = sendCalls.filter(
        (call) => call.method === "Emulation.setDefaultBackgroundColorOverride",
      );
      expect(backgroundCalls.length).toBeGreaterThan(1);
      expect(
        backgroundCalls.some(
          (call) =>
            call.params &&
            typeof call.params === "object" &&
            "color" in (call.params as Record<string, unknown>),
        ),
      ).toBeTruthy();
      expect(
        backgroundCalls.some(
          (call) =>
            !call.params ||
            Object.keys(call.params as Record<string, unknown>).length === 0,
        ),
      ).toBeTruthy();

      const cssArgs = evaluateCalls
        .map((entry) => {
          const value = entry.arg as { css?: string } | undefined;
          return value?.css ?? null;
        })
        .filter((css): css is string => typeof css === "string");

      const tokens = evaluateCalls
        .map((entry) => {
          const arg = entry.arg as { token?: string } | undefined;
          return arg?.token ?? null;
        })
        .filter((token): token is string => typeof token === "string");

      // Tokens include which helper injected the style (animations/caret/custom).
      expect(tokens.some((token) => token.includes("animations"))).toBeTruthy();
      expect(tokens.some((token) => token.includes("caret"))).toBeTruthy();
      expect(tokens.some((token) => token.includes("custom"))).toBeTruthy();
      // Custom style should bubble through so we check the actual CSS text.
      expect(
        cssArgs.some((css) => css.includes("border: 3px solid black")),
      ).toBeTruthy();

      // The mask helper is identified by an evaluate argument carrying `rects`;
      // two .mask-target elements exist, so two rects are expected.
      const maskCalls = evaluateCalls.filter((entry) => {
        const arg = entry.arg;
        return (
          arg &&
          typeof arg === "object" &&
          "rects" in (arg as Record<string, unknown>)
        );
      });
      expect(maskCalls.length).toBeGreaterThan(0);
      const rects = (maskCalls[0]?.arg as { rects?: unknown } | undefined)
        ?.rects;
      expect(Array.isArray(rects)).toBeTruthy();
      expect((rects as unknown[]).length).toBe(2);
    } finally {
      // Undo every patch and remove the temp file regardless of the outcome.
      Frame.prototype.screenshot = originalScreenshot;
      Frame.prototype.evaluate = originalEvaluate;
      internalPage.mainSession.send = originalSend;
      await fs.unlink(tempPath).catch(() => {});
    }
  });

  // Masks for an element inside an open <dialog> should be placed inside that
  // dialog; the spy counts them at the moment the screenshot would be taken.
  test("masks elements inside dialog top layer", async () => {
    const html = `
      <!doctype html>
      <html>
        <head>
          <meta charset="utf-8" />
          <style>
            dialog { padding: 16px; border: 2px solid #444; }
            #dialog-input { display: block; width: 160px; height: 32px; }
          </style>
        </head>
        <body>
          <dialog id="dialog">
            <label>Secret <input id="dialog-input" value="top-layer" /></label>
          </dialog>
          <script>
            const dialog = document.getElementById("dialog");
            if (dialog) {
              if (typeof dialog.showModal === "function") {
                try {
                  dialog.showModal();
                } catch {
                  dialog.setAttribute("open", "");
                }
              } else {
                dialog.setAttribute("open", "");
              }
            }
          </script>
        </body>
      </html>
    `;
    const page = v3.context.pages()[0];

    await page.goto("data:text/html," + encodeURIComponent(html));

    const ownTargetId = page.targetId();
    const untouchedScreenshot = Frame.prototype.screenshot;
    let masksSeenInDialog = 0;

    // For frames of this page: count mask nodes inside the open dialog and
    // return a stub image. Other frames fall through to the real method.
    Frame.prototype.screenshot = async function screenshotSpy(options) {
      const frame = this as Frame;
      if (frame.pageId !== ownTargetId) {
        return untouchedScreenshot.call(this, options);
      }
      masksSeenInDialog = await frame.evaluate(() => {
        const openDialog = document.querySelector("dialog[open]");
        if (!openDialog) return 0;
        return openDialog.querySelectorAll("[data-stagehand-mask]").length;
      });
      return Buffer.from("stub-image");
    };

    try {
      const inputInsideDialog = page.locator("#dialog-input");
      await page.screenshot({
        mask: [inputInsideDialog],
      });
      expect(masksSeenInDialog).toBeGreaterThan(0);
    } finally {
      // Restore the prototype method no matter how the test ends.
      Frame.prototype.screenshot = untouchedScreenshot;
    }
  });
});


================================================
FILE: packages/core/tests/integration/page-scroll.spec.ts
================================================
import { test, expect } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import { v3TestConfig } from "./v3.config.js";

test.describe("Page.scroll() - mouse wheel scrolling", () => {
  let v3: V3;

  // Build and initialise a new V3 instance ahead of every test.
  test.beforeEach(async () => {
    const instance = new V3(v3TestConfig);
    v3 = instance;
    await instance.init();
  });

  // Best-effort teardown: tolerates a missing instance and ignores close() rejections.
  test.afterEach(async () => {
    const ignoreFailure = (): void => {};
    await v3?.close?.().catch(ignoreFailure);
  });

  // A positive deltaY on a tall page should move window.scrollY away from 0.
  test("scrolls page vertically with positive deltaY", async () => {
    const markup = `<!doctype html><html><body style="height: 2000px;">
            <div style="height: 400px; background: lightblue;">Section 1</div>
            <div style="height: 400px; background: lightgreen;">Section 2</div>
            <div style="height: 400px; background: lightyellow;">Section 3</div>
            <div style="height: 400px; background: lightcoral;">Section 4</div>
            <div style="height: 400px; background: lightgray;">Section 5</div>
          </body></html>`;
    const page = v3.context.pages()[0];
    await page.goto("data:text/html," + encodeURIComponent(markup));

    const readScrollY = () => page.evaluate(() => window.scrollY);

    // The page starts at the top.
    expect(await readScrollY()).toBe(0);

    // Wheel down by 300 at viewport point (640, 400).
    await page.scroll(640, 400, 0, 300);

    // Pause 200ms inside the page so the scroll can take effect.
    await page.evaluate(() => new Promise((r) => setTimeout(r, 200)));

    // The vertical offset must have increased.
    expect(await readScrollY()).toBeGreaterThan(0);
  });

  // A positive deltaX on a wide page should move window.scrollX away from 0.
  test("scrolls page horizontally with positive deltaX", async () => {
    const markup = `<!doctype html><html><body style="width: 2000px; height: 600px;">
            <div style="display: inline-block; width: 400px; height: 100%; background: lightblue;">Section 1</div>
            <div style="display: inline-block; width: 400px; height: 100%; background: lightgreen;">Section 2</div>
            <div style="display: inline-block; width: 400px; height: 100%; background: lightyellow;">Section 3</div>
            <div style="display: inline-block; width: 400px; height: 100%; background: lightcoral;">Section 4</div>
            <div style="display: inline-block; width: 400px; height: 100%; background: lightgray;">Section 5</div>
          </body></html>`;
    const page = v3.context.pages()[0];
    await page.goto("data:text/html," + encodeURIComponent(markup));

    const readScrollX = () => page.evaluate(() => window.scrollX);

    // The page starts at the left edge.
    expect(await readScrollX()).toBe(0);

    // Wheel right by 300 at viewport point (640, 400).
    await page.scroll(640, 400, 300, 0);

    // Pause 200ms inside the page so the scroll can take effect.
    await page.evaluate(() => new Promise((r) => setTimeout(r, 200)));

    // The horizontal offset must have increased.
    expect(await readScrollX()).toBeGreaterThan(0);
  });

  // A single wheel event with both deltas set should move both scroll offsets.
  test("scrolls in both directions simultaneously", async () => {
    const markup = `<!doctype html><html><body style="width: 2000px; height: 2000px;">
            <div style="width: 100%; height: 100%; background: linear-gradient(135deg, lightblue, lightcoral);">
              Diagonal content
            </div>
          </body></html>`;
    const page = v3.context.pages()[0];
    await page.goto("data:text/html," + encodeURIComponent(markup));

    // deltaX = deltaY = 200 at viewport point (640, 400).
    await page.scroll(640, 400, 200, 200);

    // Pause 200ms inside the page so the scroll can take effect.
    await page.evaluate(() => new Promise((r) => setTimeout(r, 200)));

    // Read both offsets in one round trip.
    const { x: offsetX, y: offsetY } = await page.evaluate(() => ({
      x: window.scrollX,
      y: window.scrollY,
    }));

    expect(offsetX).toBeGreaterThan(0);
    expect(offsetY).toBeGreaterThan(0);
  });

  // Scrolling from a given viewport coordinate should still scroll the page.
  test("scrolls at specific coordinate on page", async () => {
    const markup = `<!doctype html><html><body style="height: 2000px;">
            <div id="marker" style="position: fixed; top: 400px; left: 640px; width: 2px; height: 2px; background: red;"></div>
            <div style="height: 500px; background: lightblue;">Top</div>
            <div style="height: 500px; background: lightgreen;">Middle</div>
            <div style="height: 500px; background: lightyellow;">Bottom</div>
          </body></html>`;
    const page = v3.context.pages()[0];
    await page.goto("data:text/html," + encodeURIComponent(markup));

    // The wheel event is issued at (640, 400), where the fixed marker sits.
    await page.scroll(640, 400, 0, 400);

    // Pause 200ms inside the page so the scroll can take effect.
    await page.evaluate(() => new Promise((r) => setTimeout(r, 200)));

    const verticalOffset = await page.evaluate(() => window.scrollY);
    expect(verticalOffset).toBeGreaterThan(0);
  });

  // A deltaY of 1000 should move the page by more than 500px.
  test("scrolls with large deltaY values", async () => {
    const markup = `<!doctype html><html><body style="height: 5000px;">
            <div style="height: 1000px; background: lightblue;">Section 1</div>
            <div style="height: 1000px; background: lightgreen;">Section 2</div>
            <div style="height: 1000px; background: lightyellow;">Section 3</div>
            <div style="height: 1000px; background: lightcoral;">Section 4</div>
            <div style="height: 1000px; background: lightgray;">Section 5</div>
          </body></html>`;
    const page = v3.context.pages()[0];
    await page.goto("data:text/html," + encodeURIComponent(markup));

    // One large wheel step at viewport point (640, 400).
    await page.scroll(640, 400, 0, 1000);

    // Pause 200ms inside the page so the scroll can take effect.
    await page.evaluate(() => new Promise((r) => setTimeout(r, 200)));

    const verticalOffset = await page.evaluate(() => window.scrollY);
    expect(verticalOffset).toBeGreaterThan(500);
  });

  // After scrolling down, a negative deltaY should reduce window.scrollY again.
  test("negative deltaY scrolls up", async () => {
    const markup = `<!doctype html><html><body style="height: 2000px;">
            <div style="height: 500px; background: lightblue;">Top</div>
            <div style="height: 500px; background: lightgreen;">Middle 1</div>
            <div style="height: 500px; background: lightyellow;">Middle 2</div>
            <div style="height: 500px; background: lightcoral;">Bottom</div>
          </body></html>`;
    const page = v3.context.pages()[0];
    await page.goto("data:text/html," + encodeURIComponent(markup));

    const readScrollY = () => page.evaluate(() => window.scrollY);
    // In-page 200ms pause used after each wheel event.
    const settle = () =>
      page.evaluate(() => new Promise((r) => setTimeout(r, 200)));

    // Step 1: move down so there is room to scroll back up.
    await page.scroll(640, 400, 0, 500);
    await settle();

    const offsetAfterDown = await readScrollY();
    expect(offsetAfterDown).toBeGreaterThan(0);

    // Step 2: a negative delta should bring the page back towards the top.
    await page.scroll(640, 400, 0, -300);
    await settle();

    const offsetAfterUp = await readScrollY();
    expect(offsetAfterUp).toBeLessThan(offsetAfterDown);
  });

  // With returnXpath enabled, scroll() should report the element under the pointer.
  test("scroll returns xpath when requested", async () => {
    const markup = `<!doctype html><html><body style="height: 2000px; margin: 0; padding: 0;">
            <div id="target" style="position: absolute; top: 0px; left: 400px; width: 300px; height: 100px; background: blue;">
              Target element
            </div>
            <p style="position: absolute; top: 200px; left: 0px;">Content below</p>
          </body></html>`;
    const page = v3.context.pages()[0];
    await page.goto("data:text/html," + encodeURIComponent(markup));

    // The div covers x 400-700 and y 0-100, so (550, 50) is inside it.
    const scrolledXpath = await page.scroll(550, 50, 0, 200, {
      returnXpath: true,
    });

    // Expect a non-empty string back...
    expect(typeof scrolledXpath).toBe("string");
    expect(scrolledXpath.length).toBeGreaterThan(0);
    // ...that mentions the div or contains "target".
    const normalised = scrolledXpath.toLowerCase();
    expect(normalised).toMatch(/div|target/);
  });

  // When no xpath is requested, scroll() is expected to return "".
  test("scroll without returnXpath returns empty string", async () => {
    const markup = `<!doctype html><html><body style="height: 2000px;">
            <div style="height: 500px; background: lightblue;">Content</div>
          </body></html>`;
    const page = v3.context.pages()[0];
    await page.goto("data:text/html," + encodeURIComponent(markup));

    // No options object is passed, so returnXpath is not set.
    const returned = await page.scroll(640, 400, 0, 200);

    expect(returned).toBe("");
  });

  // Two identical wheel events in a row should each move the page further down.
  test("multiple sequential scrolls accumulate", async () => {
    const markup = `<!doctype html><html><body style="height: 3000px;">
            <div style="height: 750px; background: lightblue;">Section 1</div>
            <div style="height: 750px; background: lightgreen;">Section 2</div>
            <div style="height: 750px; background: lightyellow;">Section 3</div>
            <div style="height: 750px; background: lightcoral;">Section 4</div>
          </body></html>`;
    const page = v3.context.pages()[0];
    await page.goto("data:text/html," + encodeURIComponent(markup));

    const readScrollY = () => page.evaluate(() => window.scrollY);
    // In-page 200ms pause used after each wheel event.
    const settle = () =>
      page.evaluate(() => new Promise((r) => setTimeout(r, 200)));

    // First wheel step.
    await page.scroll(640, 400, 0, 200);
    await settle();

    const offsetAfterFirst = await readScrollY();
    expect(offsetAfterFirst).toBeGreaterThan(0);

    // Second wheel step with the same delta.
    await page.scroll(640, 400, 0, 200);
    await settle();

    const offsetAfterSecond = await readScrollY();

    expect(offsetAfterSecond).toBeGreaterThan(offsetAfterFirst);
  });
});


================================================
FILE: packages/core/tests/integration/page-send-cdp.spec.ts
================================================
import { test, expect } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import { v3TestConfig } from "./v3.config.js";

test.describe("Page sendCDP method", () => {
  let v3: V3;

  // Build and initialise a new V3 instance ahead of every test.
  test.beforeEach(async () => {
    const instance = new V3(v3TestConfig);
    v3 = instance;
    await instance.init();
  });

  // Best-effort teardown: tolerates a missing instance and ignores close() rejections.
  test.afterEach(async () => {
    const ignoreFailure = (): void => {};
    await v3?.close?.().catch(ignoreFailure);
  });

  // sendCDP() should forward raw CDP commands: adding a virtual authenticator
  // is expected to fail until WebAuthn.enable has been sent, then succeed.
  test("sends CDP commands and requires domain to be enabled first", async () => {
    const page = v3.context.pages()[0];
    await page.goto("https://example.com");

    // Returns a fresh params object per call so the two requests share no state.
    const authenticatorParams = () => ({
      options: {
        protocol: "ctap2",
        transport: "usb",
        hasResidentKey: false,
        hasUserVerification: false,
        isUserVerified: false,
      },
    });

    // WebAuthn has not been enabled yet, so this attempt should be rejected.
    const prematureAttempt = page.sendCDP(
      "WebAuthn.addVirtualAuthenticator",
      authenticatorParams(),
    );
    await expect(prematureAttempt).rejects.toThrow();

    // Turn the WebAuthn domain on.
    await page.sendCDP("WebAuthn.enable");

    // The same command should now go through.
    const created = await page.sendCDP<{ authenticatorId: string }>(
      "WebAuthn.addVirtualAuthenticator",
      authenticatorParams(),
    );

    // The reply must carry a non-empty string authenticator id.
    expect(created).toHaveProperty("authenticatorId");
    expect(typeof created.authenticatorId).toBe("string");
    expect(created.authenticatorId.length).toBeGreaterThan(0);
  });
});


================================================
FILE: packages/core/tests/integration/perform-understudy-method.spec.ts
================================================
import { expect, test } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import { v3DynamicTestConfig } from "./v3.dynamic.config.js";
import { performUnderstudyMethod } from "../../lib/v3/handlers/handlerUtils/actHandlerUtils.js";
import { closeV3 } from "./testUtils.js";

// Drives performUnderstudyMethod directly against static eval pages, one test
// per method, and checks the visible effect of each action.
test.describe("tests performUnderstudyMethod", () => {
  // Timeout handed to every performUnderstudyMethod call in this suite.
  const ACTION_TIMEOUT_MS = 30000;
  let v3: V3;

  // Navigates the first page of the current V3 context and returns it.
  const openFirstPage = async (url: string) => {
    const firstPage = v3.context.pages()[0];
    await firstPage.goto(url);
    return firstPage;
  };

  test.beforeEach(async () => {
    v3 = new V3(v3DynamicTestConfig);
    await v3.init();
  });

  test.afterEach(async () => {
    await closeV3(v3);
  });

  test("tests that clicking works", async () => {
    const page = await openFirstPage(
      "https://browserbase.github.io/stagehand-eval-sites/sites/no-js-click/",
    );

    await performUnderstudyMethod(
      page,
      page.mainFrame(),
      "click",
      "/html/body/button",
      [],
      ACTION_TIMEOUT_MS,
    );

    const successShown = await page.locator("#success-msg").isVisible();
    expect(successShown).toBe(true);
  });

  test("fill sets input value", async () => {
    const page = await openFirstPage(
      "https://browserbase.github.io/stagehand-eval-sites/sites/login/",
    );

    await performUnderstudyMethod(
      page,
      page.mainFrame(),
      "fill",
      "/html/body/main/form/div[1]/input",
      ["Alice"],
      ACTION_TIMEOUT_MS,
    );

    const field = page.locator("/html/body/main/form/div[1]/input");
    const typedValue = await field.inputValue();
    expect(typedValue).toBe("Alice");
  });

  test("tests that key presses work", async () => {
    const page = await openFirstPage(
      "https://browserbase.github.io/stagehand-eval-sites/sites/key-press/",
    );

    await performUnderstudyMethod(
      page,
      page.mainFrame(),
      "press",
      "xpath=/html",
      ["Enter"],
      ACTION_TIMEOUT_MS,
    );

    const heading = page.locator("/html/body/div/div/h1");
    const headingText = await heading.textContent();
    expect(headingText).toContain("Enter");
  });

  test("tests select option from a dropdown", async () => {
    const page = await openFirstPage(
      "https://browserbase.github.io/stagehand-eval-sites/sites/nested-dropdown/",
    );

    await performUnderstudyMethod(
      page,
      page.mainFrame(),
      "selectOptionFromDropdown",
      "xpath=//*[@id='licenseType']",
      ["Smog Check Technician"],
      ACTION_TIMEOUT_MS,
    );

    const checkedOption = page.locator("#licenseType >> option:checked");
    const selectedLabel = await checkedOption.textContent();
    expect(selectedLabel).toBe("Smog Check Technician");
  });

  test("tests drag & drop works (start xpath & end xpath)", async () => {
    const page = await openFirstPage(
      "https://browserbase.github.io/stagehand-eval-sites/sites/drag-drop/",
    );

    // The selector is the drag source; the single argument is the drop target.
    const dragSource = "xpath=/html/body/div/section[1]/div[1]/div[1]";
    const dropTarget = "/html/body/div/section[2]/div/div[1]";

    await performUnderstudyMethod(
      page,
      page.mainFrame(),
      "dragAndDrop",
      dragSource,
      [dropTarget],
      ACTION_TIMEOUT_MS,
    );

    const dropped = page.locator("/html/body/div/section[2]/div/div[1]/div");
    const droppedText = await dropped.textContent();
    expect(droppedText).toBe("TEXT: Hello from text");
  });
});


================================================
FILE: packages/core/tests/integration/setinputfiles.spec.ts
================================================
import { expect, test } from "@playwright/test";
import { Buffer } from "buffer";
import { promises as fs } from "fs";
import path from "path";
import crypto from "crypto";
import type { Page as V3Page } from "../../lib/v3/understudy/page.js";
import { V3 } from "../../lib/v3/v3.js";
import { v3TestConfig } from "./v3.config.js";

// Eval pages used by this suite: one hosts the upload input inside an iframe,
// the other exposes several upload inputs directly on the page.
const FILE_UPLOAD_IFRAME_URL =
  "https://browserbase.github.io/stagehand-eval-sites/sites/file-uploads-iframe/";
const FILE_UPLOAD_V2_URL =
  "https://browserbase.github.io/stagehand-eval-sites/sites/file-uploads-2/";

// Input / success-message selector pairs on the FILE_UPLOAD_V2_URL page.
const RESUME_INPUT = "#resumeUpload";
const RESUME_SUCCESS = "#resumeSuccess";
const IMAGES_INPUT = "#imagesUpload";
const IMAGES_SUCCESS = "#imagesSuccess";
const AUDIO_INPUT = "#audioUpload";
const AUDIO_SUCCESS = "#audioSuccess";
// Selectors that continue past the <iframe> element into its document; both are
// passed to page.deepLocator in the iframe test below.
const IFRAME_UPLOAD_INPUT = "/html/body/div/iframe/html/body/div/div[1]/input";
const IFRAME_SUCCESS =
  "body > div > iframe >> html > body > div > div:nth-of-type(2)";

// Covers setInputFiles() with every accepted input shape: relative path,
// absolute paths, a single in-memory payload and multiple payloads, plus an
// upload through deepLocator into an iframe.
test.describe("tests setInputFiles()", () => {
  let v3: V3;
  // Absolute paths of files written by createFixture; removed in afterEach.
  const fixtures: string[] = [];

  test.beforeEach(async () => {
    v3 = new V3(v3TestConfig);
    await v3.init();
  });

  test.afterEach(async () => {
    // Best-effort teardown: ignore close failures and already-missing files.
    await v3?.close?.().catch(() => {});
    await Promise.all(
      // splice(0) empties the shared list while handing back its contents.
      fixtures.splice(0).map((file) => fs.unlink(file).catch(() => {})),
    );
  });

  /**
   * Writes a uniquely named file into the current working directory and
   * registers it for cleanup.
   *
   * @param namePrefix Leading part of the file name.
   * @param contents UTF-8 text written to the file.
   * @param ext Extension, with or without the leading dot.
   * @returns Absolute path of the created file.
   */
  const createFixture = async (
    namePrefix: string,
    contents: string,
    ext = ".txt",
  ): Promise<string> => {
    const normalizedExt = ext.startsWith(".") ? ext : `.${ext}`;
    // Random suffix keeps names unique across tests.
    const filename = `${namePrefix}-${crypto.randomBytes(4).toString("hex")}${normalizedExt}`;
    const filePath = path.resolve(process.cwd(), filename);
    await fs.writeFile(filePath, contents, "utf-8");
    fixtures.push(filePath);
    return filePath;
  };

  /**
   * Polls until the element at `successSelector` is displayed and its text
   * contains `expectedText`. A missing or `display: none` element counts as
   * empty text.
   */
  const expectUploadSuccess = async (
    page: V3Page,
    successSelector: string,
    expectedText: string,
  ) => {
    await expect
      .poll(
        () =>
          page.evaluate((selector) => {
            const el = document.querySelector(selector);
            if (!el) return "";
            const display = window.getComputedStyle(el).display;
            if (display === "none") return "";
            return el.textContent ?? "";
          }, successSelector),
        { message: `wait for success message at ${successSelector}` },
      )
      .toContain(expectedText);
  };

  /**
   * Returns how many files are attached to the input at `inputSelector`,
   * or 0 when the element is not an <input>.
   */
  const getInputFileCount = async (page: V3Page, inputSelector: string) => {
    return await page.evaluate((selector) => {
      const el = document.querySelector(selector);
      if (!(el instanceof HTMLInputElement)) return 0;
      return el.files?.length ?? 0;
    }, inputSelector);
  };

  /** Polls until the input at `inputSelector` holds exactly `expected` files. */
  const expectFileCount = async (
    page: V3Page,
    inputSelector: string,
    expected: number,
  ) => {
    await expect
      .poll(() => getInputFileCount(page, inputSelector), {
        message: `wait for file count on ${inputSelector}`,
      })
      .toBe(expected);
  };

  test("deepLocator uploads and validates within iframe", async () => {
    const page = v3.context.pages()[0];
    await page.goto(FILE_UPLOAD_IFRAME_URL);
    const fixture = await createFixture(
      "iframe-upload",
      "<p>iframe upload</p>",
      ".txt",
    );
    // The fixture is passed as a path relative to the working directory.
    await page
      .deepLocator(IFRAME_UPLOAD_INPUT)
      .setInputFiles(path.relative(process.cwd(), fixture));

    const successLocator = page.deepLocator(IFRAME_SUCCESS);
    await expect
      .poll(async () => (await successLocator.textContent()) ?? "", {
        message: "wait for iframe upload success",
      })
      .toContain("file uploaded successfully");
  });

  test("locator uploads resume via relative path string", async () => {
    const page = v3.context.pages()[0];
    await page.goto(FILE_UPLOAD_V2_URL);
    const fixture = await createFixture("resume", "<p>resume</p>", ".pdf");
    await page
      .locator(RESUME_INPUT)
      .setInputFiles(path.relative(process.cwd(), fixture));
    await expectUploadSuccess(page, RESUME_SUCCESS, "Resume uploaded!");
    await expectFileCount(page, RESUME_INPUT, 1);
  });

  test("locator uploads multiple images via absolute paths", async () => {
    const page = v3.context.pages()[0];
    await page.goto(FILE_UPLOAD_V2_URL);
    // createFixture returns absolute paths, which are passed through unchanged.
    const first = await createFixture("image-a", "<p>A</p>", ".png");
    const second = await createFixture("image-b", "<p>B</p>", ".jpeg");
    await page.locator(IMAGES_INPUT).setInputFiles([first, second]);
    await expectUploadSuccess(page, IMAGES_SUCCESS, "Images uploaded!");
    await expectFileCount(page, IMAGES_INPUT, 2);
  });

  test("locator uploads audio via payload object", async () => {
    const page = v3.context.pages()[0];
    await page.goto(FILE_UPLOAD_V2_URL);
    // In-memory payload: no file is written to disk for this test.
    await page.locator(AUDIO_INPUT).setInputFiles({
      name: "voice-sample.mp3",
      mimeType: "audio/mpeg",
      buffer: Buffer.from("fake audio bytes", "utf-8"),
    });
    await expectUploadSuccess(page, AUDIO_SUCCESS, "Audio file uploaded!");
    await expectFileCount(page, AUDIO_INPUT, 1);
  });

  test("locator uploads multiple payload objects to images input", async () => {
    const page = v3.context.pages()[0];
    await page.goto(FILE_UPLOAD_V2_URL);
    await page.locator(IMAGES_INPUT).setInputFiles([
      {
        name: "payload-a.png",
        mimeType: "image/png",
        buffer: Buffer.from("payload-a", "utf-8"),
      },
      {
        name: "payload-b.png",
        mimeType: "image/png",
        buffer: Buffer.from("payload-b", "utf-8"),
      },
    ]);
    await expectUploadSuccess(page, IMAGES_SUCCESS, "Images uploaded!");
    await expectFileCount(page, IMAGES_INPUT, 2);
  });
});


================================================
FILE: packages/core/tests/integration/shadow-iframe-oopif.spec.ts
================================================
import { test, expect } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import puppeteer from "puppeteer-core";
import { chromium as playwrightChromium } from "playwright-core";
import { chromium as patchrightChromium } from "patchright-core";
import { Action } from "../../lib/v3/types/public/methods.js";
import { AnyPage } from "../../lib/v3/types/public/page.js";
import { v3DynamicTestConfig } from "./v3.dynamic.config.js";
import { closeV3 } from "./testUtils.js";

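/**
 * IMPORTANT:
 * - Each test creates its own V3 instance (beforeEach) and closes it (afterEach) to avoid cross-test state.
 *   The suite itself is declared with test.describe.parallel.
 * - Every case asserts an *effect*: after the action runs, the extracted page text must contain the
 *   case's expected substrings (e.g. the filled input value or a click confirmation message).
 */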

/** One scenario: where to navigate, what action to perform, and what text must appear afterwards. */
type Case = {
  // Human-readable name, used as part of the generated test title.
  title: string;
  // Page the selected framework navigates to before acting.
  url: string;
  // Action handed to v3.act().
  action: Action;
  expectedSubstrings: string[]; // check v3.extract().pageText contains these
};

/** Client library whose page object is handed to V3 for the scenario. */
type Framework = "v3" | "puppeteer" | "playwright" | "patchright";

/**
 * Runs one scenario through the page object of the requested framework.
 *
 * The framework's first page is navigated to `c.url`, `c.action` is performed
 * with `v3.act`, and the text returned by `v3.extract` must contain every entry
 * of `c.expectedSubstrings`. Puppeteer, Playwright and Patchright attach to the
 * browser through `v3.connectURL()`.
 *
 * @param v3 Initialized V3 instance.
 * @param c Scenario to execute.
 * @param framework Client library that supplies the page passed to V3.
 * @throws If navigation, the action, the extraction or an expectation fails.
 */
async function runCase(v3: V3, c: Case, framework: Framework): Promise<void> {
  let cleanup: (() => Promise<void> | void) | null = null;

  // Wraps a close call so teardown problems never replace the real test error.
  const quietly = (close: () => Promise<unknown>) => async (): Promise<void> => {
    try {
      await close();
    } catch {
      // best-effort cleanup
    }
  };

  // The whole flow sits inside try/finally, and cleanup is registered right
  // after connecting, so a failed navigation no longer leaks the client
  // connection.
  try {
    // Acquire the correct page for the requested framework
    let page: AnyPage | undefined;
    switch (framework) {
      case "v3": {
        const v3Page = v3.context.pages()[0];
        await v3Page.goto(c.url, { waitUntil: "networkidle" });
        page = v3Page;
        break;
      }
      case "puppeteer": {
        const browser = await puppeteer.connect({
          browserWSEndpoint: v3.connectURL(),
          defaultViewport: null,
        });
        cleanup = quietly(() => browser.close());
        const pages = await browser.pages();
        const puppeteerPage = pages[0];
        await puppeteerPage.goto(c.url, { waitUntil: "networkidle0" });
        page = puppeteerPage;
        break;
      }
      case "playwright": {
        const pwBrowser = await playwrightChromium.connectOverCDP(
          v3.connectURL(),
        );
        cleanup = quietly(() => pwBrowser.close());
        const pwContext = pwBrowser.contexts()[0];
        const pwPage = pwContext.pages()[0];
        await pwPage.goto(c.url, { waitUntil: "networkidle" as never });
        page = pwPage as unknown as AnyPage;
        break;
      }
      case "patchright": {
        const prBrowser = await patchrightChromium.connectOverCDP(
          v3.connectURL(),
        );
        cleanup = quietly(() => prBrowser.close());
        const prContext = prBrowser.contexts()[0];
        const prPage = prContext.pages()[0];
        await prPage.goto(c.url, { waitUntil: "networkidle" as never });
        page = prPage as unknown as AnyPage;
        break;
      }
    }

    if (!page) throw new Error("Missing page for selected framework");
    await v3.act(c.action, { page });
    // Post-action extraction; verify expected text appears
    const extraction = await v3.extract({ page });
    const text = extraction.pageText ?? "";
    for (const s of c.expectedSubstrings) {
      // toContain reports the actual page text when the expectation fails.
      expect(text, `expected pageText to include substring: ${s}`).toContain(s);
    }
  } finally {
    await cleanup?.();
  }
}

// Scenario table: every entry is executed once per framework by the describe
// block below. Selectors continue through the <iframe> element into its
// document; the "//" after a custom element presumably marks a hop into its
// shadow root (TODO confirm against the selector resolver).
const cases: Case[] = [
  {
    title: "Closed shadow root inside OOPIF",
    url: "https://browserbase.github.io/stagehand-eval-sites/sites/closed-shadow-root-in-oopif/",
    action: {
      selector:
        "xpath=/html/body/main/section/iframe/html/body/shadow-demo//div/button",
      method: "click",
      arguments: [""],
      description: "click button inside closed shadow root in OOPIF",
    },
    expectedSubstrings: ["button successfully clicked"],
  },
  {
    title: "Open shadow root inside OOPIF",
    url: "https://browserbase.github.io/stagehand-eval-sites/sites/open-shadow-root-in-oopif/",
    action: {
      selector:
        "xpath=/html/body/main/section/iframe/html/body/shadow-demo//div/button",
      method: "click",
      arguments: [""],
      description: "",
    },
    expectedSubstrings: ["button successfully clicked"],
  },
  {
    title: "OOPIF inside open shadow root",
    url: "https://browserbase.github.io/stagehand-eval-sites/sites/oopif-in-open-shadow-dom/",
    action: {
      selector:
        "xpath=/html/body/shadow-host//section/iframe/html/body/main/section[1]/form/div/div[1]/input",
      method: "fill",
      arguments: ["nunya"],
      description: "",
    },
    // The filled value itself must show up in the extracted page text.
    expectedSubstrings: ["nunya"],
  },
  {
    title: "OOPIF inside closed shadow root",
    url: "https://browserbase.github.io/stagehand-eval-sites/sites/oopif-in-closed-shadow-dom/",
    action: {
      selector:
        "xpath=/html/body/shadow-host//section/iframe/html/body/main/section[1]/form/div/div[1]/input",
      method: "fill",
      arguments: ["nunya"],
      description: "fill input inside OOPIF",
    },
    expectedSubstrings: ["nunya"],
  },
];

// Registers one test per (framework, scenario) pair; every test owns a fresh
// V3 instance that is closed again afterwards.
test.describe.parallel("Stagehand v3: shadow <-> iframe OOPIF scenarios", () => {
  let v3: V3;

  test.beforeEach(async () => {
    v3 = new V3(v3DynamicTestConfig);
    await v3.init();
  });

  test.afterEach(async () => {
    await closeV3(v3);
  });

  // Framework-major order: all scenarios for one framework, then the next.
  const frameworks: Framework[] = [
    "v3",
    "playwright",
    "puppeteer",
    "patchright",
  ];
  frameworks.forEach((framework) => {
    cases.forEach((scenario) => {
      test(`[${framework}] ${scenario.title}`, async () => {
        await runCase(v3, scenario, framework);
      });
    });
  });
});


================================================
FILE: packages/core/tests/integration/shadow-iframe-spif.spec.ts
================================================
import { test, expect } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import puppeteer from "puppeteer-core";
import { chromium as playwrightChromium } from "playwright-core";
import { chromium as patchrightChromium } from "patchright-core";
import { Action } from "../../lib/v3/types/public/methods.js";
import { AnyPage } from "../../lib/v3/types/public/page.js";
import { v3DynamicTestConfig } from "./v3.dynamic.config.js";
import { closeV3 } from "./testUtils.js";

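/**
 * IMPORTANT:
 * - Each test creates its own V3 instance (beforeEach) and closes it (afterEach) to avoid cross-test state.
 *   The suite itself is declared with test.describe.parallel.
 * - Every case asserts an *effect*: after the action runs, the extracted page text must contain the
 *   case's expected substrings (e.g. a click confirmation message).
 */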

/** One scenario: where to navigate, what action to perform, and what text must appear afterwards. */
type Case = {
  // Human-readable name, used as part of the generated test title.
  title: string;
  // Page the selected framework navigates to before acting.
  url: string;
  // Action handed to v3.act().
  action: Action;
  expectedSubstrings: string[]; // check v3.extract().pageText contains these
};

/** Client library whose page object is handed to V3 for the scenario. */
type Framework = "v3" | "puppeteer" | "playwright" | "patchright";

/**
 * Runs one scenario through the page object of the requested framework.
 *
 * The framework's first page is navigated to `c.url`, `c.action` is performed
 * with `v3.act`, and the text returned by `v3.extract` must contain every entry
 * of `c.expectedSubstrings`. Puppeteer, Playwright and Patchright attach to the
 * browser through `v3.connectURL()`.
 *
 * @param v3 Initialized V3 instance.
 * @param c Scenario to execute.
 * @param framework Client library that supplies the page passed to V3.
 * @throws If navigation, the action, the extraction or an expectation fails.
 */
async function runCase(v3: V3, c: Case, framework: Framework): Promise<void> {
  let cleanup: (() => Promise<void> | void) | null = null;

  // Wraps a close call so teardown problems never replace the real test error.
  const quietly = (close: () => Promise<unknown>) => async (): Promise<void> => {
    try {
      await close();
    } catch {
      // best-effort cleanup
    }
  };

  // The whole flow sits inside try/finally, and cleanup is registered right
  // after connecting, so a failed navigation no longer leaks the client
  // connection.
  try {
    // Acquire the correct page for the requested framework
    let page: AnyPage | undefined;
    switch (framework) {
      case "v3": {
        const v3Page = v3.context.pages()[0];
        await v3Page.goto(c.url, { waitUntil: "networkidle" });
        page = v3Page;
        break;
      }
      case "puppeteer": {
        const browser = await puppeteer.connect({
          browserWSEndpoint: v3.connectURL(),
          defaultViewport: null,
        });
        cleanup = quietly(() => browser.close());
        const pages = await browser.pages();
        const puppeteerPage = pages[0];
        await puppeteerPage.goto(c.url, { waitUntil: "networkidle0" });
        page = puppeteerPage;
        break;
      }
      case "playwright": {
        const pwBrowser = await playwrightChromium.connectOverCDP(
          v3.connectURL(),
        );
        cleanup = quietly(() => pwBrowser.close());
        const pwContext = pwBrowser.contexts()[0];
        const pwPage = pwContext.pages()[0];
        await pwPage.goto(c.url, { waitUntil: "networkidle" as never });
        page = pwPage as unknown as AnyPage;
        break;
      }
      case "patchright": {
        const prBrowser = await patchrightChromium.connectOverCDP(
          v3.connectURL(),
        );
        cleanup = quietly(() => prBrowser.close());
        const prContext = prBrowser.contexts()[0];
        const prPage = prContext.pages()[0];
        await prPage.goto(c.url, { waitUntil: "networkidle" as never });
        page = prPage as unknown as AnyPage;
        break;
      }
    }

    if (!page) throw new Error("Missing page for selected framework");
    await v3.act(c.action, { page });
    // Post-action extraction; verify expected text appears
    const extraction = await v3.extract({ page });
    const text = extraction.pageText ?? "";
    for (const s of c.expectedSubstrings) {
      // toContain reports the actual page text when the expectation fails.
      expect(text, `expected pageText to include substring: ${s}`).toContain(s);
    }
  } finally {
    await cleanup?.();
  }
}

// Scenario table: every entry is executed once per framework by the describe
// block below. Selectors continue through the <iframe> element into its
// document; the "//" after a custom element presumably marks a hop into its
// shadow root (TODO confirm against the selector resolver).
const cases: Case[] = [
  {
    title: "Open shadow root inside SPIF",
    url: "https://browserbase.github.io/stagehand-eval-sites/sites/open-shadow-root-in-spif/",
    action: {
      selector:
        "xpath=/html/body/main/section/iframe/html/body/shadow-demo//div/button",
      method: "click",
      arguments: [""],
      description: "",
    },
    expectedSubstrings: ["button successfully clicked"],
  },
  {
    title: "Closed shadow root inside SPIF",
    url: "https://browserbase.github.io/stagehand-eval-sites/sites/closed-shadow-dom-in-spif/",
    action: {
      selector: "xpath=/html/body/div/iframe/html/body/shadow-demo//div/button",
      method: "click",
      arguments: [""],
      description: "",
    },
    expectedSubstrings: ["button successfully clicked"],
  },
  {
    title: "SPIF inside closed shadow root",
    url: "https://browserbase.github.io/stagehand-eval-sites/sites/spif-in-closed-shadow-dom/",
    action: {
      selector: "xpath=/html/body/shadow-host//div/iframe/html/body/button",
      method: "click",
      arguments: [""],
      description: "",
    },
    expectedSubstrings: ["button successfully clicked"],
  },
  {
    title: "SPIF inside open shadow root",
    url: "https://browserbase.github.io/stagehand-eval-sites/sites/spif-in-open-shadow-dom/",
    action: {
      selector: "xpath=/html/body/shadow-host//div/iframe/html/body/button",
      method: "click",
      arguments: [""],
      description: "click button inside SPIF under open shadow",
    },
    expectedSubstrings: ["button successfully clicked"],
  },
];

// Registers one test per (framework, scenario) pair; every test owns a fresh
// V3 instance that is closed again afterwards.
test.describe.parallel("Stagehand v3: shadow <-> iframe SPIF scenarios", () => {
  let v3: V3;

  test.beforeEach(async () => {
    v3 = new V3(v3DynamicTestConfig);
    await v3.init();
  });

  test.afterEach(async () => {
    await closeV3(v3);
  });

  // Framework-major order: all scenarios for one framework, then the next.
  const frameworks: Framework[] = [
    "v3",
    "playwright",
    "puppeteer",
    "patchright",
  ];
  frameworks.forEach((framework) => {
    cases.forEach((scenario) => {
      test(`[${framework}] ${scenario.title}`, async () => {
        await runCase(v3, scenario, framework);
      });
    });
  });
});


================================================
FILE: packages/core/tests/integration/testUtils.ts
================================================
import type { V3 } from "../../lib/v3/v3.js";
import type {
  LanguageModelV2,
  LanguageModelV2CallOptions,
  LanguageModelV2Content,
  LanguageModelV2FinishReason,
  LanguageModelV2Usage,
} from "@ai-sdk/provider";
import { AISdkClient } from "../../lib/v3/llm/aisdk.js";

/**
 * Waits for `promise`, but gives up after `ms` milliseconds.
 *
 * @param promise Work to wait for.
 * @param ms Deadline in milliseconds.
 * @returns The promise's value, or the literal "timeout" when the deadline
 *   passes first. A rejection of `promise` that wins the race is propagated.
 *   The deadline timer is cleared once the race settles.
 */
export function raceTimeout<T>(
  promise: Promise<T>,
  ms: number,
): Promise<T | "timeout"> {
  let handle: ReturnType<typeof setTimeout> | undefined;
  const deadline = new Promise<"timeout">((expire) => {
    handle = setTimeout(() => {
      expire("timeout");
    }, ms);
  });
  const stopTimer = (): void => {
    clearTimeout(handle);
  };
  return Promise.race([promise, deadline]).finally(stopTimer);
}

/** Upper bound, in milliseconds, for each shutdown step performed by closeV3. */
const CLOSE_TIMEOUT_MS = 5_000;

/**
 * Waits until `promise` settles or `timeoutMs` elapses, whichever comes first.
 * A rejection of `promise` is swallowed, so the returned promise does not
 * reject because of it. The timer is cleared before returning.
 *
 * @param promise Work to wait for; its result is ignored.
 * @param timeoutMs Maximum time to wait, in milliseconds.
 */
async function settleWithTimeout(
  promise: Promise<unknown>,
  timeoutMs: number,
): Promise<void> {
  let timer: NodeJS.Timeout | undefined;
  const deadline = new Promise<void>((expire) => {
    timer = setTimeout(expire, timeoutMs);
  });
  try {
    const settled = promise.catch(() => {});
    await Promise.race([settled, deadline]);
  } finally {
    if (timer) {
      clearTimeout(timer);
    }
  }
}

/**
 * Shuts down a V3 instance without letting teardown hang.
 *
 * When `v3.isBrowserbase` is set, a "Browser.close" command is sent over the
 * context connection first. Then `v3.close()` is called. Each step is awaited
 * through settleWithTimeout with a limit of CLOSE_TIMEOUT_MS.
 *
 * @param v3 Instance to close; `null`/`undefined` is a no-op.
 */
export async function closeV3(v3?: V3 | null): Promise<void> {
  if (!v3) return;

  if (v3.isBrowserbase) {
    try {
      const browserClose = v3.context.conn.send("Browser.close");
      await settleWithTimeout(browserClose, CLOSE_TIMEOUT_MS);
    } catch {
      // best-effort cleanup
    }
  }

  const shutdown = v3.close();
  await settleWithTimeout(shutdown, CLOSE_TIMEOUT_MS);
}

/**
 * Bucket a JSON-mode model call is sorted into by resolveJsonResponseKey;
 * "default" also names the fallback script used when a bucket has none.
 */
type JsonResponseKey =
  | "act"
  | "Observation"
  | "Metadata"
  | "Extraction"
  | "default";

/** A canned JSON payload, or a function that builds one from the call options. */
type JsonResponseValue =
  | Record<string, unknown>
  | ((options: LanguageModelV2CallOptions) => Record<string, unknown>);

/** A single canned payload, or a list of them. */
type JsonResponseScript = JsonResponseValue | JsonResponseValue[];

/** A canned non-JSON generate result, or a function that builds one from the call options. */
type GenerateResponseValue =
  | {
      content: LanguageModelV2Content[];
      finishReason?: LanguageModelV2FinishReason;
      usage?: Partial<LanguageModelV2Usage>;
    }
  | ((options: LanguageModelV2CallOptions) => {
      content: LanguageModelV2Content[];
      finishReason?: LanguageModelV2FinishReason;
      usage?: Partial<LanguageModelV2Usage>;
    });

/** Language model that additionally records the options of every doGenerate call. */
type ScriptedLanguageModel = LanguageModelV2 & {
  doGenerateCalls: LanguageModelV2CallOptions[];
};

/** Input of createGenerateResult: content plus optional finish reason and usage. */
type ScriptedGenerateResult = {
  content: LanguageModelV2Content[];
  finishReason?: LanguageModelV2FinishReason;
  usage?: Partial<LanguageModelV2Usage>;
};

/** Token usage reported when a scripted response does not provide its own. */
const DEFAULT_USAGE: LanguageModelV2Usage = {
  inputTokens: 1,
  outputTokens: 1,
  totalTokens: 2,
  reasoningTokens: 0,
  cachedInputTokens: 0,
};

/**
 * Builds a complete usage record: fields present in `usage` win, everything
 * else comes from DEFAULT_USAGE. Always returns a new object.
 */
const mergeUsage = (
  usage?: Partial<LanguageModelV2Usage>,
): LanguageModelV2Usage => Object.assign({}, DEFAULT_USAGE, usage);

/**
 * Takes the next value from a script.
 *
 * - A non-array `value` is returned as is (or `fallback` when nullish).
 * - An array with more than one entry has its first entry removed and returned.
 * - An array with zero or one entry is left untouched, so its last entry keeps
 *   being returned on every later call.
 *
 * Nullish results are replaced by `fallback`.
 */
function consumeScriptValue<T>(value: T | T[] | undefined, fallback: T): T {
  if (Array.isArray(value)) {
    const next = value.length > 1 ? value.shift() : value[0];
    return next ?? fallback;
  }

  return value ?? fallback;
}

/**
 * Classifies a model call by the property names of its JSON response schema.
 *
 * @returns "default" when the call does not request JSON; otherwise "act"
 *   (schema has `elementId` and `twoStep`), "Observation" (`elements`),
 *   "Metadata" (`completed` and `progress`), or "Extraction" for anything else.
 */
function resolveJsonResponseKey(
  options: LanguageModelV2CallOptions,
): JsonResponseKey {
  const { responseFormat } = options;
  if (responseFormat?.type !== "json") {
    return "default";
  }

  const schema = responseFormat.schema as {
    type?: string;
    properties?: Record<string, unknown>;
  };
  const properties = schema?.properties ?? {};
  const hasAll = (...names: string[]): boolean =>
    names.every((name) => name in properties);

  // Checked in order; the first matching shape wins.
  if (hasAll("elementId", "twoStep")) return "act";
  if (hasAll("elements")) return "Observation";
  if (hasAll("completed", "progress")) return "Metadata";
  return "Extraction";
}

/**
 * Flattens a prompt into plain text, one chunk per line.
 *
 * String message contents are kept verbatim (even when empty). For structured
 * contents only non-empty `text` parts are kept; every other part is dropped.
 *
 * @returns All kept chunks joined with "\n"; "" for a missing or empty prompt.
 */
export function promptToText(
  prompt: LanguageModelV2CallOptions["prompt"],
): string {
  const chunks: string[] = [];

  for (const message of prompt ?? []) {
    if (typeof message.content === "string") {
      chunks.push(message.content);
      continue;
    }

    for (const part of message.content ?? []) {
      if (part.type !== "text") continue;
      if (part.text.length > 0) chunks.push(part.text);
    }
  }

  return chunks.join("\n");
}

/**
 * Collects every `<digits>-<digits>` token found in the prompt text,
 * in order of appearance.
 */
function findEncodedIds(options: LanguageModelV2CallOptions): string[] {
  const promptText = promptToText(options.prompt);
  // With the global flag, match() yields the full matches or null.
  return promptText.match(/\b\d+-\d+\b/g) ?? [];
}

/**
 * Finds the encoded id (`<digits>-<digits>`) printed on the same prompt line as
 * `text`.
 *
 * Lines are scanned top to bottom and the first line that contains `text` AND
 * an encoded id wins. Lines that mention `text` without an id (for example the
 * instruction echoing the label) are skipped rather than aborting the search.
 *
 * @param options Call options whose prompt is searched.
 * @param text Substring identifying the wanted line.
 * @returns The first encoded id on the matching line.
 * @throws Error when no line contains both `text` and an encoded id.
 */
export function findEncodedIdForText(
  options: LanguageModelV2CallOptions,
  text: string,
): string {
  const encodedId = /\b\d+-\d+\b/;

  for (const line of promptToText(options.prompt).split("\n")) {
    if (!line.includes(text)) continue;
    const match = line.match(encodedId);
    if (match) return match[0];
  }

  throw new Error(`Could not find encoded id for text: ${text}`);
}

/**
 * Returns the last encoded id that appears in the prompt.
 *
 * @throws Error when the prompt contains no encoded id at all.
 */
export function findLastEncodedId(options: LanguageModelV2CallOptions): string {
  const ids = findEncodedIds(options);
  const lastIndex = ids.length - 1;
  if (lastIndex < 0) {
    throw new Error("Could not find any encoded ids in the prompt.");
  }

  return ids[lastIndex];
}

/**
 * Builds a scripted model response consisting of a single tool call.
 *
 * @param toolName Name of the tool to call.
 * @param input Tool arguments; serialized with JSON.stringify.
 * @param toolCallId Call id; defaults to `<toolName>-1`.
 * @returns Response with finish reason "tool-calls" and DEFAULT_USAGE as usage.
 */
export function toolCallResponse(
  toolName: string,
  input: Record<string, unknown>,
  toolCallId = `${toolName}-1`,
): {
  content: LanguageModelV2Content[];
  finishReason: LanguageModelV2FinishReason;
  usage: LanguageModelV2Usage;
} {
  const call: LanguageModelV2Content = {
    type: "tool-call",
    toolCallId,
    toolName,
    input: JSON.stringify(input),
  };

  return { content: [call], finishReason: "tool-calls", usage: DEFAULT_USAGE };
}

/**
 * Builds a scripted response that calls the "done" tool.
 *
 * @param reasoning Value of the tool's `reasoning` argument.
 * @param taskComplete Value of the tool's `taskComplete` argument.
 * @param toolCallId Call id of the tool call.
 */
export function doneToolResponse(
  reasoning = "done",
  taskComplete = true,
  toolCallId = "done-1",
): {
  content: LanguageModelV2Content[];
  finishReason: LanguageModelV2FinishReason;
  usage: LanguageModelV2Usage;
} {
  const doneInput = { reasoning, taskComplete };
  return toolCallResponse("done", doneInput, toolCallId);
}

/**
 * Completes a scripted result into the shape returned from doGenerate:
 * a missing finish reason becomes "stop", usage is filled in via mergeUsage,
 * and an empty warnings list is attached.
 */
function createGenerateResult(result: ScriptedGenerateResult): {
  content: LanguageModelV2Content[];
  finishReason: LanguageModelV2FinishReason;
  usage: LanguageModelV2Usage;
  warnings: [];
} {
  const { content, finishReason, usage } = result;
  return {
    content,
    finishReason: finishReason ?? "stop",
    usage: mergeUsage(usage),
    warnings: [],
  };
}

/**
 * Creates an AISdkClient backed by an in-memory model that replays canned
 * responses instead of calling a real LLM.
 *
 * - JSON-mode calls are answered from `jsonResponses`, keyed by the bucket that
 *   resolveJsonResponseKey assigns to the call; a missing bucket falls back to
 *   `jsonResponses.default`, and a missing script yields `{}`.
 * - All other calls are answered from `generateResponses` in order; when no
 *   script is available the model replies with the text "done".
 * - List scripts are consumed one entry per call; the last entry keeps being
 *   reused once the list is down to one element.
 * - Script entries may be functions, which receive the call options.
 * - Streaming is not supported and throws.
 *
 * The options of every doGenerate call are recorded on the model's
 * `doGenerateCalls` array.
 *
 * @param options Optional model id and response scripts. Script arrays are
 *   copied, so the caller's arrays are not mutated.
 */
export function createScriptedAisdkTestLlmClient(options?: {
  modelId?: string;
  jsonResponses?: Partial<Record<JsonResponseKey, JsonResponseScript>>;
  generateResponses?: GenerateResponseValue[];
}): AISdkClient {
  // Shallow-copy list scripts because consuming them removes entries.
  const jsonResponses = Object.fromEntries(
    Object.entries(options?.jsonResponses ?? {}).map(([key, value]) => [
      key,
      Array.isArray(value) ? [...value] : value,
    ]),
  ) as Partial<Record<JsonResponseKey, JsonResponseScript>>;
  const generateResponses = [...(options?.generateResponses ?? [])];

  const model: ScriptedLanguageModel = {
    provider: "mock",
    modelId: options?.modelId ?? "mock/stagehand-flow-logger",
    specificationVersion: "v2",
    supportedUrls: {},
    doGenerateCalls: [],
    doGenerate: async (callOptions) => {
      model.doGenerateCalls.push(callOptions);

      if (callOptions.responseFormat?.type === "json") {
        const key = resolveJsonResponseKey(callOptions);
        // First pass: take the next entry of this bucket's script, or fall back
        // to the whole default script when the bucket has none.
        const responseScripts = consumeScriptValue<
          JsonResponseScript | undefined
        >(jsonResponses[key], jsonResponses.default);
        // Second pass: if the fallback was itself a list, take its next entry.
        const responseScript = consumeScriptValue<
          JsonResponseValue | undefined
        >(responseScripts, undefined);
        const response =
          typeof responseScript === "function"
            ? responseScript(callOptions)
            : (responseScript ?? {});

        // JSON answers are delivered as a single serialized text part.
        return createGenerateResult({
          content: [{ type: "text", text: JSON.stringify(response) }],
        });
      }

      const responseScript = consumeScriptValue<
        GenerateResponseValue | undefined
      >(generateResponses, undefined);

      if (!responseScript) {
        // Nothing scripted: answer with a plain "done" text.
        return createGenerateResult({
          content: [{ type: "text", text: "done" }],
        });
      }

      const response =
        typeof responseScript === "function"
          ? responseScript(callOptions)
          : responseScript;

      return createGenerateResult(response);
    },
    doStream: async () => {
      throw new Error("Streaming is not implemented for this test model.");
    },
  };

  return new AISdkClient({ model });
}


================================================
FILE: packages/core/tests/integration/text-selector-innermost.spec.ts
================================================
import { expect, test } from "@playwright/test";
import { Protocol } from "devtools-protocol";
import { V3 } from "../../lib/v3/v3.js";
import { v3DynamicTestConfig } from "./v3.dynamic.config.js";
import { closeV3 } from "./testUtils.js";

// Verifies that `text=` locators count only the innermost elements whose text
// contains the query, not the ancestors that wrap them.
test.describe("Text selector innermost element matching", () => {
  let v3: V3;

  test.beforeEach(async () => {
    v3 = new V3(v3DynamicTestConfig);
    await v3.init();
  });

  test.afterEach(async () => {
    await closeV3(v3);
  });

  test("text selector matches only innermost elements", async () => {
    const page = v3.context.pages()[0];

    // Three nested elements that all contain the text "Click me".
    await page.goto(
      "data:text/html," +
        encodeURIComponent(`
        <div id="outer">
          <span id="middle">
            <button id="inner">Click me</button>
          </span>
        </div>
      `),
    );

    // Only the button should be counted, not the parent elements
    const count = await page.mainFrame().locator("text=Click me").count();
    expect(count).toBe(1);

    // Verify it finds the button element specifically
    // NOTE(review): the script below recomputes the innermost match in the page
    // on its own rather than inspecting what the locator resolved to.
    const session = page.mainFrame().session;
    const { executionContextId } = await session.send<{
      executionContextId: number;
    }>("Page.createIsolatedWorld", {
      frameId: page.mainFrame().frameId,
      worldName: "test-world",
    });

    // Collect every element whose text includes "Click me", then return the id
    // of the first candidate that contains no other candidate.
    const evalRes = await session.send<Protocol.Runtime.EvaluateResponse>(
      "Runtime.evaluate",
      {
        expression: `(() => {
          const candidates = [];
          const iter = document.createNodeIterator(document.documentElement, NodeFilter.SHOW_ELEMENT);
          let n;
          while ((n = iter.nextNode())) {
            const el = n;
            const t = (el.innerText ?? el.textContent ?? '').trim();
            if (t && t.includes("Click me")) {
              candidates.push(el);
            }
          }
          
          // Find innermost
          for (const candidate of candidates) {
            let isInnermost = true;
            for (const other of candidates) {
              if (candidate !== other && candidate.contains(other)) {
                isInnermost = false;
                break;
              }
            }
            if (isInnermost) return candidate.id;
          }
          return null;
        })()`,
        contextId: executionContextId,
        returnByValue: true,
      },
    );

    expect(evalRes.result.value).toBe("inner");
  });

  test("multiple innermost elements with same text", async () => {
    const page = v3.context.pages()[0];

    // Three sibling-level elements carry the same text in different containers.
    await page.goto(
      "data:text/html," +
        encodeURIComponent(`
        <div>
          <button>Submit</button>
          <span>Some other content</span>
          <button>Submit</button>
        </div>
        <div>
          <a href="#">Submit</a>
        </div>
      `),
    );

    // Should find all three innermost elements (2 buttons + 1 link)
    const count = await page.mainFrame().locator("text=Submit").count();
    expect(count).toBe(3);
  });

  test("nested text with different innermost elements", async () => {
    const page = v3.context.pages()[0];

    // The parent's text spans its own text node and the child span.
    await page.goto(
      "data:text/html," +
        encodeURIComponent(`
        <div id="parent">
          Hello <span id="child">World</span>
        </div>
      `),
    );

    // "Hello" is only in the parent div
    const helloCount = await page.mainFrame().locator("text=Hello").count();
    expect(helloCount).toBe(1); // Only the div

    // "World" is only in the span
    const worldCount = await page.mainFrame().locator("text=World").count();
    expect(worldCount).toBe(1); // Only the span

    // "Hello World" matches only the parent div (as it's the innermost containing both words)
    const bothCount = await page
      .mainFrame()
      .locator("text=Hello World")
      .count();
    expect(bothCount).toBe(1); // Only the div
  });
});


================================================
FILE: packages/core/tests/integration/timeouts.spec.ts
================================================
import { test, expect } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import { v3DynamicTestConfig } from "./v3.dynamic.config.js";
import { z } from "zod";
import { closeV3 } from "./testUtils.js";
import type { LLMClient } from "../../lib/v3/llm/LLMClient.js";
import { generateText } from "ai";

/**
 * Names of the agent tools that the toolTimeout tests in this file can
 * script the mock model to call.
 */
type AgentToolNameWithTimeout =
  | "act"
  | "extract"
  | "fillForm"
  | "ariaTree"
  | "click"
  | "type"
  | "dragAndDrop"
  | "clickAndHold"
  | "fillFormVision"
  | "goto"
  | "navback"
  | "screenshot"
  | "scroll"
  | "keys";

/**
 * Shape of the scripted mock language model used by the timeout tests.
 *
 * `doGenerate` always resolves to a response containing tool-call content
 * with a "tool-calls" finish reason; `doStream` is typed as never resolving
 * with a value.
 * NOTE(review): the field set presumably mirrors the model interface the
 * agent runtime expects (specification version "v2") — confirm against the
 * SDK before changing it.
 */
type ToolTimeoutTestModel = {
  provider: string;
  modelId: string;
  specificationVersion: "v2";
  supportedUrls: Record<string, RegExp[]>;
  doGenerate: () => Promise<{
    content: Array<{
      type: "tool-call";
      toolCallId: string;
      toolName: string;
      // JSON-encoded tool arguments.
      input: string;
    }>;
    finishReason: "tool-calls";
    usage: { inputTokens: number; outputTokens: number; totalTokens: number };
    warnings: [];
  }>;
  doStream: (_options: unknown) => Promise<never>;
};

/** An `LLMClient` that additionally exposes the scripted mock `model`. */
type ToolTimeoutTestLLMClient = LLMClient & {
  model: ToolTimeoutTestModel;
};

/**
 * Builds a scripted LLM client for the agent toolTimeout tests.
 *
 * The embedded model's first `doGenerate` call asks the agent to invoke
 * `toolName` with `toolInput`; every later call asks for the "done" tool.
 * `createChatCompletion` answers with canned data chosen by the request's
 * `response_model.name`, always with zeroed usage.
 *
 * @param toolName  Tool the first model response should call.
 * @param toolInput Arguments for that tool; JSON-stringified into the call.
 * @returns The mock client, cast to `ToolTimeoutTestLLMClient`.
 */
function createToolTimeoutTestLlmClient(
  toolName: AgentToolNameWithTimeout,
  toolInput: Record<string, unknown>,
): ToolTimeoutTestLLMClient {
  type GenerateResult = Awaited<ReturnType<ToolTimeoutTestModel["doGenerate"]>>;

  // Shared by every chat-completion response.
  const zeroUsage = {
    prompt_tokens: 0,
    completion_tokens: 0,
    reasoning_tokens: 0,
    cached_input_tokens: 0,
    total_tokens: 0,
  };

  // Wraps a single tool call in the envelope `doGenerate` resolves to.
  const singleToolCall = (
    toolCallId: string,
    calledTool: string,
    args: Record<string, unknown>,
  ): GenerateResult => ({
    content: [
      {
        type: "tool-call",
        toolCallId,
        toolName: calledTool,
        input: JSON.stringify(args),
      },
    ],
    finishReason: "tool-calls",
    usage: { inputTokens: 0, outputTokens: 0, totalTokens: 0 },
    warnings: [],
  });

  let generateCalls = 0;

  const model: ToolTimeoutTestModel = {
    provider: "mock",
    modelId: "mock/tool-timeout-test",
    specificationVersion: "v2",
    supportedUrls: {},
    doGenerate: async () => {
      generateCalls += 1;
      // First turn: the tool under test. Afterwards: finish the task.
      return generateCalls === 1
        ? singleToolCall("tool-1", toolName, toolInput)
        : singleToolCall("done-1", "done", {
            reasoning: "done",
            taskComplete: true,
          });
    },
    doStream: async () => {
      throw new Error("doStream not implemented in timeout test model");
    },
  };

  return {
    type: "openai",
    modelName: "openai/gpt-4.1-mini",
    hasVision: false,
    clientOptions: {},
    model,
    getLanguageModel: () => model,
    generateText,
    createChatCompletion: async <T = unknown>(options: unknown): Promise<T> => {
      const request = options as {
        options?: { response_model?: { name?: string } };
      };

      let data: unknown;
      switch (request?.options?.response_model?.name) {
        case "act":
          data = {
            elementId: "1-0",
            description: "click body",
            method: "click",
            arguments: [],
            twoStep: false,
          };
          break;
        case "Observation":
          data = { elements: [] };
          break;
        case "Metadata":
          data = { completed: true, progress: "" };
          break;
        default:
          // "Extraction" and any unrecognized response model get empty data.
          data = {};
      }
      return { data, usage: zeroUsage } as T;
    },
  } as unknown as ToolTimeoutTestLLMClient;
}

/**
 * Looks up the recorded output of a tool call.
 *
 * Scans `stepEvents` in order, ignoring steps that lack either `toolCalls`
 * or `toolResults`. The first step whose calls include `toolName` decides
 * the result: the output of the tool result at the same index as the
 * matching call is returned (which may itself be `undefined`).
 *
 * @param stepEvents Recorded step events, oldest first.
 * @param toolName   Tool whose output is wanted.
 * @returns The matching output, or `undefined` when no step called the tool.
 */
function findToolOutput(
  stepEvents: Array<{
    toolCalls?: Array<{ toolName?: string }>;
    toolResults?: Array<{ output?: unknown }>;
  }>,
  toolName: string,
) {
  for (const { toolCalls, toolResults } of stepEvents) {
    if (toolCalls && toolResults) {
      const position = toolCalls
        .map((call) => call.toolName)
        .indexOf(toolName);
      if (position >= 0) {
        return toolResults[position]?.output;
      }
    }
  }
  return undefined;
}

/**
 * Runs one agent execution in which the scripted model calls `toolName`
 * once (with `toolInput`) under a 1ms `toolTimeout`, and returns what the
 * agent recorded as that tool's output.
 *
 * A dedicated V3 instance is created for the run and always closed
 * afterwards, whether or not the run succeeds.
 *
 * @param toolName  Tool the mock model should call on its first turn.
 * @param toolInput Arguments passed to that tool.
 * @param options   Optional agent mode ("dom" or "hybrid").
 * @returns `{ toolOutput }` with the captured output of the tool.
 * @throws Error when no truthy output was captured for the tool.
 */
async function runAgentToolTimeoutScenario(
  toolName: AgentToolNameWithTimeout,
  toolInput: Record<string, unknown>,
  options?: { mode?: "dom" | "hybrid" },
) {
  type RecordedStep = {
    toolCalls?: Array<{ toolName?: string }>;
    toolResults?: Array<{ output?: unknown }>;
  };
  const recordedSteps: RecordedStep[] = [];

  const stagehand = new V3({
    ...v3DynamicTestConfig,
    experimental: true,
    llmClient: createToolTimeoutTestLlmClient(toolName, toolInput),
  });
  await stagehand.init();

  try {
    const [page] = stagehand.context.pages();
    await page.goto("https://example.com");

    // Only forward `mode` when the caller actually chose one.
    const agent = stagehand.agent({
      ...(options?.mode ? { mode: options.mode } : {}),
    });

    await agent.execute({
      instruction: `Use ${toolName} and then finish`,
      maxSteps: 2,
      toolTimeout: 1,
      callbacks: {
        // Keep just the tool names and outputs of each finished step.
        onStepFinish: (event) => {
          const toolCalls = event.toolCalls?.map((call) => ({
            toolName: call.toolName,
          }));
          const toolResults = event.toolResults?.map((result) => ({
            output: result.output,
          }));
          recordedSteps.push({ toolCalls, toolResults });
        },
      },
    });

    const toolOutput = findToolOutput(recordedSteps, toolName);
    if (toolOutput) {
      return { toolOutput };
    }
    throw new Error(`No tool output captured for ${toolName}`);
  } finally {
    await closeV3(stagehand);
  }
}

test.describe("V3 hard timeouts", () => {
  let v3: V3;

  test.beforeEach(async () => {
    v3 = new V3(v3DynamicTestConfig);
    await v3.init();
  });

  test.afterEach(async () => {
    await closeV3(v3);
  });

  // Tiny budget so the race always lands on the timeout branch.
  const TINY_TIMEOUT_MS = 5;

  test("observe() enforces timeoutMs", async () => {
    const pending = v3.observe("find something", { timeout: TINY_TIMEOUT_MS });
    await expect(pending).rejects.toThrow(/timed out/i);
  });

  test("extract() enforces timeoutMs", async () => {
    const schema = z.object({ title: z.string().optional() });
    const pending = v3.extract("Extract title", schema, {
      timeout: TINY_TIMEOUT_MS,
    });
    await expect(pending).rejects.toThrow(/timed out/i);
  });

  test("act() enforces timeoutMs", async () => {
    const pending = v3.act("do nothing", { timeout: TINY_TIMEOUT_MS });
    await expect(pending).rejects.toThrow(/timed out/i);
  });

  // One entry per agent tool: the test title, the tool the mock model calls,
  // the arguments it passes, and (for vision tools) the agent mode.
  type AgentToolTimeoutCase = {
    title: string;
    toolName: AgentToolNameWithTimeout;
    toolInput: Record<string, unknown>;
    mode?: "dom" | "hybrid";
  };

  const agentToolTimeoutCases: AgentToolTimeoutCase[] = [
    {
      title: "agent toolTimeout enforces timeout for act tool",
      toolName: "act",
      toolInput: { action: "click somewhere" },
    },
    {
      title: "agent toolTimeout enforces timeout for extract tool",
      toolName: "extract",
      toolInput: {
        instruction: "extract the page title",
        schema: { type: "object", properties: { title: { type: "string" } } },
      },
    },
    {
      title: "agent toolTimeout enforces timeout for fillForm tool",
      toolName: "fillForm",
      toolInput: { fields: [{ action: "type hello into name" }] },
    },
    {
      title: "agent toolTimeout enforces timeout for ariaTree",
      toolName: "ariaTree",
      toolInput: {},
    },
    {
      title: "agent toolTimeout enforces timeout for goto tool",
      toolName: "goto",
      toolInput: { url: "https://example.com/slow" },
    },
    {
      title: "agent toolTimeout enforces timeout for navback tool",
      toolName: "navback",
      toolInput: { reasoningText: "going back" },
    },
    {
      title: "agent toolTimeout enforces timeout for screenshot tool",
      toolName: "screenshot",
      toolInput: {},
    },
    {
      title: "agent toolTimeout enforces timeout for scroll tool",
      toolName: "scroll",
      toolInput: { direction: "down" },
    },
    {
      title: "agent toolTimeout enforces timeout for keys tool",
      toolName: "keys",
      toolInput: { method: "press", value: "Enter" },
    },
    {
      title: "agent toolTimeout enforces timeout for click tool (hybrid)",
      toolName: "click",
      toolInput: { describe: "click element", coordinates: [100, 100] },
      mode: "hybrid",
    },
    {
      title: "agent toolTimeout enforces timeout for type tool (hybrid)",
      toolName: "type",
      toolInput: {
        describe: "type into field",
        text: "hello",
        coordinates: [100, 100],
      },
      mode: "hybrid",
    },
    {
      title: "agent toolTimeout enforces timeout for dragAndDrop tool (hybrid)",
      toolName: "dragAndDrop",
      toolInput: {
        describe: "drag element",
        startCoordinates: [100, 100],
        endCoordinates: [200, 200],
      },
      mode: "hybrid",
    },
    {
      title: "agent toolTimeout enforces timeout for clickAndHold tool (hybrid)",
      toolName: "clickAndHold",
      toolInput: {
        describe: "hold element",
        coordinates: [100, 100],
        duration: 1000,
      },
      mode: "hybrid",
    },
    {
      title:
        "agent toolTimeout enforces timeout for fillFormVision tool (hybrid)",
      toolName: "fillFormVision",
      toolInput: {
        fields: [
          {
            action: "type hello into name",
            value: "hello",
            coordinates: { x: 100, y: 100 },
          },
          {
            action: "type world into email",
            value: "world",
            coordinates: { x: 100, y: 200 },
          },
        ],
      },
      mode: "hybrid",
    },
  ];

  // Every tool must report a failed result that names the TimeoutError and
  // the 1ms budget set by the scenario runner.
  for (const { title, toolName, toolInput, mode } of agentToolTimeoutCases) {
    test(title, async () => {
      const { toolOutput } = await runAgentToolTimeoutScenario(
        toolName,
        toolInput,
        mode ? { mode } : undefined,
      );
      const output = toolOutput as { success: boolean; error: string };
      expect(output.success).toBe(false);
      expect(output.error).toContain("TimeoutError");
      expect(output.error).toContain("1ms");
    });
  }
});


================================================
FILE: packages/core/tests/integration/user-data-dir.spec.ts
================================================
import { test, expect } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import { v3TestConfig } from "./v3.config.js";
import * as fs from "fs";
import * as path from "path";
import * as os from "os";

test.describe("userDataDir persistence", () => {
  let stagehand: V3;
  let profileDir: string;

  // Each test gets its own throwaway directory under the OS temp dir.
  test.beforeEach(() => {
    const prefix = path.join(os.tmpdir(), "stagehand-userdata-test-");
    profileDir = fs.mkdtempSync(prefix);
  });

  // Best-effort shutdown, then remove the temp directory if it still exists.
  test.afterEach(async () => {
    await stagehand?.close?.().catch(() => {});
    const dirStillThere = Boolean(profileDir) && fs.existsSync(profileDir);
    if (dirStillThere) {
      fs.rmSync(profileDir, { recursive: true, force: true });
    }
  });

  test("Chrome uses the specified userDataDir", async () => {
    const target = (
      process.env.STAGEHAND_BROWSER_TARGET ?? "local"
    ).toLowerCase();
    test.skip(
      target === "browserbase",
      "Requires local Chromium for userDataDir checks",
    );

    // Layer the temp profile on top of whatever launch options the shared
    // config already carries.
    const inheritedLaunchOptions = v3TestConfig.localBrowserLaunchOptions ?? {};
    stagehand = new V3({
      ...v3TestConfig,
      localBrowserLaunchOptions: {
        ...inheritedLaunchOptions,
        userDataDir: profileDir,
        preserveUserDataDir: true,
      },
    });
    await stagehand.init();

    const [page] = stagehand.context.pages();
    await page.goto("about:blank");

    // Poll for the "Default" entry (up to 10s), then check "Local State".
    const defaultProfilePath = path.join(profileDir, "Default");
    await expect
      .poll(() => fs.existsSync(defaultProfilePath), { timeout: 10_000 })
      .toBe(true);

    const localStatePath = path.join(profileDir, "Local State");
    expect(fs.existsSync(localStatePath)).toBe(true);
  });
});


================================================
FILE: packages/core/tests/integration/v3.config.ts
================================================
import type { V3Options } from "../../lib/v3/types/public/options.js";
import {
  v3DynamicTestConfig,
  getV3DynamicTestConfig,
} from "./v3.dynamic.config.js";

/**
 * Default options for the integration suite. This is the very same object
 * as `v3DynamicTestConfig`, re-exported under a second name.
 */
export const v3TestConfig: V3Options = v3DynamicTestConfig;

/**
 * Returns integration-test options with `overrides` applied.
 *
 * Pure delegation to `getV3DynamicTestConfig`; see that function for how
 * the overrides are merged.
 *
 * @param overrides Options to apply on top of the defaults (defaults to none).
 * @returns The options produced by `getV3DynamicTestConfig(overrides)`.
 */
export function getV3TestConfig(overrides: Partial<V3Options> = {}): V3Options {
  return getV3DynamicTestConfig(overrides);
}

export default getV3TestConfig;


================================================
FILE: packages/core/tests/integration/v3.dynamic.config.ts
================================================
import type { V3Options } from "../../lib/v3/types/public/options.js";
import type { BrowserbaseSessionCreateParams } from "../../lib/v3/types/public/api.js";
import type { LogLine } from "../../lib/v3/types/public/logs.js";

type BrowserbaseRegion = BrowserbaseSessionCreateParams["region"];

// STAGEHAND_BROWSER_TARGET selects the backend; anything other than
// "browserbase" (case-insensitive) means a local browser.
const browserTarget = (
  process.env.STAGEHAND_BROWSER_TARGET ?? "local"
).toLowerCase();
const isBrowserbase = browserTarget === "browserbase";

// BROWSERBASE_REGION is honoured only when it names one of the listed
// regions; any other value is treated as "not set".
const browserbaseRegionRaw = process.env.BROWSERBASE_REGION;
const knownBrowserbaseRegions = [
  "us-west-2",
  "us-east-1",
  "eu-central-1",
  "ap-southeast-1",
] as BrowserbaseRegion[];
const browserbaseRegion = knownBrowserbaseRegions.find(
  (region) => region === browserbaseRegionRaw,
);

// Settings shared by both targets.
const baseConfig = {
  verbose: 0 as const,
  disablePino: true,
  logger: (line: LogLine) => console.log(line),
  disableAPI: true,
};

/** Options for running the suite against a Browserbase session. */
function browserbaseTestConfig(): V3Options {
  return {
    ...baseConfig,
    env: "BROWSERBASE",
    apiKey: process.env.BROWSERBASE_API_KEY!,
    projectId: process.env.BROWSERBASE_PROJECT_ID!,
    selfHeal: false,
    ...(browserbaseRegion
      ? { browserbaseSessionCreateParams: { region: browserbaseRegion } }
      : {}),
  };
}

/** Options for running the suite against a locally launched headless browser. */
function localTestConfig(): V3Options {
  return {
    ...baseConfig,
    env: "LOCAL",
    localBrowserLaunchOptions: {
      executablePath: process.env.CHROME_PATH,
      // --no-sandbox is only passed when the CI env var is set.
      args: process.env.CI ? ["--no-sandbox"] : undefined,
      headless: true,
      viewport: { width: 1288, height: 711 },
    },
  };
}

export const v3DynamicTestConfig: V3Options = isBrowserbase
  ? browserbaseTestConfig()
  : localTestConfig();

/**
 * Returns a copy of `v3DynamicTestConfig` with `overrides` applied on top.
 *
 * The merge is shallow: each top-level key present in `overrides` replaces
 * the default wholesale. Overriding a nested object (for example
 * `localBrowserLaunchOptions`) therefore drops the default's nested fields
 * unless the caller spreads them in explicitly.
 *
 * @param overrides Top-level options to replace (defaults to none).
 * @returns A new options object; `v3DynamicTestConfig` itself is not mutated.
 */
export function getV3DynamicTestConfig(
  overrides: Partial<V3Options> = {},
): V3Options {
  return { ...v3DynamicTestConfig, ...overrides };
}

export default getV3DynamicTestConfig;


================================================
FILE: packages/core/tests/integration/v3.playwright.config.ts
================================================
import { defineConfig, type ReporterDescription } from "@playwright/test";
import { getPackageRootDir } from "../../lib/v3/runtimePaths.js";
const coreDir = getPackageRootDir();
// Specs are run from the compiled ESM output, not from the TypeScript sources.
const testDir = `${coreDir}/dist/esm/tests/integration`;

const isBrowserbase =
  (process.env.STAGEHAND_BROWSER_TARGET ?? "local").toLowerCase() ===
  "browserbase";
const consoleReporter = process.env.PLAYWRIGHT_CONSOLE_REPORTER ?? "list";
const runningInCi = Boolean(process.env.CI);

/**
 * Converts an env value to a number, yielding `undefined` unless the result
 * is finite and greater than zero (so unset, empty and non-numeric values
 * all fall through to the caller's default).
 */
function positiveNumberFrom(raw: string | undefined): number | undefined {
  const parsed = Number(raw);
  return Number.isFinite(parsed) && parsed > 0 ? parsed : undefined;
}

// Local runs: explicit override wins; otherwise 3 workers in CI, 5 elsewhere.
const localWorkers =
  positiveNumberFrom(process.env.LOCAL_SESSION_LIMIT_PER_E2E_TEST) ??
  (runningInCi ? 3 : 5);

// Browserbase runs: the override is only honoured in CI; otherwise 3 workers.
const bbWorkers =
  (runningInCi
    ? positiveNumberFrom(process.env.BROWSERBASE_SESSION_LIMIT_PER_E2E_TEST)
    : undefined) ?? 3;

// Always report to the console; add a JUnit file when CTRF_JUNIT_PATH is set.
const ctrfJunitPath = process.env.CTRF_JUNIT_PATH;
const reporter: ReporterDescription[] = [
  [consoleReporter] as ReporterDescription,
];
if (ctrfJunitPath) {
  reporter.push([
    "junit",
    { outputFile: ctrfJunitPath, includeProjectInTestName: true },
  ] as ReporterDescription);
}

export default defineConfig({
  testDir,
  timeout: 90_000,
  expect: { timeout: 10_000 },
  retries: runningInCi ? 1 : 0,
  workers: isBrowserbase ? bbWorkers : localWorkers,
  fullyParallel: true,
  projects: [
    {
      name: isBrowserbase ? "e2e-bb" : "e2e-local",
    },
  ],
  reporter,
  use: {
    // we're not launching Playwright browsers in these tests; we connect via Puppeteer/CDP to V3.
    headless: false,
  },
});


================================================
FILE: packages/core/tests/integration/wait-for-selector.spec.ts
================================================
import { expect, test } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import { v3DynamicTestConfig } from "./v3.dynamic.config.js";
import { closeV3 } from "./testUtils.js";

test.describe.configure({ mode: "serial" });
test.describe("Page.waitForSelector tests", () => {
  let v3: V3;

  // One V3 instance is shared by the whole (serial) suite.
  test.beforeAll(async () => {
    v3 = new V3(v3DynamicTestConfig);
    await v3.init();
  });

  // Reset to a single blank page before every test.
  test.beforeEach(async () => {
    const openPages = v3.context.pages();
    const primary = openPages[0];

    if (!primary) {
      // Nothing is open: a fresh blank page is all that is needed.
      await v3.context.newPage("about:blank");
      return;
    }

    // Close everything except the first page, ignoring close failures.
    for (const extra of openPages.slice(1)) {
      await extra.close().catch(() => {});
    }

    v3.context.setActivePage(primary);
    await primary.goto("about:blank", {
      waitUntil: "load",
      timeoutMs: 15_000,
    });
  });

  test.afterAll(async () => {
    await closeV3(v3);
  });

  test.describe("Basic state tests", () => {
    // Loads `markup` into the first page through a data: URL and returns the page.
    const openMarkup = async (markup: string) => {
      const page = v3.context.pages()[0];
      await page.goto("data:text/html," + encodeURIComponent(markup));
      return page;
    };

    test("resolves when element is already visible", async () => {
      const page = await openMarkup('<button id="submit-btn">Submit</button>');

      expect(await page.waitForSelector("#submit-btn")).toBe(true);
    });

    test("resolves when element appears after delay", async () => {
      // The button is appended by a 300ms timer.
      const markup = [
        "<div id='container'></div>",
        "<script>",
        "setTimeout(() => {",
        "  const btn = document.createElement('button');",
        "  btn.id = 'delayed-btn';",
        "  btn.textContent = 'Delayed Button';",
        "  document.getElementById('container').appendChild(btn);",
        "}, 300);",
        "</script>",
      ].join("");
      const page = await openMarkup(markup);

      const appeared = await page.waitForSelector("#delayed-btn", {
        timeout: 5000,
      });
      expect(appeared).toBe(true);
    });

    test("state 'attached' resolves for hidden elements", async () => {
      const page = await openMarkup(
        '<div id="hidden-div" style="display: none;">Hidden Content</div>',
      );

      const attached = await page.waitForSelector("#hidden-div", {
        state: "attached",
      });
      expect(attached).toBe(true);
    });

    test("state 'visible' waits for element to become visible", async () => {
      // Starts as display:none and is switched to display:block after 300ms.
      const markup = [
        '<div id="show-later" style="display: none;">Now Visible</div>',
        "<script>",
        "setTimeout(() => {",
        "  document.getElementById('show-later').style.display = 'block';",
        "}, 300);",
        "</script>",
      ].join("");
      const page = await openMarkup(markup);

      const becameVisible = await page.waitForSelector("#show-later", {
        state: "visible",
        timeout: 5000,
      });
      expect(becameVisible).toBe(true);
    });

    test("state 'hidden' waits for element to become hidden", async () => {
      // Starts visible and is switched to display:none after 300ms.
      const markup = [
        '<div id="hide-later" style="display: block;">Will Hide</div>',
        "<script>",
        "setTimeout(() => {",
        "  document.getElementById('hide-later').style.display = 'none';",
        "}, 300);",
        "</script>",
      ].join("");
      const page = await openMarkup(markup);

      const becameHidden = await page.waitForSelector("#hide-later", {
        state: "hidden",
        timeout: 5000,
      });
      expect(becameHidden).toBe(true);
    });

    test("state 'detached' waits for element to be removed", async () => {
      // The element removes itself from its parent after 300ms.
      const markup = [
        '<div id="remove-me">Will Be Removed</div>',
        "<script>",
        "setTimeout(() => {",
        "  const el = document.getElementById('remove-me');",
        "  el.parentNode.removeChild(el);",
        "}, 300);",
        "</script>",
      ].join("");
      const page = await openMarkup(markup);

      const wasRemoved = await page.waitForSelector("#remove-me", {
        state: "detached",
        timeout: 5000,
      });
      expect(wasRemoved).toBe(true);
    });

    test("state 'detached' resolves immediately for non-existent element", async () => {
      const page = await openMarkup("<div>Content</div>");

      const neverPresent = await page.waitForSelector("#does-not-exist", {
        state: "detached",
        timeout: 1000,
      });
      expect(neverPresent).toBe(true);
    });
  });

  test.describe("Timeout behavior", () => {
    // Loads `markup` into the first page through a data: URL and returns the page.
    const openMarkup = async (markup: string) => {
      const page = v3.context.pages()[0];
      await page.goto("data:text/html," + encodeURIComponent(markup));
      return page;
    };

    // Runs `wait` and reports what it threw, or null when it completed.
    const captureFailure = async (
      wait: () => Promise<unknown>,
    ): Promise<Error | null> => {
      try {
        await wait();
        return null;
      } catch (e) {
        return e as Error;
      }
    };

    test("throws on timeout when element never appears", async () => {
      const page = await openMarkup("<div>No button here</div>");

      const error = await captureFailure(() =>
        page.waitForSelector("#nonexistent", { timeout: 300 }),
      );

      // The message must mention both the timeout and the selector waited on.
      expect(error).not.toBeNull();
      expect(error?.message).toContain("Timeout");
      expect(error?.message).toContain("#nonexistent");
    });

    test("respects custom timeout duration", async () => {
      const page = await openMarkup("<div>Content</div>");

      const startedAt = Date.now();
      // The wait is expected to time out; only the elapsed time matters here.
      await captureFailure(() =>
        page.waitForSelector("#nonexistent", { timeout: 500 }),
      );
      const elapsed = Date.now() - startedAt;

      // Should timeout around 500ms (allow some margin)
      expect(elapsed).toBeGreaterThanOrEqual(450);
      expect(elapsed).toBeLessThan(2000);
    });
  });

  test.describe("CSS selector variants", () => {
    test("handles complex CSS selectors", async () => {
      // A submit button nested in a form nested in a container.
      const markup = [
        '<div class="container">',
        '<form id="login-form">',
        '<button type="submit">Login</button>',
        "</form>",
        "</div>",
      ].join("");
      const [page] = v3.context.pages();
      await page.goto("data:text/html," + encodeURIComponent(markup));

      // Descendant combinators plus an attribute selector in one expression.
      const selector = ".container #login-form button[type='submit']";
      expect(await page.waitForSelector(selector)).toBe(true);
    });
  });

  test.describe("Open shadow DOM", () => {
    // Loads `markup` through a data: URL, waits for "load", pauses 100ms,
    // then returns the page.
    const openMarkup = async (markup: string) => {
      const page = v3.context.pages()[0];
      await page.goto("data:text/html," + encodeURIComponent(markup), {
        waitUntil: "load",
        timeoutMs: 30000,
      });
      await page.waitForTimeout(100);
      return page;
    };

    test("finds element inside open shadow DOM with pierceShadow: true", async () => {
      const markup = [
        '<div id="host"></div>',
        "<script>",
        'const host = document.getElementById("host");',
        'const shadow = host.attachShadow({mode: "open"});',
        'shadow.innerHTML = "<button id=\\"shadow-btn\\">Shadow Button</button>";',
        "</script>",
      ].join("");
      const page = await openMarkup(markup);

      const found = await page.waitForSelector("#shadow-btn", {
        pierceShadow: true,
        timeout: 5000,
      });
      expect(found).toBe(true);
    });

    test("does NOT find shadow DOM element with pierceShadow: false", async () => {
      const markup = [
        '<div id="host"></div>',
        "<script>",
        'const host = document.getElementById("host");',
        'const shadow = host.attachShadow({mode: "open"});',
        'shadow.innerHTML = "<button id=\\"shadow-only-btn\\">Shadow Only</button>";',
        "</script>",
      ].join("");
      const page = await openMarkup(markup);

      // Without piercing, the wait is expected to fail with a timeout.
      let failure: Error | null = null;
      await page
        .waitForSelector("#shadow-only-btn", {
          pierceShadow: false,
          timeout: 300,
        })
        .catch((e) => {
          failure = e as Error;
        });

      expect(failure).not.toBeNull();
      expect((failure as Error | null)?.message).toContain("Timeout");
    });

    test("finds element in nested open shadow DOM", async () => {
      // An open shadow root whose content hosts a second open shadow root.
      const markup = [
        '<div id="outer-host"></div>',
        "<script>",
        'const outerHost = document.getElementById("outer-host");',
        'const outerShadow = outerHost.attachShadow({mode: "open"});',
        'outerShadow.innerHTML = "<div id=\\"inner-host\\"></div>";',
        'const innerHost = outerShadow.getElementById("inner-host");',
        'const innerShadow = innerHost.attachShadow({mode: "open"});',
        'innerShadow.innerHTML = "<span id=\\"deep-element\\">Deep!</span>";',
        "</script>",
      ].join("");
      const page = await openMarkup(markup);

      const found = await page.waitForSelector("#deep-element", {
        pierceShadow: true,
        timeout: 5000,
      });
      expect(found).toBe(true);
    });
  });

  test.describe("Closed shadow DOM (via piercer)", () => {
    test("finds element inside closed shadow DOM via custom element", async () => {
      const page = v3.context.pages()[0];
      await page.goto(
        "data:text/html," +
          encodeURIComponent(
            "<closed-shadow-host></closed-shadow-host>" +
              "<script>" +
              "class ClosedShadowHost extends HTMLElement {" +
              "  constructor() {" +
              "    super();" +
              '    const shadow = this.attachShadow({mode: "closed"});' +
              '    shadow.innerHTML = "<button id=\\"closed-btn\\">Closed Shadow Button</button>";' +
              "  }" +
              "}" +
              "customElements.define('closed-shadow-host', ClosedShadowHost);" +
              "</script>",
          ),
        { waitUntil: "load", timeoutMs: 30000 },
      );
      await page.waitForTimeout(100);

      // The piercer hooks attachShadow and stores closed shadow roots
      const result = await page.waitForSelector("#closed-btn", {
        pierceShadow: true,
        timeout: 5000,
      });
      expect(result).toBe(true);
    });

    test("finds element in nested closed shadow DOM", async () => {
      const page = v3.context.pages()[0];
      await page.goto(
        "data:text/html," +
          encodeURIComponent(
            "<outer-closed></outer-closed>" +
              "<script>" +
              "class InnerClosed extends HTMLElement {" +
              "  constructor() {" +
              "    super();" +
              '    const shadow = this.attachShadow({mode: "closed"});' +
              '    shadow.innerHTML = "<span id=\\"deeply-closed\\">Deeply Nested Closed</span>";' +
              "  }" +
              "}" +
              "customElements.define('inner-closed', InnerClosed);" +
              "" +
              "class OuterClosed extends HTMLElement {" +
              "  constructor() {" +
              "    super();" +
              '    const shadow = this.attachShadow({mode: "closed"});' +
              '    shadow.innerHTML = "<inner-closed></inner-closed>";' +
              "  }" +
              "}" +
              "customElements.define('outer-closed', OuterClosed);" +
              "</script>",
          ),
        { waitUntil: "load", timeoutMs: 30000 },
      );
      await page.waitForTimeout(100);

      const result = await page.waitForSelector("#deeply-closed", {
        pierceShadow: true,
        timeout: 5000,
      });
      expect(result).toBe(true);
    });

    test("finds element in mixed open/closed nested shadow DOM", async () => {
      // Fixture: #open-host receives an open shadow root containing a
      // <closed-inner> custom element, which in turn attaches a closed shadow
      // root holding the #mixed-deep-btn button.
      const markup =
        '<div id="open-host"></div>' +
        "<script>" +
        // Closed inner component.
        "class ClosedInner extends HTMLElement {" +
        "  constructor() {" +
        "    super();" +
        '    const shadow = this.attachShadow({mode: "closed"});' +
        '    shadow.innerHTML = "<button id=\\"mixed-deep-btn\\">Mixed Deep Button</button>";' +
        "  }" +
        "}" +
        "customElements.define('closed-inner', ClosedInner);" +
        // Open outer shadow root that hosts the closed component.
        'const openHost = document.getElementById("open-host");' +
        'const openShadow = openHost.attachShadow({mode: "open"});' +
        'openShadow.innerHTML = "<closed-inner></closed-inner>";' +
        "</script>";

      const [page] = v3.context.pages();
      await page.goto("data:text/html," + encodeURIComponent(markup), {
        waitUntil: "load",
        timeoutMs: 30000,
      });
      // Fixed 100ms pause between load and the selector wait.
      await page.waitForTimeout(100);

      const found = await page.waitForSelector("#mixed-deep-btn", {
        pierceShadow: true,
        timeout: 5000,
      });
      expect(found).toBe(true);
    });

    test("waits for element to appear inside closed shadow DOM", async () => {
      // Fixture: <delayed-closed-host> attaches a closed shadow root with an
      // empty #container and injects #delayed-closed-btn into it after 300ms.
      const markup =
        "<delayed-closed-host></delayed-closed-host>" +
        "<script>" +
        "class DelayedClosedHost extends HTMLElement {" +
        "  constructor() {" +
        "    super();" +
        '    const shadow = this.attachShadow({mode: "closed"});' +
        '    shadow.innerHTML = "<div id=\\"container\\"></div>";' +
        "    setTimeout(() => {" +
        '      shadow.getElementById("container").innerHTML = ' +
        '        "<button id=\\"delayed-closed-btn\\">Appeared!</button>";' +
        "    }, 300);" +
        "  }" +
        "}" +
        "customElements.define('delayed-closed-host', DelayedClosedHost);" +
        "</script>";

      const [page] = v3.context.pages();
      await page.goto("data:text/html," + encodeURIComponent(markup), {
        waitUntil: "load",
        timeoutMs: 30000,
      });

      // No extra pause: the wait begins as soon as goto resolves.
      const found = await page.waitForSelector("#delayed-closed-btn", {
        pierceShadow: true,
        timeout: 5000,
      });
      expect(found).toBe(true);
    });
  });

  test.describe("XPath selectors", () => {
    // Wraps an inline HTML fixture in a data: URL for page.goto.
    const toDataUrl = (html: string): string =>
      "data:text/html," + encodeURIComponent(html);

    test("finds element with basic XPath", async () => {
      const [page] = v3.context.pages();
      await page.goto(
        toDataUrl('<button id="xpath-btn">XPath Button</button>'),
      );

      const found = await page.waitForSelector("//button[@id='xpath-btn']", {
        timeout: 5000,
      });
      expect(found).toBe(true);
    });

    test("finds element with xpath= prefix", async () => {
      const [page] = v3.context.pages();
      await page.goto(
        toDataUrl(
          '<div id="container"><span class="target">Target</span></div>',
        ),
      );

      // Same lookup style as above, but with the explicit "xpath=" prefix.
      const selector = "xpath=//span[@class='target']";
      const found = await page.waitForSelector(selector, { timeout: 5000 });
      expect(found).toBe(true);
    });

    test("waits for element to appear with XPath", async () => {
      // The span is injected into #container by a 300ms timer.
      const markup =
        "<div id='container'></div>" +
        "<script>" +
        "setTimeout(() => {" +
        '  document.getElementById("container").innerHTML = ' +
        '    "<span id=\\"delayed-xpath\\">Delayed XPath</span>";' +
        "}, 300);" +
        "</script>";

      const [page] = v3.context.pages();
      await page.goto(toDataUrl(markup));

      const found = await page.waitForSelector("//span[@id='delayed-xpath']", {
        timeout: 5000,
      });
      expect(found).toBe(true);
    });

    test("finds element in open shadow DOM with XPath", async () => {
      // The button lives inside an open shadow root attached to #host.
      const markup =
        '<div id="host"></div>' +
        "<script>" +
        'const host = document.getElementById("host");' +
        'const shadow = host.attachShadow({mode: "open"});' +
        'shadow.innerHTML = "<button id=\\"shadow-xpath-btn\\">Shadow XPath</button>";' +
        "</script>";

      const [page] = v3.context.pages();
      await page.goto(toDataUrl(markup), {
        waitUntil: "load",
        timeoutMs: 30000,
      });
      await page.waitForTimeout(100);

      const selector = "//button[@id='shadow-xpath-btn']";
      const found = await page.waitForSelector(selector, {
        pierceShadow: true,
        timeout: 5000,
      });
      expect(found).toBe(true);
    });

    test("finds element in closed shadow DOM with XPath", async () => {
      // The span lives inside a closed shadow root created by a custom element.
      const markup =
        "<xpath-closed-host></xpath-closed-host>" +
        "<script>" +
        "class XPathClosedHost extends HTMLElement {" +
        "  constructor() {" +
        "    super();" +
        '    const shadow = this.attachShadow({mode: "closed"});' +
        '    shadow.innerHTML = "<span id=\\"xpath-closed-target\\">Closed XPath Target</span>";' +
        "  }" +
        "}" +
        "customElements.define('xpath-closed-host', XPathClosedHost);" +
        "</script>";

      const [page] = v3.context.pages();
      await page.goto(toDataUrl(markup), {
        waitUntil: "load",
        timeoutMs: 30000,
      });
      await page.waitForTimeout(100);

      const selector = "//span[@id='xpath-closed-target']";
      const found = await page.waitForSelector(selector, {
        pierceShadow: true,
        timeout: 5000,
      });
      expect(found).toBe(true);
    });
  });

  test.describe("Iframe hop notation (>>)", () => {
    // Wraps an inline HTML fixture in a data: URL for page.goto.
    const toDataUrl = (html: string): string =>
      "data:text/html," + encodeURIComponent(html);

    test("finds element inside single iframe", async () => {
      // The parent document writes a button into #my-frame's document.
      const markup =
        '<button id="main-btn">Main Button</button>' +
        '<iframe id="my-frame"></iframe>' +
        "<script>" +
        'const frame = document.getElementById("my-frame");' +
        "const doc = frame.contentDocument;" +
        "doc.open();" +
        'doc.write("<button id=\\"frame-btn\\">Frame Button</button>");' +
        "doc.close();" +
        "</script>";

      const [page] = v3.context.pages();
      await page.goto(toDataUrl(markup));
      await page.waitForTimeout(100);

      const selector = "iframe#my-frame >> #frame-btn";
      const found = await page.waitForSelector(selector, { timeout: 5000 });
      expect(found).toBe(true);
    });

    test("finds element through multiple iframe hops", async () => {
      // #outer-frame gets an #inner-frame written into it; 100ms later the
      // inner frame's document receives the #nested-content div.
      const markup =
        '<iframe id="outer-frame"></iframe>' +
        "<script>" +
        'const outerFrame = document.getElementById("outer-frame");' +
        "const outerDoc = outerFrame.contentDocument;" +
        "outerDoc.open();" +
        'outerDoc.write("<iframe id=\\"inner-frame\\"></iframe>");' +
        "outerDoc.close();" +
        "setTimeout(() => {" +
        '  const innerFrame = outerDoc.getElementById("inner-frame");' +
        "  const innerDoc = innerFrame.contentDocument;" +
        "  innerDoc.open();" +
        '  innerDoc.write("<div id=\\"nested-content\\">Deeply Nested</div>");' +
        "  innerDoc.close();" +
        "}, 100);" +
        "</script>";

      const [page] = v3.context.pages();
      await page.goto(toDataUrl(markup));
      await page.waitForTimeout(300);

      const selector =
        "iframe#outer-frame >> iframe#inner-frame >> #nested-content";
      const found = await page.waitForSelector(selector, { timeout: 5000 });
      expect(found).toBe(true);
    });

    test("waits for element to appear inside iframe", async () => {
      // The frame starts with an empty #container; the span is added to it by
      // a 300ms timer running in the parent document.
      const markup =
        '<iframe id="delay-frame"></iframe>' +
        "<script>" +
        'const frame = document.getElementById("delay-frame");' +
        "const doc = frame.contentDocument;" +
        "doc.open();" +
        'doc.write("<div id=\\"container\\"></div>");' +
        "doc.close();" +
        "setTimeout(() => {" +
        '  doc.getElementById("container").innerHTML = ' +
        '    "<span id=\\"delayed-in-frame\\">Appeared!</span>";' +
        "}, 300);" +
        "</script>";

      const [page] = v3.context.pages();
      await page.goto(toDataUrl(markup));

      const selector = "iframe#delay-frame >> #delayed-in-frame";
      const found = await page.waitForSelector(selector, { timeout: 5000 });
      expect(found).toBe(true);
    });
  });

  test.describe("Visibility edge cases", () => {
    type TestPage = ReturnType<typeof v3.context.pages>[number];

    // Wraps an inline HTML fixture in a data: URL for page.goto.
    const toDataUrl = (html: string): string =>
      "data:text/html," + encodeURIComponent(html);

    // Waits 200ms for `selector` to become visible and reports the outcome:
    // the thrown value when the wait rejects, null when it resolves.
    const visibleWaitFailure = async (
      page: TestPage,
      selector: string,
    ): Promise<Error | null> => {
      try {
        await page.waitForSelector(selector, {
          state: "visible",
          timeout: 200,
        });
      } catch (e) {
        return e as Error;
      }
      return null;
    };

    test("visibility: hidden is not visible", async () => {
      const [page] = v3.context.pages();
      await page.goto(
        toDataUrl(
          '<div id="vis-hidden" style="visibility: hidden;">Hidden</div>',
        ),
      );

      // The element is in the DOM, so the "attached" wait succeeds...
      const isAttached = await page.waitForSelector("#vis-hidden", {
        state: "attached",
      });
      expect(isAttached).toBe(true);

      // ...but the "visible" wait has to fail.
      const failure = await visibleWaitFailure(page, "#vis-hidden");
      expect(failure).not.toBeNull();
    });

    test("opacity: 0 is not visible", async () => {
      const [page] = v3.context.pages();
      await page.goto(
        toDataUrl('<div id="transparent" style="opacity: 0;">Transparent</div>'),
      );

      const isAttached = await page.waitForSelector("#transparent", {
        state: "attached",
      });
      expect(isAttached).toBe(true);

      const failure = await visibleWaitFailure(page, "#transparent");
      expect(failure).not.toBeNull();
    });

    test("zero dimensions is not visible", async () => {
      const [page] = v3.context.pages();
      await page.goto(
        toDataUrl('<div id="zero-size" style="width: 0; height: 0;">Zero</div>'),
      );

      const isAttached = await page.waitForSelector("#zero-size", {
        state: "attached",
      });
      expect(isAttached).toBe(true);

      const failure = await visibleWaitFailure(page, "#zero-size");
      expect(failure).not.toBeNull();
    });

    test("detects visibility change via class toggle", async () => {
      // The element starts with display:none via .hidden; the class is removed
      // by a 300ms timer.
      const markup =
        "<style>.hidden { display: none; }</style>" +
        '<div id="class-toggle" class="hidden">Class Toggle</div>' +
        "<script>" +
        "setTimeout(() => {" +
        "  document.getElementById('class-toggle').classList.remove('hidden');" +
        "}, 300);" +
        "</script>";

      const [page] = v3.context.pages();
      await page.goto(toDataUrl(markup));

      const becameVisible = await page.waitForSelector("#class-toggle", {
        state: "visible",
        timeout: 5000,
      });
      expect(becameVisible).toBe(true);
    });

    test("detects visibility change via style attribute", async () => {
      // The element starts with an inline display:none; a 300ms timer switches
      // it to display:block.
      const markup =
        '<div id="style-toggle" style="display: none;">Style Toggle</div>' +
        "<script>" +
        "setTimeout(() => {" +
        "  document.getElementById('style-toggle').style.display = 'block';" +
        "}, 300);" +
        "</script>";

      const [page] = v3.context.pages();
      await page.goto(toDataUrl(markup));

      const becameVisible = await page.waitForSelector("#style-toggle", {
        state: "visible",
        timeout: 5000,
      });
      expect(becameVisible).toBe(true);
    });
  });

  test.describe("Dynamic DOM scenarios", () => {
    // Wraps an inline HTML fixture in a data: URL for page.goto.
    const toDataUrl = (html: string): string =>
      "data:text/html," + encodeURIComponent(html);

    test("handles rapid DOM mutations", async () => {
      // Every 50ms a new #item-N div is appended, stopping after ten items.
      const markup =
        "<div id='container'></div>" +
        "<script>" +
        "let count = 0;" +
        "const interval = setInterval(() => {" +
        "  count++;" +
        "  const div = document.createElement('div');" +
        "  div.id = 'item-' + count;" +
        "  div.textContent = 'item';" +
        "  document.getElementById('container').appendChild(div);" +
        "  if (count >= 10) clearInterval(interval);" +
        "}, 50);" +
        "</script>";

      const [page] = v3.context.pages();
      await page.goto(toDataUrl(markup), {
        waitUntil: "load",
        timeoutMs: 30000,
      });
      // Brief pause so the page script has started before waiting.
      await page.waitForTimeout(50);

      const found = await page.waitForSelector("#item-7", { timeout: 10000 });
      expect(found).toBe(true);
    });

    test("handles element removed and re-added", async () => {
      const [page] = v3.context.pages();
      await page.goto(toDataUrl('<div id="toggle-me">Toggle</div>'));

      // Runs against Browserbase use longer delays and a longer wait timeout
      // than local runs.
      const target = (
        process.env.STAGEHAND_BROWSER_TARGET ?? "local"
      ).toLowerCase();
      const timing =
        target === "browserbase"
          ? { removeDelay: 1000, addDelay: 1600, waitTimeout: 10000 }
          : { removeDelay: 200, addDelay: 500, waitTimeout: 5000 };

      // The detached wait is started first, and only then are the DOM changes
      // scheduled, so the removal cannot slip in before the wait is running.
      const pendingDetach = page.waitForSelector("#toggle-me", {
        state: "detached",
        timeout: timing.waitTimeout,
      });
      await page.evaluate(
        ({ removeDelay, addDelay }) => {
          const node = document.getElementById("toggle-me");
          const container = node?.parentNode;
          if (!node || !container) return;
          setTimeout(() => container.removeChild(node), removeDelay);
          setTimeout(() => container.appendChild(node), addDelay);
        },
        { removeDelay: timing.removeDelay, addDelay: timing.addDelay },
      );

      expect(await pendingDetach).toBe(true);

      // Once re-appended, the element has to be reported visible again.
      const visibleAgain = await page.waitForSelector("#toggle-me", {
        state: "visible",
        timeout: timing.waitTimeout,
      });
      expect(visibleAgain).toBe(true);
    });

    test("handles dynamically replaced innerHTML", async () => {
      // #container's "Loading..." text is swapped for the button after 300ms.
      const markup =
        '<div id="container">Loading...</div>' +
        "<script>" +
        "setTimeout(() => {" +
        '  document.getElementById("container").innerHTML = ' +
        '    "<button id=\\"loaded-btn\\">Loaded!</button>";' +
        "}, 300);" +
        "</script>";

      const [page] = v3.context.pages();
      await page.goto(toDataUrl(markup));

      const found = await page.waitForSelector("#loaded-btn", {
        timeout: 5000,
      });
      expect(found).toBe(true);
    });

    test("handles element created via insertAdjacentHTML", async () => {
      // #inserted is added as a sibling after #anchor by a 300ms timer.
      const markup =
        '<div id="anchor"></div>' +
        "<script>" +
        "setTimeout(() => {" +
        '  document.getElementById("anchor").insertAdjacentHTML(' +
        '    "afterend", "<div id=\\"inserted\\">Inserted</div>"' +
        "  );" +
        "}, 300);" +
        "</script>";

      const [page] = v3.context.pages();
      await page.goto(toDataUrl(markup));

      const found = await page.waitForSelector("#inserted", { timeout: 5000 });
      expect(found).toBe(true);
    });
  });

  test.describe("Shadow DOM visibility changes", () => {
    // Wraps an inline HTML fixture in a data: URL for page.goto.
    const toDataUrl = (html: string): string =>
      "data:text/html," + encodeURIComponent(html);

    test("detects element becoming visible inside open shadow DOM", async () => {
      // The shadow button starts with display:none and is switched to
      // display:block by a 300ms timer.
      const markup =
        '<div id="host"></div>' +
        "<script>" +
        'const host = document.getElementById("host");' +
        'const shadow = host.attachShadow({mode: "open"});' +
        'shadow.innerHTML = "<button id=\\"shadow-btn\\" style=\\"display:none\\">Shadow</button>";' +
        "setTimeout(() => {" +
        '  shadow.getElementById("shadow-btn").style.display = "block";' +
        "}, 300);" +
        "</script>";

      const [page] = v3.context.pages();
      await page.goto(toDataUrl(markup), {
        waitUntil: "load",
        timeoutMs: 30000,
      });

      const becameVisible = await page.waitForSelector("#shadow-btn", {
        state: "visible",
        pierceShadow: true,
        timeout: 5000,
      });
      expect(becameVisible).toBe(true);
    });

    test("detects element becoming hidden inside shadow DOM", async () => {
      // The shadow button starts visible and gets display:none after 300ms.
      const markup =
        '<div id="host"></div>' +
        "<script>" +
        'const host = document.getElementById("host");' +
        'const shadow = host.attachShadow({mode: "open"});' +
        'shadow.innerHTML = "<button id=\\"hide-shadow-btn\\">Will Hide</button>";' +
        "setTimeout(() => {" +
        '  shadow.getElementById("hide-shadow-btn").style.display = "none";' +
        "}, 300);" +
        "</script>";

      const [page] = v3.context.pages();
      await page.goto(toDataUrl(markup), {
        waitUntil: "load",
        timeoutMs: 30000,
      });
      await page.waitForTimeout(100);

      const becameHidden = await page.waitForSelector("#hide-shadow-btn", {
        state: "hidden",
        pierceShadow: true,
        timeout: 5000,
      });
      expect(becameHidden).toBe(true);
    });
  });
});


================================================
FILE: packages/core/tests/integration/wait-for-timeout.spec.ts
================================================
import { expect, test } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import { v3DynamicTestConfig } from "./v3.dynamic.config.js";
import { closeV3 } from "./testUtils.js";

// Integration tests for Page.waitForTimeout. Every test gets a fresh V3
// instance (created in beforeEach, closed in afterEach) and drives the first
// page of its context against small inline data: URL fixtures.
test.describe("Page.waitForTimeout tests", () => {
  let v3: V3;

  test.beforeEach(async () => {
    v3 = new V3(v3DynamicTestConfig);
    await v3.init();
  });

  test.afterEach(async () => {
    await closeV3(v3);
  });

  test("waitForTimeout resolves after specified duration", async () => {
    const page = v3.context.pages()[0];

    await page.goto(
      "data:text/html," + encodeURIComponent("<div>Test Page</div>"),
    );

    const startTime = Date.now();
    await page.waitForTimeout(200);
    const elapsed = Date.now() - startTime;

    // Should have waited at least 200ms (10ms of tolerance for timer jitter)
    expect(elapsed).toBeGreaterThanOrEqual(190);
  });

  test("waitForTimeout resolves immediately for 0ms", async () => {
    const page = v3.context.pages()[0];

    await page.goto(
      "data:text/html," + encodeURIComponent("<div>Test Page</div>"),
    );

    const startTime = Date.now();
    await page.waitForTimeout(0);
    const elapsed = Date.now() - startTime;

    // Should resolve nearly immediately (within 50ms tolerance)
    expect(elapsed).toBeLessThan(50);
  });

  test("waitForTimeout can be chained with other operations", async () => {
    const page = v3.context.pages()[0];

    // The page bumps the #counter text once every 100ms.
    await page.goto(
      "data:text/html," +
        encodeURIComponent(
          "<div id='counter'>0</div>" +
            "<script>" +
            "let count = 0;" +
            "setInterval(() => {" +
            "  count++;" +
            "  document.getElementById('counter').textContent = count;" +
            "}, 100);" +
            "</script>",
        ),
    );

    // Wait for counter to increment
    await page.waitForTimeout(350);

    // Counter should have incremented at least 3 times. The radix is passed
    // explicitly so the text is always parsed as a base-10 integer.
    const text = await page.mainFrame().locator("#counter").textContent();
    expect(parseInt(text ?? "0", 10)).toBeGreaterThanOrEqual(3);
  });

  test("waitForTimeout works with async/await syntax", async () => {
    const page = v3.context.pages()[0];

    await page.goto("data:text/html," + encodeURIComponent("<div>Test</div>"));

    // Each push happens only after the preceding wait has resolved, so the
    // recorded order proves the awaits ran sequentially.
    const results: number[] = [];

    results.push(1);
    await page.waitForTimeout(50);
    results.push(2);
    await page.waitForTimeout(50);
    results.push(3);

    expect(results).toEqual([1, 2, 3]);
  });

  test("waitForTimeout allows DOM to update", async () => {
    const page = v3.context.pages()[0];

    // The page exposes window.startUpdate, which fills #delayed 200ms after
    // being called.
    await page.goto(
      "data:text/html," +
        encodeURIComponent(
          "<div id='delayed'></div>" +
            "<script>" +
            "window.startUpdate = () => {" +
            "  setTimeout(() => {" +
            "    document.getElementById('delayed').textContent = 'Loaded';" +
            "  }, 200);" +
            "};" +
            "</script>",
        ),
    );

    // Trigger the delayed update
    await page.evaluate(() => {
      (window as unknown as { startUpdate: () => void }).startUpdate();
    });

    // Wait for the timeout to allow DOM update
    await page.waitForTimeout(300);

    // Content should now be loaded
    const afterText = await page.mainFrame().locator("#delayed").textContent();
    expect(afterText).toBe("Loaded");
  });

  test("waitForTimeout with small increments", async () => {
    const page = v3.context.pages()[0];

    await page.goto("data:text/html," + encodeURIComponent("<div>Test</div>"));

    const startTime = Date.now();

    // Multiple small waits
    await page.waitForTimeout(50);
    await page.waitForTimeout(50);
    await page.waitForTimeout(50);
    await page.waitForTimeout(50);

    const elapsed = Date.now() - startTime;

    // Should have waited at least 200ms total (4 * 50ms), minus 10ms tolerance
    expect(elapsed).toBeGreaterThanOrEqual(190);
  });

  test("waitForTimeout does not block other async operations", async () => {
    const page = v3.context.pages()[0];

    // The page exposes window.updateText, which rewrites #async-test.
    await page.goto(
      "data:text/html," +
        encodeURIComponent(
          "<div id='async-test'>Initial</div>" +
            "<script>" +
            "window.updateText = () => {" +
            "  document.getElementById('async-test').textContent = 'Updated';" +
            "};" +
            "</script>",
        ),
    );

    // Start a timeout without awaiting it yet
    const timeoutPromise = page.waitForTimeout(100);

    // Execute something else while waiting
    await page.evaluate(() => {
      (window as unknown as { updateText: () => void }).updateText();
    });

    // Verify the update happened
    const text = await page.mainFrame().locator("#async-test").textContent();
    expect(text).toBe("Updated");

    // Wait for the timeout to complete
    await timeoutPromise;
  });
});


================================================
FILE: packages/core/tests/integration/xpath-for-location-deep.spec.ts
================================================
import { expect, test } from "@playwright/test";
import { V3 } from "../../lib/v3/v3.js";
import { v3DynamicTestConfig } from "./v3.dynamic.config.js";
import { resolveXpathForLocation } from "../../lib/v3/understudy/a11y/snapshot/index.js";
import { executionContexts } from "../../lib/v3/understudy/executionContextRegistry.js";
import { closeV3 } from "./testUtils.js";

// Integration test for resolveXpathForLocation: given page-level coordinates
// that fall on a link inside an iframe, the returned absoluteXPath is expected
// to run from the top document through the iframe down to that link.
test.describe("resolveNodeForLocationDeep", () => {
  let v3: V3;

  // Fresh V3 instance per test, closed again afterwards.
  test.beforeEach(async () => {
    v3 = new V3(v3DynamicTestConfig);
    await v3.init();
  });

  test.afterEach(async () => {
    await closeV3(v3);
  });

  test("click resolves inside same-process iframe and returns absolute XPath", async () => {
    const page = await v3.context.awaitActivePage();

    // Set consistent viewport size to ensure stable rendering across environments
    await page.setViewportSize(1280, 720);

    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/iframe-hn/",
      { waitUntil: "networkidle" },
    );

    // Make sure the iframe element exists before resolving its frame.
    await page.waitForSelector("section iframe", {
      state: "attached",
      timeout: 10000,
    });
    const frame = await page.frameLocator("section iframe").resolveFrame();
    // NOTE(review): presumably blocks until the frame's main-world execution
    // context is available, with 5000 as a timeout in ms — confirm against
    // executionContextRegistry.
    await executionContexts.waitForMainWorld(
      frame.session,
      frame.frameId,
      5000,
    );

    // scroll to the bottom of the page
    await page.evaluate(() => {
      window.scrollTo(0, document.body.scrollHeight);
    });

    // scroll to the bottom of the iframe
    await frame.evaluate(() => {
      window.scrollTo(0, document.body.scrollHeight);
    });

    // Wait a bit for the iframe content to settle after scrolling
    await new Promise((resolve) => setTimeout(resolve, 500));

    // Get the iframe's position in the main page
    // (null when the iframe element cannot be found).
    const iframeOffset = await page.evaluate(() => {
      const iframe = document.querySelector("section iframe");
      if (!iframe) return null;
      const rect = iframe.getBoundingClientRect();
      return {
        left: rect.left,
        top: rect.top,
      };
    });

    // Get the link's position within the iframe
    // (null when any step of the table/row/cell/link lookup fails).
    const linkOffsetInFrame = await frame.evaluate(() => {
      // Find the 88th row, 3rd column link (the one we're testing)
      const table = document.querySelector(
        "center > table > tbody > tr:nth-child(3) > td > table",
      );
      if (!table) return null;

      const row88 = table.querySelector("tbody > tr:nth-child(88)");
      if (!row88) return null;

      const cell3 = row88.querySelector("td:nth-child(3)");
      if (!cell3) return null;

      const link = cell3.querySelector("span > a");
      if (!link) return null;

      const rect = link.getBoundingClientRect();
      // Return center coordinates of the link relative to iframe
      return {
        x: rect.left + rect.width / 2,
        y: rect.top + rect.height / 2,
      };
    });

    // Combine iframe offset and link offset to get page-level coordinates
    // Fallback to hardcoded coordinates if element not found (shouldn't happen)
    // Both offsets must be non-null for the computed values to be used; if
    // either lookup returned null the test silently uses (356, 503) instead.
    const x =
      iframeOffset && linkOffsetInFrame
        ? iframeOffset.left + linkOffsetInFrame.x
        : 356;
    const y =
      iframeOffset && linkOffsetInFrame
        ? iframeOffset.top + linkOffsetInFrame.y
        : 503;

    const result = await resolveXpathForLocation(page, x, y);
    // Diagnostic output to help debug coordinate drift between environments.
    console.log("=== Coordinates used:", { x, y });
    console.log("=== Result:", result);
    const xpath = result.absoluteXPath;
    // The expected path crosses the iframe boundary (iframe[1]/html[1]/...) and
    // ends at the same tr[88]/td[3]/span/a link located above.
    expect(xpath).toBe(
      "/html[1]/body[1]/main[1]/section[3]/iframe[1]/html[1]/body[1]/center[1]/table[1]/tbody[1]/tr[3]/td[1]/table[1]/tbody[1]/tr[88]/td[3]/span[1]/a[1]",
    );
  });
});


================================================
FILE: packages/core/tests/unit/agent-captcha-hooks.test.ts
================================================
import { beforeEach, describe, expect, it, vi } from "vitest";
import type { LogLine } from "../../lib/v3/types/public/logs.js";
import { CaptchaSolver } from "../../lib/v3/agent/utils/captchaSolver.js";
import { V3AgentHandler } from "../../lib/v3/handlers/v3AgentHandler.js";

const SOLVING_STARTED = "browserbase-solving-started";
const SOLVING_FINISHED = "browserbase-solving-finished";
const SOLVING_ERRORED = "browserbase-solving-errored";

type ConsoleListener = (message: { text: () => string }) => void;

/**
 * Minimal in-memory page double for these tests.
 *
 * It keeps a set of "console" listeners that tests can trigger through
 * `emitConsole`, and returns canned values for `url`, `screenshot`, `evaluate`
 * (the current `captchaBoxes`) and `mainFrame().evaluate` (a fixed 1288x711
 * size object).
 */
class MockPage {
  private listeners = new Set<ConsoleListener>();
  public captchaBoxes: Array<{
    left: number;
    top: number;
    right: number;
    bottom: number;
  }> = [];

  /** Registers `listener`; any event name other than "console" is ignored. */
  on(event: string, listener: ConsoleListener): void {
    if (event !== "console") return;
    this.listeners.add(listener);
  }

  /** Unregisters `listener`; any event name other than "console" is ignored. */
  off(event: string, listener: ConsoleListener): void {
    if (event !== "console") return;
    this.listeners.delete(listener);
  }

  /** Delivers a console message whose `text()` returns `text` to every listener. */
  emitConsole(text: string): void {
    const message = { text: () => text };
    this.listeners.forEach((notify) => notify(message));
  }

  url(): string {
    return "https://example.com";
  }

  screenshot(): Promise<Buffer> {
    return Promise.resolve(Buffer.from("fake-image"));
  }

  /** Ignores any arguments and resolves with the current `captchaBoxes`. */
  evaluate<T>(): Promise<T> {
    return Promise.resolve(this.captchaBoxes as T);
  }

  mainFrame(): { evaluate: () => Promise<{ w: number; h: number }> } {
    const evaluate = (): Promise<{ w: number; h: number }> =>
      Promise.resolve({ w: 1288, h: 711 });
    return { evaluate };
  }
}

/**
 * Test double returned by the mocked AgentProvider's `getClient()`.
 *
 * It records what is registered on it (action handler, pre-step hook, context
 * notes) in public fields so tests can inspect or invoke them, and routes
 * `execute` through the `executeImpl` mock so individual tests can replace
 * the behavior.
 */
class FakeCuaClient {
  // Notes appended through addContextNote, in call order.
  public contextNotes: string[] = [];
  // Last hook passed to setPreStepHook; undefined until one is set.
  public preStepHook?: () => Promise<void>;
  // Last handler passed to setActionHandler; undefined until one is set.
  public actionHandler?: (action: Record<string, unknown>) => Promise<void>;
  // Default execute behavior: ignores its options and resolves with a
  // successful, completed result that contains no actions.
  public executeImpl = vi.fn(async (options: unknown) => {
    void options;
    return {
      success: true,
      message: "ok",
      actions: [],
      completed: true,
    };
  });
  // Remaining members are bare mocks; captureScreenshot resolves to null.
  public captureScreenshot = vi.fn(async () => null);
  public setViewport = vi.fn();
  public setCurrentUrl = vi.fn();
  public setScreenshotProvider = vi.fn();
  public setSafetyConfirmationHandler = vi.fn();

  /** Stores the handler so a test can call it directly. */
  setActionHandler(
    handler: (action: Record<string, unknown>) => Promise<void>,
  ): void {
    this.actionHandler = handler;
  }

  /** Stores the hook so a test can call it directly. */
  setPreStepHook(handler: () => Promise<void>): void {
    this.preStepHook = handler;
  }

  /** Appends the note to `contextNotes`. */
  addContextNote(note: string): void {
    this.contextNotes.push(note);
  }

  /** Delegates to `executeImpl` and returns whatever it resolves with. */
  async execute(options: unknown): Promise<{
    success: boolean;
    message: string;
    actions: unknown[];
    completed: boolean;
  }> {
    return this.executeImpl(options);
  }
}

// Shared client instance handed out by the mocked AgentProvider below. It is
// reassigned in the suite's beforeEach, so each test sees a fresh fake.
let fakeCuaClient: FakeCuaClient;

// Replace the real AgentProvider module with a stub whose getClient() returns
// the shared fake. getClient reads `fakeCuaClient` at call time, not when the
// mock is registered, so it picks up whichever instance is current.
// NOTE(review): vitest is documented to hoist vi.mock calls above imports; the
// V3CuaAgentHandler import placed after this call presumably relies on the
// mock being registered first — confirm.
vi.mock("../../lib/v3/agent/AgentProvider", () => ({
  AgentProvider: class {
    constructor(logger: unknown) {
      // The logger argument is accepted and deliberately unused.
      void logger;
    }

    getClient(): FakeCuaClient {
      return fakeCuaClient;
    }
  },
}));

import { V3CuaAgentHandler } from "../../lib/v3/handlers/v3CuaAgentHandler.js";

/**
 * Keeps only the messages whose role is "user" and whose content is a plain
 * string, preserving their order (and the original object references).
 */
function collectUserMessages(
  messages: Array<{ role: string; content: unknown }>,
): Array<{ role: "user"; content: string }> {
  type UserTextMessage = { role: "user"; content: string };

  const isUserTextMessage = (candidate: {
    role: string;
    content: unknown;
  }): candidate is UserTextMessage => {
    if (candidate.role !== "user") {
      return false;
    }
    return typeof candidate.content === "string";
  };

  return messages.filter(isUserTextMessage);
}

// Exercises how V3AgentHandler and V3CuaAgentHandler behave around the
// captcha-solver console signals. MockPage emits the signals; FakeCuaClient
// lets each test drive the CUA pre-step hook and action handler by hand.
describe("agent captcha hooks", () => {
  let page: MockPage;
  let logs: LogLine[];
  let logger: (line: LogLine) => void;

  // Fresh page, log sink and fake CUA client for every test.
  beforeEach(() => {
    page = new MockPage();
    logs = [];
    logger = (line) => {
      logs.push(line);
    };
    fakeCuaClient = new FakeCuaClient();
  });

  it("blocks regular agent prepareStep until the solver finishes and injects one solved message", async () => {
    const handler = new V3AgentHandler(
      {
        isCaptchaAutoSolveEnabled: true,
      } as never,
      logger,
      {} as never,
    );
    const solver = new CaptchaSolver();
    solver.init(async () => page as never);

    const userCallback = vi.fn(async (options) => options);
    // createPrepareStep is reached through a cast (presumably it is not part
    // of the handler's public surface — confirm against V3AgentHandler).
    const prepareStep = (
      handler as unknown as {
        createPrepareStep: (
          callback?: (options: Record<string, unknown>) => Promise<unknown>,
          captchaSolver?: CaptchaSolver,
        ) => (options: Record<string, unknown>) => Promise<unknown>;
      }
    ).createPrepareStep(userCallback, solver);

    const options = {
      messages: [{ role: "user", content: "start" }],
    };

    // First step runs before any solve has started, then the solve begins.
    await prepareStep(options);
    page.emitConsole(SOLVING_STARTED);

    // The second step must not reach the user callback while solving.
    const secondCall = prepareStep(options);
    await Promise.resolve();
    expect(userCallback).toHaveBeenCalledTimes(1);

    page.emitConsole(SOLVING_FINISHED);
    await secondCall;

    expect(userCallback).toHaveBeenCalledTimes(2);
    // Exactly one "solved" notice should have been added to the messages.
    expect(
      collectUserMessages(
        options.messages as Array<{ role: string; content: unknown }>,
      ).filter((message) =>
        message.content.includes("automatically detected and solved"),
      ),
    ).toHaveLength(1);
  });

  it("injects one error message when the regular agent solver errors", async () => {
    const handler = new V3AgentHandler(
      {
        isCaptchaAutoSolveEnabled: true,
      } as never,
      logger,
      {} as never,
    );
    const solver = new CaptchaSolver();
    solver.init(async () => page as never);

    // No user callback this time; only the captcha handling is under test.
    const prepareStep = (
      handler as unknown as {
        createPrepareStep: (
          callback?: (options: Record<string, unknown>) => Promise<unknown>,
          captchaSolver?: CaptchaSolver,
        ) => (options: Record<string, unknown>) => Promise<unknown>;
      }
    ).createPrepareStep(undefined, solver);

    const options = {
      messages: [{ role: "user", content: "start" }],
    };

    await prepareStep(options);
    page.emitConsole(SOLVING_STARTED);

    // The solve ends with an error while the second step is pending.
    const pending = prepareStep(options);
    page.emitConsole(SOLVING_ERRORED);
    await pending;

    expect(
      collectUserMessages(
        options.messages as Array<{ role: string; content: unknown }>,
      ).filter((message) =>
        message.content.includes("automatic captcha solver failed"),
      ),
    ).toHaveLength(1);
  });

  it("pauses the CUA loop at prepareStep while Browserbase solves a captcha", async () => {
    let secondPrepareStarted = false;

    // Scripted client run: one pre-step hook call, then a solve starts, then
    // a second pre-step hook call that is expected to stay pending.
    fakeCuaClient.executeImpl = vi.fn(async () => {
      await fakeCuaClient.preStepHook?.();
      page.emitConsole(SOLVING_STARTED);

      const blockedPrepare = fakeCuaClient.preStepHook?.() ?? Promise.resolve();
      secondPrepareStarted = true;
      await blockedPrepare;

      return {
        success: true,
        message: "ok",
        actions: [],
        completed: true,
      };
    });

    // Partial V3 stand-in supplying only the members listed here.
    const handler = new V3CuaAgentHandler(
      {
        context: {
          awaitActivePage: async () => page,
        },
        bus: { emit: vi.fn() },
        isCaptchaAutoSolveEnabled: true,
        isAdvancedStealth: false,
        configuredViewport: { width: 1288, height: 711 },
        isAgentReplayActive: () => false,
        updateMetrics: vi.fn(),
      } as never,
      logger,
      {
        modelName: "anthropic/claude-haiku-4-5-20251001",
        clientOptions: { waitBetweenActions: 1 },
      } as never,
    );

    // Not awaited yet: the run should stall until SOLVING_FINISHED is emitted.
    const execution = handler.execute({
      instruction: "Describe the page briefly.",
      highlightCursor: false,
    });

    await vi.waitFor(() => {
      expect(secondPrepareStarted).toBe(true);
      expect(
        logs.some((line) =>
          line.message.includes("waiting for Browserbase to solve"),
        ),
      ).toBe(true);
    });

    // Still solving, so no "solved" log line may exist yet.
    expect(logs.some((line) => line.message.includes("Captcha solved"))).toBe(
      false,
    );

    page.emitConsole(SOLVING_FINISHED);
    await execution;

    expect(fakeCuaClient.contextNotes).toEqual([
      expect.stringContaining("automatically detected and solved"),
    ]);
    expect(logs.some((line) => line.message.includes("Captcha solved"))).toBe(
      true,
    );
  });

  it("pauses CUA actions until the captcha solver finishes", async () => {
    let actionStarted = false;

    // Scripted client run: pre-step hook, solve starts, then an action is
    // dispatched through the registered action handler.
    fakeCuaClient.executeImpl = vi.fn(async () => {
      await fakeCuaClient.preStepHook?.();
      page.emitConsole(SOLVING_STARTED);

      const pendingAction =
        fakeCuaClient.actionHandler?.({ type: "screenshot" }) ??
        Promise.resolve();
      actionStarted = true;
      await pendingAction;

      return {
        success: true,
        message: "ok",
        actions: [],
        completed: true,
      };
    });

    const handler = new V3CuaAgentHandler(
      {
        context: {
          awaitActivePage: async () => page,
        },
        bus: { emit: vi.fn() },
        isCaptchaAutoSolveEnabled: true,
        isAdvancedStealth: false,
        configuredViewport: { width: 1288, height: 711 },
        isAgentReplayActive: () => false,
        updateMetrics: vi.fn(),
      } as never,
      logger,
      {
        modelName: "anthropic/claude-haiku-4-5-20251001",
        clientOptions: { waitBetweenActions: 1 },
      } as never,
    );
    // Stub out the real action execution and screenshot capture so the test
    // only observes whether and when executeAction is invoked.
    const executeActionSpy = vi
      .spyOn(
        handler as unknown as {
          executeAction: (action: Record<string, unknown>) => Promise<unknown>;
        },
        "executeAction",
      )
      .mockResolvedValue({ success: true });
    vi.spyOn(handler, "captureAndSendScreenshot").mockResolvedValue(null);

    const execution = handler.execute({
      instruction: "Describe the page briefly.",
      highlightCursor: false,
    });

    await vi.waitFor(() => {
      expect(actionStarted).toBe(true);
    });

    // The action was dispatched but must not execute while solving.
    expect(executeActionSpy).not.toHaveBeenCalled();
    page.emitConsole(SOLVING_FINISHED);
    await execution;

    expect(executeActionSpy).toHaveBeenCalledTimes(1);
    expect(fakeCuaClient.contextNotes).toEqual([
      expect.stringContaining("automatically detected and solved"),
    ]);
    expect(logs.some((line) => line.message.includes("Captcha solved"))).toBe(
      true,
    );
  });

  it("skips post-solve clicks on the captcha widget and injects another note", async () => {
    // Value MockPage.evaluate() resolves to; the click below at (63, 436)
    // falls inside this rectangle.
    page.captchaBoxes = [{ left: 0, top: 400, right: 140, bottom: 470 }];

    // Scripted client run: a full solve cycle, followed by a click.
    fakeCuaClient.executeImpl = vi.fn(async () => {
      await fakeCuaClient.preStepHook?.();
      page.emitConsole(SOLVING_STARTED);

      const blockedPrepare = fakeCuaClient.preStepHook?.() ?? Promise.resolve();
      page.emitConsole(SOLVING_FINISHED);
      await blockedPrepare;

      await fakeCuaClient.actionHandler?.({
        type: "click",
        button: "left",
        x: 63,
        y: 436,
      });

      return {
        success: true,
        message: "ok",
        actions: [],
        completed: true,
      };
    });

    const handler = new V3CuaAgentHandler(
      {
        context: {
          awaitActivePage: async () => page,
        },
        bus: { emit: vi.fn() },
        isCaptchaAutoSolveEnabled: true,
        isAdvancedStealth: false,
        configuredViewport: { width: 1288, height: 711 },
        isAgentReplayActive: () => false,
        updateMetrics: vi.fn(),
      } as never,
      logger,
      {
        modelName: "anthropic/claude-haiku-4-5-20251001",
        clientOptions: { waitBetweenActions: 1 },
      } as never,
    );
    const executeActionSpy = vi
      .spyOn(
        handler as unknown as {
          executeAction: (action: Record<string, unknown>) => Promise<unknown>;
        },
        "executeAction",
      )
      .mockResolvedValue({ success: true });
    vi.spyOn(handler, "captureAndSendScreenshot").mockResolvedValue(null);

    await handler.execute({
      instruction: "Describe the page briefly.",
      highlightCursor: false,
    });

    // The click must have been dropped, and a second note restating the
    // original task must follow the "solved" note.
    expect(executeActionSpy).not.toHaveBeenCalled();
    expect(fakeCuaClient.contextNotes).toEqual([
      expect.stringContaining("automatically detected and solved"),
      expect.stringContaining("Original task: Describe the page briefly."),
    ]);
    expect(
      logs.some((line) =>
        line.message.includes("Skipped click on solved captcha widget"),
      ),
    ).toBe(true);
  });
});


================================================
FILE: packages/core/tests/unit/agent-execution-model.test.ts
================================================
import { describe, expect, it, vi } from "vitest";
import { actTool } from "../../lib/v3/agent/tools/act.js";
import { extractTool } from "../../lib/v3/agent/tools/extract.js";
import { fillFormTool } from "../../lib/v3/agent/tools/fillform.js";
import type { V3 } from "../../lib/v3/v3.js";

/**
 * Builds a minimal V3 double whose act(), extract() and observe() mocks log
 * the `model` option they were called with into a shared `calls` array, so
 * tests can check what each agent tool forwarded.
 */
function createMockV3() {
  const calls: { method: string; model: unknown }[] = [];

  // Appends one entry describing which method ran and with which model.
  const record = (method: string, options?: { model?: unknown }): void => {
    calls.push({ method, model: options?.model });
  };

  const act = vi.fn(
    async (_instruction: unknown, options?: { model?: unknown }) => {
      record("act", options);
      return {
        success: true,
        message: "ok",
        actionDescription: "clicked",
        actions: [],
      };
    },
  );

  const extract = vi.fn(
    async (
      _instruction: unknown,
      _schema: unknown,
      options?: { model?: unknown },
    ) => {
      record("extract", options);
      return { extraction: "data" };
    },
  );

  const observe = vi.fn(
    async (_instruction: unknown, options?: { model?: unknown }) => {
      record("observe", options);
      return [];
    },
  );

  const mock = {
    logger: vi.fn(),
    recordAgentReplayStep: vi.fn(),
    act,
    extract,
    observe,
    calls,
  };

  return mock as unknown as V3 & { calls: typeof calls };
}

// Each tool is built with an execution model and run once against the mock
// V3; the recorded call must carry exactly the model the tool was given.
describe("agent tools pass full executionModel config to v3 methods", () => {
  const modelConfig = {
    modelName: "openai/gpt-4o-mini",
    apiKey: "sk-test-key",
    baseURL: "https://custom.api",
  };

  // Second argument for tool.execute(); only the tool-call id differs.
  const callOptions = (toolCallId: string) => ({
    toolCallId,
    messages: [],
    abortSignal: new AbortController().signal,
  });

  it("actTool passes AgentModelConfig object to v3.act()", async () => {
    const v3 = createMockV3();
    const tool = actTool(v3, modelConfig);

    await tool.execute!({ action: "click the button" }, callOptions("t1"));

    expect(v3.calls).toHaveLength(1);
    const [onlyCall] = v3.calls;
    expect(onlyCall.method).toBe("act");
    expect(onlyCall.model).toBe(modelConfig);
  });

  it("extractTool passes AgentModelConfig object to v3.extract()", async () => {
    const v3 = createMockV3();
    const tool = extractTool(v3, modelConfig);

    await tool.execute!(
      { instruction: "get the title", schema: undefined },
      callOptions("t2"),
    );

    expect(v3.calls).toHaveLength(1);
    const [onlyCall] = v3.calls;
    expect(onlyCall.method).toBe("extract");
    expect(onlyCall.model).toBe(modelConfig);
  });

  it("fillFormTool passes AgentModelConfig object to v3.observe()", async () => {
    const v3 = createMockV3();
    const tool = fillFormTool(v3, modelConfig);

    await tool.execute!(
      { fields: [{ action: "type hello into name" }] },
      callOptions("t3"),
    );

    expect(v3.calls).toHaveLength(1);
    const [onlyCall] = v3.calls;
    expect(onlyCall.method).toBe("observe");
    expect(onlyCall.model).toBe(modelConfig);
  });

  it("actTool passes undefined when no executionModel is set", async () => {
    const v3 = createMockV3();
    const tool = actTool(v3, undefined);

    await tool.execute!({ action: "click the button" }, callOptions("t4"));

    expect(v3.calls).toHaveLength(1);
    const [onlyCall] = v3.calls;
    expect(onlyCall.model).toBeUndefined();
  });

  it("actTool passes plain string executionModel to v3.act()", async () => {
    const v3 = createMockV3();
    const tool = actTool(v3, "openai/gpt-4o-mini");

    await tool.execute!({ action: "click the button" }, callOptions("t5"));

    expect(v3.calls).toHaveLength(1);
    const [onlyCall] = v3.calls;
    expect(onlyCall.model).toBe("openai/gpt-4o-mini");
  });
});

describe("executionModel fallback logic", () => {
  type ModelChoice = string | { modelName: string };

  // Local copy of the resolution rule this suite pins down:
  //   options?.executionModel ?? options?.model
  // NOTE(review): the original comment attributes this to
  // V3.prepareAgentExecution in v3.ts; this test does not import that code,
  // so it only guards the rule as written here.
  const resolveExecutionModel = (options?: {
    executionModel?: ModelChoice;
    model?: ModelChoice;
  }) => {
    const explicit = options?.executionModel;
    return explicit ?? options?.model;
  };

  it("prefers explicit executionModel over model", () => {
    const resolved = resolveExecutionModel({
      executionModel: "openai/gpt-4o-mini",
      model: "anthropic/claude-sonnet-4-20250514",
    });

    expect(resolved).toBe("openai/gpt-4o-mini");
  });

  it("falls back to model when executionModel is not set", () => {
    const modelConfig = {
      modelName: "anthropic/claude-sonnet-4-20250514",
      apiKey: "sk-test",
    };

    expect(resolveExecutionModel({ model: modelConfig })).toBe(modelConfig);
  });

  it("returns undefined when neither is set", () => {
    for (const input of [{}, undefined]) {
      expect(resolveExecutionModel(input)).toBeUndefined();
    }
  });
});


================================================
FILE: packages/core/tests/unit/api-multiregion.test.ts
================================================
import { describe, expect, it } from "vitest";
import { getApiUrlForRegion, REGION_API_URLS } from "../../lib/v3/api";

describe("Multi-region API URL mapping", () => {
  type Region = keyof typeof REGION_API_URLS;

  // One row per region under test. `label` only feeds the titles of the
  // REGION_API_URLS tests; `baseUrl` is the expected value without "/v1".
  const regionCases: ReadonlyArray<{
    label: string;
    region: Region;
    baseUrl: string;
  }> = [
    {
      label: "us-west-2 (default)",
      region: "us-west-2",
      baseUrl: "https://api.stagehand.browserbase.com",
    },
    {
      label: "us-east-1",
      region: "us-east-1",
      baseUrl: "https://api.use1.stagehand.browserbase.com",
    },
    {
      label: "eu-central-1",
      region: "eu-central-1",
      baseUrl: "https://api.euc1.stagehand.browserbase.com",
    },
    {
      label: "ap-southeast-1",
      region: "ap-southeast-1",
      baseUrl: "https://api.apse1.stagehand.browserbase.com",
    },
  ];

  // URL expected whenever the region is missing or not recognised.
  const defaultApiUrl = "https://api.stagehand.browserbase.com/v1";

  describe("REGION_API_URLS constant", () => {
    for (const { label, region, baseUrl } of regionCases) {
      it(`should have the correct URL for ${label}`, () => {
        expect(REGION_API_URLS[region]).toBe(baseUrl);
      });
    }
  });

  describe("getApiUrlForRegion", () => {
    for (const { region, baseUrl } of regionCases) {
      it(`should return the correct URL for ${region}`, () => {
        expect(getApiUrlForRegion(region)).toBe(`${baseUrl}/v1`);
      });
    }

    it("should return the default us-west-2 URL when no region is specified", () => {
      expect(getApiUrlForRegion(undefined)).toBe(defaultApiUrl);
    });

    it("should return the default us-west-2 URL for unknown regions", () => {
      // @ts-expect-error - testing invalid region
      expect(getApiUrlForRegion("invalid-region")).toBe(defaultApiUrl);
    });
  });

  describe("URL /v1 suffix handling", () => {
    it("getApiUrlForRegion always includes /v1 suffix for consistency", () => {
      // Documents the contract that every returned API base URL ends in /v1.
      const resolved = getApiUrlForRegion("us-west-2");
      expect(resolved.endsWith("/v1")).toBe(true);
    });

    it("all regional URLs should be base URLs without /v1 in REGION_API_URLS", () => {
      // The map holds bare base URLs; getApiUrlForRegion appends the suffix.
      const regions = Object.keys(REGION_API_URLS) as Region[];
      for (const region of regions) {
        const baseUrl = REGION_API_URLS[region];
        expect(baseUrl.endsWith("/v1")).toBe(false);
        expect(getApiUrlForRegion(region)).toBe(`${baseUrl}/v1`);
      }
    });
  });
});


================================================
FILE: packages/core/tests/unit/browserbase-session-accessors.test.ts
================================================
import { describe, expect, it, vi, beforeEach, afterEach } from "vitest";
import { V3 } from "../../lib/v3/v3.js";

// Session id returned by the mocked createBrowserbaseSession().
const MOCK_SESSION_ID = "session-123";
// Session URL the tests expect V3 to expose for that session id.
const MOCK_SESSION_URL = `https://www.browserbase.com/sessions/${MOCK_SESSION_ID}`;
// Debugger URL returned by the mocked bb.sessions.debug().
const MOCK_DEBUG_URL = `https://debug.browserbase.com/${MOCK_SESSION_ID}`;

// Replace the real V3Context module with an in-memory double so init() needs
// no browser: create() resolves immediately, there are no pages, close() is a
// no-op, and the connection exposes only mocked onTransportClosed /
// offTransportClosed / send.
vi.mock("../../lib/v3/understudy/context", () => {
  class MockConnection {
    onTransportClosed = vi.fn();
    offTransportClosed = vi.fn();
    send = vi.fn(async () => {});
  }

  class MockV3Context {
    static async create(): Promise<MockV3Context> {
      return new MockV3Context();
    }

    conn = new MockConnection();

    pages(): never[] {
      return [];
    }

    async close(): Promise<void> {
      // noop
    }
  }

  return { V3Context: MockV3Context };
});

// Stub session creation: resolves to a fake websocket URL, the mock session
// id, and a `bb` client whose sessions.debug() resolves to the mock debugger
// URL. The MOCK_* constants are only read when the mocks are invoked.
vi.mock("../../lib/v3/launch/browserbase", () => ({
  createBrowserbaseSession: vi.fn(async () => ({
    ws: "wss://mock-browserbase",
    sessionId: MOCK_SESSION_ID,
    bb: {
      sessions: {
        debug: vi.fn(async () => ({ debuggerUrl: MOCK_DEBUG_URL })),
      },
    },
  })),
}));

// Stub the local Chrome launcher: resolves to a fake CDP websocket URL and a
// chrome handle whose kill() is a no-op mock.
vi.mock("../../lib/v3/launch/local", () => ({
  launchLocalChrome: vi.fn(async () => ({
    ws: "ws://local-cdp",
    chrome: { kill: vi.fn(async () => {}) },
  })),
}));

// Verifies the Browserbase-related accessors on V3 against the mocked
// session launcher and context defined at the top of this file.
describe("browserbase accessors", () => {
  beforeEach(() => {
    // vi.stubEnv remembers the previous values, so a developer's real
    // BROWSERBASE_* variables are restored by unstubAllEnvs() instead of
    // being deleted for the rest of the run.
    vi.stubEnv("BROWSERBASE_API_KEY", "fake-key");
    vi.stubEnv("BROWSERBASE_PROJECT_ID", "fake-project");
  });

  afterEach(() => {
    vi.unstubAllEnvs();
    vi.clearAllMocks();
  });

  it("exposes Browserbase session and debug URLs after init", async () => {
    const v3 = new V3({
      env: "BROWSERBASE",
      disableAPI: true,
      verbose: 0,
    });

    try {
      await v3.init();

      expect(v3.browserbaseSessionURL).toBe(MOCK_SESSION_URL);
      expect(v3.browserbaseDebugURL).toBe(MOCK_DEBUG_URL);
      expect(v3.isCaptchaAutoSolveEnabled).toBe(true);
    } finally {
      // Best-effort cleanup; a close failure must not mask the assertions.
      await v3.close().catch(() => {});
    }
  });

  it("clears stored URLs after close", async () => {
    const v3 = new V3({
      env: "BROWSERBASE",
      disableAPI: true,
      verbose: 0,
    });

    await v3.init();
    await v3.close();

    expect(v3.browserbaseSessionURL).toBeUndefined();
    expect(v3.browserbaseDebugURL).toBeUndefined();
  });

  it("disables captcha solving when solveCaptchas is explicitly false", async () => {
    const v3 = new V3({
      env: "BROWSERBASE",
      disableAPI: true,
      verbose: 0,
      browserbaseSessionCreateParams: {
        browserSettings: {
          solveCaptchas: false,
        },
      },
    });

    try {
      await v3.init();
      expect(v3.isCaptchaAutoSolveEnabled).toBe(false);
    } finally {
      await v3.close().catch(() => {});
    }
  });
});

describe("local accessors", () => {
  it("stay empty for LOCAL environments", async () => {
    // Attach to an existing CDP endpoint instead of launching a browser.
    const localOptions: ConstructorParameters<typeof V3>[0] = {
      env: "LOCAL",
      disableAPI: true,
      verbose: 0,
      localBrowserLaunchOptions: {
        cdpUrl: "ws://local-existing-session",
      },
    };
    const v3 = new V3(localOptions);

    try {
      await v3.init();

      // Neither Browserbase URL may be populated for a local session.
      const sessionUrl = v3.browserbaseSessionURL;
      const debugUrl = v3.browserbaseDebugURL;
      expect(sessionUrl).toBeUndefined();
      expect(debugUrl).toBeUndefined();
    } finally {
      // Best-effort cleanup; ignore close failures.
      await v3.close().catch(() => {});
    }
  });
});


================================================
FILE: packages/core/tests/unit/cache-llm-resolution.test.ts
================================================
import { describe, expect, it, vi } from "vitest";
import { ActCache } from "../../lib/v3/cache/ActCache.js";
import { AgentCache } from "../../lib/v3/cache/AgentCache.js";
import type { CacheStorage } from "../../lib/v3/cache/CacheStorage.js";
import type { ActHandler } from "../../lib/v3/handlers/actHandler.js";
import type { LLMClient } from "../../lib/v3/llm/LLMClient.js";
import type { Page } from "../../lib/v3/understudy/page.js";
import type { V3Context } from "../../lib/v3/understudy/context.js";
import type {
  ActCacheContext,
  CachedActEntry,
  CachedAgentEntry,
  AgentCacheContext,
  AgentReplayActStep,
} from "../../lib/v3/types/private/index.js";
import type {
  Action,
  AgentResult,
  AvailableModel,
} from "../../lib/v3/types/public/index.js";

/**
 * Builds an enabled CacheStorage double: readJson() always resolves to
 * `{ value: entry }` and writeJson() resolves to an empty object.
 */
function createFakeStorage<T>(entry: T): CacheStorage {
  const readJson = vi.fn().mockResolvedValue({ value: entry });
  const writeJson = vi.fn().mockResolvedValue({});

  const storage = {
    enabled: true,
    readJson,
    writeJson,
    directory: "/tmp/cache",
  };

  return storage as unknown as CacheStorage;
}

// Checks which LLM client ActCache / AgentCache forward to
// ActHandler.takeDeterministicAction when replaying a cached entry.
// Every test builds its storage through createFakeStorage().
describe("Cache LLM client selection", () => {
  it("ActCache uses provided override client during replay", async () => {
    const action: Action = {
      selector: "xpath=/html/body/button",
      description: "click button",
      method: "click",
      arguments: [],
    };

    const entry: CachedActEntry = {
      version: 1,
      instruction: "click button",
      url: "https://example.com",
      variableKeys: [],
      actions: [action],
      actionDescription: "click button",
      message: "done",
    };

    const storage = createFakeStorage(entry);
    const handler = {
      takeDeterministicAction: vi.fn().mockResolvedValue({
        success: true,
        message: "ok",
        actionDescription: "click button",
        actions: [action],
      }),
    } as unknown as ActHandler;
    const defaultClient = { id: "default" } as unknown as LLMClient;
    const overrideClient = { id: "override" } as unknown as LLMClient;

    const cache = new ActCache({
      storage,
      logger: vi.fn(),
      getActHandler: () => handler,
      getDefaultLlmClient: () => defaultClient,
      domSettleTimeoutMs: undefined,
    });

    const context: ActCacheContext = {
      instruction: "click button",
      cacheKey: "abc",
      pageUrl: "https://example.com",
      variableKeys: [],
      variables: undefined,
    };

    const result = await cache.tryReplay(
      context,
      {} as Page,
      undefined,
      overrideClient,
    );

    expect(result?.success).toBe(true);
    expect(handler.takeDeterministicAction).toHaveBeenCalledTimes(1);
    // The assertion inspects the fourth positional argument of the call.
    const call = vi.mocked(handler.takeDeterministicAction).mock.calls[0];
    expect(call?.[3]).toBe(overrideClient);
  });

  it("AgentCache uses provided override client during replay", async () => {
    const action: Action = {
      selector: "xpath=/html/body/input",
      description: "type email",
      method: "type",
      arguments: ["test@example.com"],
    };

    const agentStep: AgentReplayActStep = {
      type: "act",
      instruction: "type email",
      actions: [action],
    };

    const entry: CachedAgentEntry = {
      version: 1,
      instruction: "fill form",
      startUrl: "https://example.com",
      options: {},
      configSignature: "sig",
      steps: [agentStep],
      result: { success: true, actions: [] } as AgentResult,
      timestamp: new Date().toISOString(),
    };

    const storage = createFakeStorage(entry);

    const handler = {
      takeDeterministicAction: vi.fn().mockResolvedValue({
        success: true,
        message: "ok",
        actionDescription: "type email",
        actions: [action],
      }),
    } as unknown as ActHandler;

    const fakePage = {} as Page;
    const ctx = {
      awaitActivePage: vi.fn().mockResolvedValue(fakePage),
    } as unknown as V3Context;

    const defaultClient = { id: "default-agent" } as unknown as LLMClient;
    const overrideClient = { id: "override-agent" } as unknown as LLMClient;

    const cache = new AgentCache({
      storage,
      logger: vi.fn(),
      getActHandler: () => handler,
      getContext: () => ctx,
      getDefaultLlmClient: () => defaultClient,
      getBaseModelName: () => "openai/gpt-4.1-mini" as AvailableModel,
      getSystemPrompt: () => undefined,
      domSettleTimeoutMs: undefined,
      act: vi.fn(),
    });

    const context: AgentCacheContext = {
      instruction: "fill form",
      startUrl: "https://example.com",
      options: {},
      configSignature: "sig",
      cacheKey: "agent-key",
      variableKeys: [],
    };

    const result = await cache.tryReplay(context, overrideClient);

    expect(result?.success).toBe(true);
    expect(handler.takeDeterministicAction).toHaveBeenCalledTimes(1);
    const call = vi.mocked(handler.takeDeterministicAction).mock.calls[0];
    expect(call?.[3]).toBe(overrideClient);
  });

  it("AgentCache replays non-act steps without requiring an override client", async () => {
    // A single "goto" step: replay should navigate and never reach the
    // act handler.
    const gotoEntry: CachedAgentEntry = {
      version: 1,
      instruction: "navigate home",
      startUrl: "https://example.com/source",
      options: {},
      configSignature: "sig",
      steps: [
        {
          type: "goto",
          url: "https://example.com/target",
          waitUntil: "load",
        },
      ],
      result: { success: true, actions: [] } as AgentResult,
      timestamp: new Date().toISOString(),
    };

    const storage = createFakeStorage(gotoEntry);

    const handler = {
      takeDeterministicAction: vi.fn(),
    } as unknown as ActHandler;

    const fakePage = { goto: vi.fn() } as unknown as Page;
    const ctx = {
      awaitActivePage: vi.fn().mockResolvedValue(fakePage),
    } as unknown as V3Context;

    const cache = new AgentCache({
      storage,
      logger: vi.fn(),
      getActHandler: () => handler,
      getContext: () => ctx,
      getDefaultLlmClient: () => ({ id: "default" }) as unknown as LLMClient,
      getBaseModelName: () => "openai/gpt-4.1-mini" as AvailableModel,
      getSystemPrompt: () => undefined,
      domSettleTimeoutMs: undefined,
      act: vi.fn(),
    });

    const context: AgentCacheContext = {
      instruction: "navigate home",
      startUrl: "https://example.com/source",
      options: {},
      configSignature: "sig",
      cacheKey: "agent-goto",
      variableKeys: [],
    };

    // No override client is passed here.
    const result = await cache.tryReplay(context);

    expect(result?.success).toBe(true);
    expect(handler.takeDeterministicAction).not.toHaveBeenCalled();
    expect(fakePage.goto).toHaveBeenCalledWith("https://example.com/target", {
      waitUntil: "load",
    });
  });
});


================================================
FILE: packages/core/tests/unit/captcha-solver.test.ts
================================================
import { describe, expect, it } from "vitest";
import { CaptchaSolver } from "../../lib/v3/agent/utils/captchaSolver.js";

// Console message texts the tests emit through MockPage.emitConsole() to
// signal that a captcha solve started, finished, or errored.
const SOLVING_STARTED = "browserbase-solving-started";
const SOLVING_FINISHED = "browserbase-solving-finished";
const SOLVING_ERRORED = "browserbase-solving-errored";

/** Console listener as this mock calls it: the message only exposes `text()`. */
type ConsoleListener = (message: { text: () => string }) => void;

/**
 * Minimal page double that supports only the "console" event. It counts
 * subscribe and unsubscribe calls so tests can assert on attach/detach
 * behaviour; any other event name is ignored entirely.
 */
class MockPage {
  private listeners = new Set<ConsoleListener>();
  public onCalls = 0;
  public offCalls = 0;

  /** Registers a console listener and bumps `onCalls`. */
  on(event: string, listener: ConsoleListener): void {
    if (event === "console") {
      this.onCalls += 1;
      this.listeners.add(listener);
    }
  }

  /** Removes a console listener and bumps `offCalls`. */
  off(event: string, listener: ConsoleListener): void {
    if (event === "console") {
      this.offCalls += 1;
      this.listeners.delete(listener);
    }
  }

  /** Delivers a console message carrying `text` to every listener. */
  emitConsole(text: string): void {
    const consoleMessage = { text: () => text };
    this.listeners.forEach((notify) => {
      notify(consoleMessage);
    });
  }

  /** Number of distinct listeners currently registered. */
  listenerCount(): number {
    const { size } = this.listeners;
    return size;
  }
}

// Behavioural tests for CaptchaSolver driven purely by console messages
// emitted from MockPage; no browser is involved.
describe("CaptchaSolver", () => {
  it("resolves all concurrent waiters when a solve finishes", async () => {
    const page = new MockPage();
    const solver = new CaptchaSolver();
    solver.init(async () => page as never);

    await solver.ensureAttached();
    page.emitConsole(SOLVING_STARTED);

    // Two callers wait on the same in-progress solve.
    const firstWait = solver.waitIfSolving();
    const secondWait = solver.waitIfSolving();
    // Yield one macrotask so both waiters can get going.
    await new Promise((resolve) => setTimeout(resolve, 0));

    // Peek at the solver's internal `waitPromise` field through a cast.
    const sharedWaitPromise = (
      solver as unknown as { waitPromise: Promise<void> | null }
    ).waitPromise;

    expect(sharedWaitPromise).not.toBeNull();
    // NOTE(review): this reads the same field again with nothing in between,
    // so it looks like it can only fail if the field is a changing getter —
    // confirm whether a stronger "both waiters share one promise" check was
    // intended.
    expect(
      (solver as unknown as { waitPromise: Promise<void> | null }).waitPromise,
    ).toBe(sharedWaitPromise);

    let firstResolved = false;
    let secondResolved = false;
    void firstWait.then(() => {
      firstResolved = true;
    });
    void secondWait.then(() => {
      secondResolved = true;
    });

    // Neither waiter may settle before the solve finishes.
    await Promise.resolve();
    expect(firstResolved).toBe(false);
    expect(secondResolved).toBe(false);

    page.emitConsole(SOLVING_FINISHED);
    await Promise.all([firstWait, secondWait]);

    expect(firstResolved).toBe(true);
    expect(secondResolved).toBe(true);
    // The result is reported once; a second consume sees a cleared state.
    expect(solver.consumeSolveResult()).toEqual({
      solved: true,
      errored: false,
    });
    expect(solver.consumeSolveResult()).toEqual({
      solved: false,
      errored: false,
    });
  });

  it("re-attaches to a new page and settles stale waiters when the active page changes", async () => {
    const firstPage = new MockPage();
    const secondPage = new MockPage();
    // The page provider passed to init() returns whatever this points at.
    let activePage = firstPage;

    const solver = new CaptchaSolver();
    solver.init(async () => activePage as never);

    await solver.ensureAttached();
    firstPage.emitConsole(SOLVING_STARTED);

    const pendingWait = solver.waitIfSolving();
    let settled = false;
    void pendingWait.then(() => {
      settled = true;
    });

    // Swap the active page mid-solve; the next wait call should notice.
    activePage = secondPage;
    await solver.waitIfSolving();
    await pendingWait;

    expect(settled).toBe(true);
    // Listener moved from the first page to the second.
    expect(firstPage.offCalls).toBe(1);
    expect(firstPage.listenerCount()).toBe(0);
    expect(secondPage.onCalls).toBe(1);
    expect(secondPage.listenerCount()).toBe(1);
    expect(solver.isSolving()).toBe(false);
  });

  it("surfaces solver errors exactly once per consume", async () => {
    const page = new MockPage();
    const solver = new CaptchaSolver();
    solver.init(async () => page as never);

    await solver.ensureAttached();
    page.emitConsole(SOLVING_STARTED);

    const wait = solver.waitIfSolving();
    page.emitConsole(SOLVING_ERRORED);
    await wait;

    // First consume reports the error, the second sees a cleared state.
    expect(solver.consumeSolveResult()).toEqual({
      solved: false,
      errored: true,
    });
    expect(solver.consumeSolveResult()).toEqual({
      solved: false,
      errored: false,
    });
  });

  it("disposes cleanly while a solve is in progress", async () => {
    const page = new MockPage();
    const solver = new CaptchaSolver();
    solver.init(async () => page as never);

    await solver.ensureAttached();
    page.emitConsole(SOLVING_STARTED);

    const wait = solver.waitIfSolving();
    // Yield one macrotask so the waiter is established before dispose().
    await new Promise((resolve) => setTimeout(resolve, 0));
    let settled = false;
    void wait.then(() => {
      settled = true;
    });

    solver.dispose();
    await wait;

    // Dispose releases the waiter, detaches the listener, and leaves no
    // solved/errored result behind.
    expect(settled).toBe(true);
    expect(solver.isSolving()).toBe(false);
    expect(page.listenerCount()).toBe(0);
    expect(solver.consumeSolveResult()).toEqual({
      solved: false,
      errored: false,
    });
  });

  it("marks errored when detached mid-solve due to page change", async () => {
    const firstPage = new MockPage();
    const secondPage = new MockPage();
    let activePage = firstPage;

    const solver = new CaptchaSolver();
    solver.init(async () => activePage as never);

    await solver.ensureAttached();
    firstPage.emitConsole(SOLVING_STARTED);

    const wait = solver.waitIfSolving();

    // Switch to a new page while the solve is in progress
    activePage = secondPage;
    await solver.waitIfSolving();
    await wait;

    // The interrupted solve should be reported as errored
    expect(solver.consumeSolveResult()).toEqual({
      solved: false,
      errored: true,
    });
  });
});


================================================
FILE: packages/core/tests/unit/cdp-connection-close.test.ts
================================================
import { describe, it, expect, afterEach } from "vitest";
import { WebSocketServer, type WebSocket as ServerWebSocket } from "ws";
import { CdpConnection } from "../../lib/v3/understudy/cdp.js";

/**
 * Settles with whatever `promise` settles with, unless `ms` milliseconds pass
 * first, in which case it resolves to the literal string "timeout".
 * The internal timer is always cleared once the race is decided.
 */
// TODO: dedupe this with the implementation in testUtils.ts after we unify the test directories
function raceTimeout<T>(
  promise: Promise<T>,
  ms: number,
): Promise<T | "timeout"> {
  let handle: ReturnType<typeof setTimeout>;
  const deadline = new Promise<"timeout">((resolve) => {
    const expire = (): void => resolve("timeout");
    handle = setTimeout(expire, ms);
  });
  // The executor above runs synchronously, so `handle` is set before this runs.
  const stopTimer = (): void => {
    clearTimeout(handle);
  };
  return Promise.race([promise, deadline]).finally(stopTimer);
}

/**
 * Creates a local WebSocket server and connects a CdpConnection to it.
 * Returns the connection plus a handle to the server-side socket.
 *
 * The caller owns the returned `wss` and is responsible for closing it.
 * If setup fails (for example the connect call rejects), the server is
 * closed here before the error is rethrown, because the caller never
 * receives a handle it could use to clean up.
 */
async function createPair(): Promise<{
  conn: CdpConnection;
  serverSocket: ServerWebSocket;
  wss: WebSocketServer;
}> {
  // Port 0 requests an ephemeral port; the real one is read back via address().
  const wss = new WebSocketServer({ port: 0 });
  try {
    const port = (wss.address() as { port: number }).port;

    // Subscribe before connecting so the server-side socket is not missed.
    const serverSocketPromise = new Promise<ServerWebSocket>((resolve) => {
      wss.once("connection", resolve);
    });

    const conn = await CdpConnection.connect(`ws://localhost:${port}`);
    const serverSocket = await serverSocketPromise;

    return { conn, serverSocket, wss };
  } catch (error) {
    // Fire-and-forget: do not wait on the close callback while propagating the failure.
    wss.close();
    throw error;
  }
}

// Regression tests for CdpConnection when the remote end closes the WebSocket:
// close() must still resolve, and inflight send() calls must reject.
describe("CdpConnection", () => {
  // Server created by the current test; closed and reset in afterEach.
  let wss: WebSocketServer | null = null;

  afterEach(async () => {
    if (wss) {
      // Wait for the close callback so the next test starts after shutdown.
      await new Promise<void>((resolve) => wss!.close(() => resolve()));
      wss = null;
    }
  });

  describe("close() when WebSocket is already closed", () => {
    it("resolves instead of hanging forever", async () => {
      const pair = await createPair();
      wss = pair.wss;

      // Wait for the client-side close event to be fully processed.
      const transportClosed = new Promise<void>((resolve) => {
        pair.conn.onTransportClosed(() => resolve());
      });

      // Simulate the hosted API terminating the Browserbase session:
      // the server closes the WebSocket from its side.
      pair.serverSocket.close();
      await transportClosed;

      // conn.close() on an already-CLOSED WebSocket must resolve.
      // Without the fix it awaits a "close" event that already fired → hangs.
      // The 3s race turns a hang into a failed assertion instead of a stuck test.
      const result = await raceTimeout(
        pair.conn.close().then(() => "resolved"),
        3_000,
      );

      expect(result).toBe("resolved");
    });
  });

  describe("inflight CDP calls on unexpected close", () => {
    it("rejects pending calls instead of hanging forever", async () => {
      const pair = await createPair();
      wss = pair.wss;

      // Send a CDP command; the mock server will never reply.
      const pending = pair.conn.send("Runtime.evaluate", {
        expression: "1+1",
      });

      // Server terminates the connection while the call is inflight.
      pair.serverSocket.close();

      // The pending promise must reject, not hang.
      // Both outcomes are mapped to strings so the race yields
      // "resolved", "rejected", or "timeout".
      const result = await raceTimeout(
        pending.then(() => "resolved").catch(() => "rejected"),
        3_000,
      );

      expect(result).toBe("rejected");
    });
  });
});


================================================
FILE: packages/core/tests/unit/context-extra-http-headers.test.ts
================================================
import { describe, expect, it } from "vitest";
import { V3Context } from "../../lib/v3/understudy/context.js";
import { MockCDPSession } from "./helpers/mockCDPSession.js";
import { StagehandSetExtraHTTPHeadersError } from "../../lib/v3/types/public/sdkErrors.js";

/**
 * Minimal structural stand-in used as `this` when invoking
 * V3Context.prototype.setExtraHTTPHeaders in these tests.
 * NOTE(review): presumably these are exactly the fields the method reads — confirm
 * against the implementation.
 */
type ContextStub = {
  // Ids of the sessions the stub exposes.
  _sessionInit: Set<string>;
  conn: {
    // Looks up a mock session by id; undefined when the id is unknown.
    getSession: (id: string) => MockCDPSession | undefined;
  };
  // Starts as null in makeContext.
  extraHttpHeaders: Record<string, string> | null;
};

/**
 * Builds a ContextStub over the given mock sessions: every session id is
 * recorded in `_sessionInit` and resolvable through `conn.getSession`.
 */
const makeContext = (sessions: MockCDPSession[]): ContextStub => {
  const lookup = new Map<string, MockCDPSession>();
  for (const session of sessions) {
    lookup.set(session.id, session);
  }

  const initializedIds = new Set<string>();
  for (const session of sessions) {
    initializedIds.add(session.id);
  }

  const stub: ContextStub = {
    _sessionInit: initializedIds,
    conn: {
      getSession: (id: string) => lookup.get(id),
    },
    extraHttpHeaders: null,
  };
  return stub;
};

// Exercises V3Context.prototype.setExtraHTTPHeaders against a ContextStub
// backed by MockCDPSession instances.
describe("V3Context.setExtraHTTPHeaders", () => {
  // The real prototype method, retyped so a ContextStub can serve as `this`.
  type SetExtraHTTPHeaders = (
    this: ContextStub,
    headers: Record<string, string>,
  ) => Promise<void>;
  const setExtraHTTPHeaders = V3Context.prototype
    .setExtraHTTPHeaders as SetExtraHTTPHeaders;

  // Returns a fresh header object per call so tests never share mutable state.
  const testHeaders = (): Record<string, string> => ({
    "x-stagehand-test": "yes",
  });

  it("sends headers to all sessions", async () => {
    const sessions = [
      new MockCDPSession({}, "session-a"),
      new MockCDPSession({}, "session-b"),
    ];
    const ctx = makeContext(sessions);

    await setExtraHTTPHeaders.call(ctx, testHeaders());

    sessions.forEach((session) => {
      expect(session.callsFor("Network.enable").length).toBe(1);
      const [firstCall] = session.callsFor("Network.setExtraHTTPHeaders");
      expect(firstCall?.params).toEqual({
        headers: { "x-stagehand-test": "yes" },
      });
    });
  });

  it("throws a custom error with session failure details", async () => {
    // session-a rejects the header call; session-b accepts it.
    const failing = new MockCDPSession(
      {
        "Network.setExtraHTTPHeaders": () => {
          throw new Error("boom");
        },
      },
      "session-a",
    );
    const healthy = new MockCDPSession({}, "session-b");
    const ctx = makeContext([failing, healthy]);

    const pending = setExtraHTTPHeaders.call(ctx, testHeaders());

    await expect(pending).rejects.toBeInstanceOf(
      StagehandSetExtraHTTPHeadersError,
    );

    // Await the same promise again to inspect the rejection payload.
    try {
      await pending;
    } catch (caught) {
      const { failures } = caught as StagehandSetExtraHTTPHeadersError;
      expect(failures).toHaveLength(1);
      expect(failures[0]).toContain("session=session-a");
      expect(failures[0]).toContain("boom");
    }

    // Both sessions must have been attempted exactly once.
    for (const session of [failing, healthy]) {
      expect(session.callsFor("Network.setExtraHTTPHeaders").length).toBe(1);
    }
  });
});


================================================
FILE: packages/core/tests/unit/cookies.test.ts
================================================
import { beforeEach, describe, expect, it } from "vitest";
import {
  filterCookies,
  normalizeCookieParams,
  cookieMatchesFilter,
} from "../../lib/v3/understudy/cookies.js";
import { MockCDPSession } from "./helpers/mockCDPSession.js";
import type { V3Context } from "../../lib/v3/understudy/context.js";
import { Cookie, CookieParam } from "../../lib/v3/types/public/context.js";

/**
 * Test fixture factory: returns a baseline cookie ("sid" on example.com,
 * session-lived, non-secure, SameSite=Lax) with `overrides` applied on top.
 */
function makeCookie(overrides: Partial<Cookie> = {}): Cookie {
  const baseline: Cookie = {
    name: "sid",
    value: "abc123",
    domain: "example.com",
    path: "/",
    expires: -1,
    httpOnly: false,
    secure: false,
    sameSite: "Lax",
  };
  return { ...baseline, ...overrides };
}

/**
 * Expands a Cookie into the richer object shape the tests feed back as a
 * CDP Storage.getCookies entry: the cookie's own fields plus derived `size`
 * and `session` values and fixed priority/source metadata.
 */
function toCdpCookie(c: Cookie) {
  const { name, value, domain, path, expires, httpOnly, secure, sameSite } = c;
  return {
    name,
    value,
    domain,
    path,
    expires,
    httpOnly,
    secure,
    sameSite,
    size: name.length + value.length,
    // expires === -1 marks a session cookie.
    session: expires === -1,
    priority: "Medium",
    sameParty: false,
    sourceScheme: "Secure",
    sourcePort: 443,
  };
}

// Unit tests for filterCookies(cookies, urls): selecting cookies by the
// domain, path, and secure/protocol rules of the given URLs.
describe("filterCookies", () => {
  // Shared fixture: host-only (a), dot-prefixed + secure + /app (b),
  // unrelated domain (c), and subdomain (d) cookies.
  const cookies: Cookie[] = [
    makeCookie({ name: "a", domain: "example.com", path: "/", secure: false }),
    makeCookie({
      name: "b",
      domain: ".example.com",
      path: "/app",
      secure: true,
    }),
    makeCookie({ name: "c", domain: "other.com", path: "/", secure: false }),
    makeCookie({
      name: "d",
      domain: "sub.example.com",
      path: "/",
      secure: false,
    }),
  ];

  it("returns all cookies when urls is empty", () => {
    expect(filterCookies(cookies, [])).toEqual(cookies);
  });

  it("filters by domain (exact host match)", () => {
    const result = filterCookies(cookies, ["http://example.com/"]);
    const names = result.map((c) => c.name);
    expect(names).toContain("a");
    // "b" (.example.com) domain-matches but is secure — excluded on http://
    expect(names).not.toContain("b");
    expect(names).not.toContain("c");
    expect(names).not.toContain("d");
  });

  it("filters by domain (dot-prefixed domain matches on https)", () => {
    const result = filterCookies(cookies, ["https://example.com/app/settings"]);
    const names = result.map((c) => c.name);
    expect(names).toContain("a"); // example.com domain match, path "/" prefix
    expect(names).toContain("b"); // .example.com domain match + secure + https
  });

  it("filters by domain (subdomain matches dot-prefixed domain)", () => {
    const result = filterCookies(cookies, ["http://sub.example.com/"]);
    const names = result.map((c) => c.name);
    // "a" (example.com) → prepend dot → .example.com → matches .sub.example.com
    expect(names).toContain("a");
    // "b" (.example.com) domain-matches sub.example.com but is secure — excluded on http://
    expect(names).not.toContain("b");
    expect(names).toContain("d"); // sub.example.com matches exactly
    expect(names).not.toContain("c");
  });

  it("filters by path prefix", () => {
    const result = filterCookies(cookies, ["https://example.com/app/settings"]);
    const names = result.map((c) => c.name);
    expect(names).toContain("a"); // path "/" is a prefix of "/app/settings"
    expect(names).toContain("b"); // path "/app" is a prefix of "/app/settings"
  });

  it("excludes secure cookies for non-https URLs", () => {
    const result = filterCookies(cookies, ["http://example.com/app/page"]);
    const names = result.map((c) => c.name);
    expect(names).toContain("a");
    expect(names).not.toContain("b"); // secure cookie, http URL
  });

  it("allows secure cookies on loopback addresses regardless of protocol", () => {
    // Each case pairs a loopback cookie domain with a plain-http URL for it.
    const cases = [
      { domain: "localhost", url: "http://localhost/" },
      { domain: "127.0.0.1", url: "http://127.0.0.1/" },
      { domain: "[::1]", url: "http://[::1]/" },
    ];
    for (const { domain, url } of cases) {
      const cookie = makeCookie({ name: "loop", domain, secure: true });
      const result = filterCookies([cookie], [url]);
      expect(result).toHaveLength(1);
      expect(result[0]!.name).toBe("loop");
    }
  });

  it("matches against multiple URLs (union)", () => {
    const result = filterCookies(cookies, [
      "http://example.com/",
      "http://other.com/",
    ]);
    const names = result.map((c) => c.name);
    expect(names).toContain("a");
    expect(names).toContain("c");
  });

  it("returns empty array when no cookies match any URL", () => {
    const result = filterCookies(cookies, ["http://nomatch.dev/"]);
    expect(result).toHaveLength(0);
  });

  it("returns empty array when cookie list is empty", () => {
    const result = filterCookies([], ["http://example.com/"]);
    expect(result).toHaveLength(0);
  });

  it("does not match a sibling subdomain against a host-only domain", () => {
    // Cookie for "api.example.com" should NOT match "www.example.com"
    const apiCookie = makeCookie({ name: "api", domain: "api.example.com" });
    const result = filterCookies([apiCookie], ["http://www.example.com/"]);
    expect(result).toHaveLength(0);
  });

  it("does not match a parent domain against a more specific cookie", () => {
    // Cookie for "sub.example.com" should NOT match "example.com"
    const subCookie = makeCookie({ name: "sub", domain: "sub.example.com" });
    const result = filterCookies([subCookie], ["http://example.com/"]);
    expect(result).toHaveLength(0);
  });

  it("does not match when path does not prefix the URL path", () => {
    const deepCookie = makeCookie({
      name: "deep",
      domain: "example.com",
      path: "/admin",
    });
    const result = filterCookies([deepCookie], ["http://example.com/public"]);
    expect(result).toHaveLength(0);
  });

  it("does not match when cookie path is a string prefix but not a path boundary", () => {
    // "/foo" should NOT match "/foobar" — only "/foo", "/foo/", "/foo/bar"
    const cookie = makeCookie({
      name: "boundary",
      domain: "example.com",
      path: "/foo",
    });
    expect(filterCookies([cookie], ["http://example.com/foobar"])).toHaveLength(
      0,
    );
    expect(filterCookies([cookie], ["http://example.com/foo"])).toHaveLength(1);
    expect(
      filterCookies([cookie], ["http://example.com/foo/bar"]),
    ).toHaveLength(1);
  });

  it("matches root path against any URL path", () => {
    const rootCookie = makeCookie({
      name: "root",
      domain: "example.com",
      path: "/",
    });
    const result = filterCookies(
      [rootCookie],
      ["http://example.com/deeply/nested/page"],
    );
    expect(result).toHaveLength(1);
  });

  it("handles URL with port numbers", () => {
    const c = makeCookie({ name: "port", domain: "localhost", path: "/" });
    const result = filterCookies([c], ["http://localhost:3000/api"]);
    expect(result).toHaveLength(1);
  });

  it("handles URL with query string and fragment", () => {
    const c = makeCookie({ name: "q", domain: "example.com", path: "/" });
    const result = filterCookies(
      [c],
      ["http://example.com/page?q=1&r=2#section"],
    );
    expect(result).toHaveLength(1);
  });

  it("throws CookieValidationError for malformed URL", () => {
    // Only the error message is asserted here, not the error class.
    const c = makeCookie({ name: "a", domain: "example.com" });
    expect(() => filterCookies([c], ["not-a-valid-url"])).toThrow(
      /Invalid URL passed to cookies\(\)/,
    );
  });
});

// Unit tests for normalizeCookieParams: deriving domain/path/secure from a
// `url`, passing through explicit domain+path cookies, and validation errors.
describe("normalizeCookieParams", () => {
  it("passes through cookies with domain+path", () => {
    const input: CookieParam[] = [
      { name: "a", value: "1", domain: "example.com", path: "/" },
    ];
    const result = normalizeCookieParams(input);
    expect(result[0]!.domain).toBe("example.com");
    expect(result[0]!.path).toBe("/");
    expect(result[0]!.url).toBeUndefined();
  });

  it("derives domain, path, and secure from url", () => {
    const input: CookieParam[] = [
      { name: "a", value: "1", url: "https://example.com/app/page" },
    ];
    const result = normalizeCookieParams(input);
    expect(result[0]!.domain).toBe("example.com");
    // The derived path is the URL's directory ("/app/"), not the full pathname.
    expect(result[0]!.path).toBe("/app/");
    expect(result[0]!.secure).toBe(true);
    expect(result[0]!.url).toBeUndefined();
  });

  it("sets secure to false for http urls", () => {
    const input: CookieParam[] = [
      { name: "a", value: "1", url: "http://example.com/" },
    ];
    const result = normalizeCookieParams(input);
    expect(result[0]!.secure).toBe(false);
  });

  it("throws when neither url nor domain+path is provided", () => {
    expect(() => normalizeCookieParams([{ name: "a", value: "1" }])).toThrow(
      /must have a url or a domain\/path pair/,
    );
  });

  it("throws when both url and domain are provided", () => {
    expect(() =>
      normalizeCookieParams([
        { name: "a", value: "1", url: "https://x.com/", domain: "x.com" },
      ]),
    ).toThrow(/should have either url or domain/);
  });

  it("throws when both url and path are provided", () => {
    expect(() =>
      normalizeCookieParams([
        { name: "a", value: "1", url: "https://x.com/", path: "/" },
      ]),
    ).toThrow(/should have either url or path/);
  });

  it("throws for invalid expires (negative, not -1)", () => {
    expect(() =>
      normalizeCookieParams([
        { name: "a", value: "1", domain: "x.com", path: "/", expires: -5 },
      ]),
    ).toThrow(/invalid expires/);
  });

  it("allows expires of -1 (session cookie)", () => {
    const result = normalizeCookieParams([
      { name: "a", value: "1", domain: "x.com", path: "/", expires: -1 },
    ]);
    expect(result[0]!.expires).toBe(-1);
  });

  it("allows a positive expires timestamp", () => {
    // One hour from now, in seconds since the epoch.
    const future = Math.floor(Date.now() / 1000) + 3600;
    const result = normalizeCookieParams([
      { name: "a", value: "1", domain: "x.com", path: "/", expires: future },
    ]);
    expect(result[0]!.expires).toBe(future);
  });

  it("throws for about:blank url", () => {
    expect(() =>
      normalizeCookieParams([{ name: "a", value: "1", url: "about:blank" }]),
    ).toThrow(/Blank page/);
  });

  it("throws for data: url", () => {
    expect(() =>
      normalizeCookieParams([
        { name: "a", value: "1", url: "data:text/html,hi" },
      ]),
    ).toThrow(/Data URL/);
  });

  it("throws CookieValidationError for malformed url", () => {
    // Only the error message is asserted here, not the error class.
    expect(() =>
      normalizeCookieParams([{ name: "a", value: "1", url: "not-a-url" }]),
    ).toThrow(/Cookie "a" has an invalid url/);
  });

  it("throws when sameSite is None but secure is false", () => {
    expect(() =>
      normalizeCookieParams([
        {
          name: "a",
          value: "1",
          domain: "x.com",
          path: "/",
          sameSite: "None",
          secure: false,
        },
      ]),
    ).toThrow(/sameSite: "None" without secure: true/);
  });

  it("throws when sameSite is None and secure is omitted (undefined)", () => {
    // CDP defaults secure to false when omitted, so the browser will reject it.
    expect(() =>
      normalizeCookieParams([
        { name: "a", value: "1", domain: "x.com", path: "/", sameSite: "None" },
      ]),
    ).toThrow(/sameSite: "None" without secure: true/);
  });

  it("does NOT throw when sameSite is None and secure is true", () => {
    const result = normalizeCookieParams([
      {
        name: "a",
        value: "1",
        domain: "x.com",
        path: "/",
        sameSite: "None",
        secure: true,
      },
    ]);
    expect(result[0]!.sameSite).toBe("None");
    expect(result[0]!.secure).toBe(true);
  });

  it("derives root path from URL with no trailing path segments", () => {
    const result = normalizeCookieParams([
      { name: "a", value: "1", url: "https://example.com" },
    ]);
    // URL("https://example.com").pathname is "/", lastIndexOf("/") + 1 = 1 → "/"
    expect(result[0]!.path).toBe("/");
  });

  it("handles URL with port number", () => {
    const result = normalizeCookieParams([
      { name: "a", value: "1", url: "https://localhost:3000/api/v1" },
    ]);
    // The port is not part of the derived domain.
    expect(result[0]!.domain).toBe("localhost");
    expect(result[0]!.path).toBe("/api/");
    expect(result[0]!.secure).toBe(true);
  });

  it("handles URL with query string (ignores query)", () => {
    const result = normalizeCookieParams([
      { name: "a", value: "1", url: "https://example.com/page?q=1" },
    ]);
    expect(result[0]!.domain).toBe("example.com");
    expect(result[0]!.path).toBe("/");
  });

  it("normalises multiple cookies in a single call", () => {
    const result = normalizeCookieParams([
      { name: "a", value: "1", url: "https://one.com/x" },
      { name: "b", value: "2", domain: "two.com", path: "/" },
      { name: "c", value: "3", url: "http://three.com/y/z" },
    ]);
    expect(result).toHaveLength(3);
    expect(result[0]!.domain).toBe("one.com");
    expect(result[1]!.domain).toBe("two.com");
    expect(result[2]!.domain).toBe("three.com");
    expect(result[2]!.secure).toBe(false);
  });

  it("does not mutate the original input array", () => {
    const input: CookieParam[] = [
      { name: "a", value: "1", url: "https://example.com/app" },
    ];
    // Shallow snapshot taken before the call (a copy, not Object.freeze).
    const frozen = { ...input[0]! };
    normalizeCookieParams(input);
    expect(input[0]).toEqual(frozen);
  });

  it("preserves optional fields that are explicitly set", () => {
    const result = normalizeCookieParams([
      {
        name: "full",
        value: "val",
        domain: "x.com",
        path: "/p",
        expires: 9999999999,
        httpOnly: true,
        secure: true,
        sameSite: "Strict",
      },
    ]);
    const c = result[0]!;
    expect(c.httpOnly).toBe(true);
    expect(c.secure).toBe(true);
    expect(c.sameSite).toBe("Strict");
    expect(c.expires).toBe(9999999999);
  });

  it("allows expires of 0 (epoch — effectively expired)", () => {
    // 0 is a positive-ish edge case; browsers treat it as already expired
    const result = normalizeCookieParams([
      { name: "a", value: "1", domain: "x.com", path: "/", expires: 0 },
    ]);
    expect(result[0]!.expires).toBe(0);
  });

  it("throws on the first invalid cookie in a batch", () => {
    expect(() =>
      normalizeCookieParams([
        { name: "ok", value: "1", domain: "x.com", path: "/" },
        { name: "bad", value: "2" }, // missing url/domain+path
      ]),
    ).toThrow(/Cookie "bad"/);
  });

  it("includes cookie name in every error message", () => {
    // One thunk per validation failure: missing target, url+domain conflict,
    // blank-page url, and sameSite None without secure.
    const cases = [
      () => normalizeCookieParams([{ name: "NAMED", value: "1" }]),
      () =>
        normalizeCookieParams([
          { name: "NAMED", value: "1", url: "https://x.com/", domain: "x" },
        ]),
      () =>
        normalizeCookieParams([
          { name: "NAMED", value: "1", url: "about:blank" },
        ]),
      () =>
        normalizeCookieParams([
          {
            name: "NAMED",
            value: "1",
            domain: "x.com",
            path: "/",
            sameSite: "None",
            secure: false,
          },
        ]),
    ];
    for (const fn of cases) {
      expect(fn).toThrow(/NAMED/);
    }
  });
});

// Unit tests for cookieMatchesFilter(cookie, filter): each of name/domain/path
// may be an exact string or a RegExp, and all supplied filters must match.
describe("cookieMatchesFilter", () => {
  // Shared subject for most tests below.
  const cookie = makeCookie({
    name: "session",
    domain: ".example.com",
    path: "/app",
  });

  it("matches when all filters match (exact strings)", () => {
    expect(
      cookieMatchesFilter(cookie, {
        name: "session",
        domain: ".example.com",
        path: "/app",
      }),
    ).toBe(true);
  });

  it("does not match when name differs", () => {
    expect(cookieMatchesFilter(cookie, { name: "other" })).toBe(false);
  });

  it("does not match when domain differs", () => {
    expect(cookieMatchesFilter(cookie, { domain: "other.com" })).toBe(false);
  });

  it("does not match when path differs", () => {
    expect(cookieMatchesFilter(cookie, { path: "/other" })).toBe(false);
  });

  it("matches with regex name", () => {
    expect(cookieMatchesFilter(cookie, { name: /^sess/ })).toBe(true);
    expect(cookieMatchesFilter(cookie, { name: /^nope/ })).toBe(false);
  });

  it("matches with regex domain", () => {
    expect(cookieMatchesFilter(cookie, { domain: /example\.com$/ })).toBe(true);
    expect(cookieMatchesFilter(cookie, { domain: /^other/ })).toBe(false);
  });

  it("matches with regex path", () => {
    expect(cookieMatchesFilter(cookie, { path: /^\/app/ })).toBe(true);
  });

  it("undefined filters match everything", () => {
    expect(cookieMatchesFilter(cookie, {})).toBe(true);
    expect(cookieMatchesFilter(cookie, { name: undefined })).toBe(true);
  });

  it("requires ALL filters to match (AND logic)", () => {
    // name matches but domain does not
    expect(
      cookieMatchesFilter(cookie, { name: "session", domain: "wrong.com" }),
    ).toBe(false);
  });

  it("handles global regex lastIndex correctly", () => {
    // A /g regex is stateful: a stale lastIndex past the end of the input
    // would make a naive RegExp.test() call return false.
    const re = /sess/g;
    re.lastIndex = 999;
    expect(cookieMatchesFilter(cookie, { name: re })).toBe(true);
  });

  it("exact string does not do substring matching", () => {
    // filter name "sess" should NOT match cookie name "session"
    expect(cookieMatchesFilter(cookie, { name: "sess" })).toBe(false);
  });

  it("regex can do substring matching", () => {
    // regex /sess/ SHOULD match cookie name "session" (substring)
    expect(cookieMatchesFilter(cookie, { name: /sess/ })).toBe(true);
  });

  it("works with all three regex filters combined", () => {
    expect(
      cookieMatchesFilter(cookie, {
        name: /^session$/,
        domain: /example/,
        path: /^\/app$/,
      }),
    ).toBe(true);

    // One of three fails
    expect(
      cookieMatchesFilter(cookie, {
        name: /^session$/,
        domain: /example/,
        path: /^\/wrong$/,
      }),
    ).toBe(false);
  });

  it("empty string filter only matches empty cookie property", () => {
    // An empty-string filter is an exact match against "", not "no filter".
    const emptyPathCookie = makeCookie({
      name: "x",
      domain: "a.com",
      path: "",
    });
    expect(cookieMatchesFilter(emptyPathCookie, { path: "" })).toBe(true);
    expect(cookieMatchesFilter(cookie, { path: "" })).toBe(false);
  });

  it("is called once per cookie (no cross-contamination between calls)", () => {
    // The same filter object is reused across two different cookies.
    const c1 = makeCookie({ name: "alpha", domain: "a.com", path: "/" });
    const c2 = makeCookie({ name: "beta", domain: "b.com", path: "/x" });
    const filter = { name: "alpha", domain: "a.com" };
    expect(cookieMatchesFilter(c1, filter)).toBe(true);
    expect(cookieMatchesFilter(c2, filter)).toBe(false);
  });
});

describe("V3Context cookie methods", () => {
  // We test V3Context methods by constructing a minimal instance with a mock
  // CDP connection. V3Context.create() requires a real WebSocket, so we build
  // one via type-casting a MockCDPSession into the `conn` slot.

  // eslint-disable-next-line @typescript-eslint/no-explicit-any
  let V3ContextClass: { prototype: V3Context } & Record<string, any>;

  // Resolve the V3Context class via dynamic import before every test; the
  // top-of-file import of V3Context is type-only, so this supplies the runtime value.
  beforeEach(async () => {
    const mod = await import("../../lib/v3/understudy/context.js");
    V3ContextClass = mod.V3Context as typeof V3ContextClass;
  });

  /**
   * Builds a V3Context-shaped object without running the constructor: the
   * object inherits the real prototype (so real method implementations run)
   * and carries a read-only `conn` backed by a MockCDPSession with id "root".
   */
  function makeContext(
    cdpHandlers: Record<string, (params?: Record<string, unknown>) => unknown>,
  ): V3Context {
    const connection = new MockCDPSession(cdpHandlers, "root");
    const instance = Object.create(V3ContextClass.prototype) as V3Context & {
      conn: MockCDPSession;
    };
    // Mirror the readonly `conn` field with a non-writable data property.
    const connDescriptor = { value: connection, writable: false };
    Object.defineProperty(instance, "conn", connDescriptor);
    return instance;
  }

  /** Returns the mock connection stored on a context's `conn` slot. */
  function getMockConn(ctx: V3Context): MockCDPSession {
    const { conn } = ctx as unknown as { conn: MockCDPSession };
    return conn;
  }

  // Tests for V3Context.cookies(): reading via the mocked Storage.getCookies
  // handler, optional URL filtering, and mapping CDP cookies to Cookie objects.
  describe("cookies()", () => {
    it("returns all cookies from Storage.getCookies", async () => {
      const cdpCookies = [
        toCdpCookie(makeCookie({ name: "a", domain: "example.com" })),
        toCdpCookie(makeCookie({ name: "b", domain: "other.com" })),
      ];
      const ctx = makeContext({
        "Storage.getCookies": () => ({ cookies: cdpCookies }),
      });

      const result = await ctx.cookies();
      expect(result).toHaveLength(2);
      expect(result.map((c) => c.name)).toEqual(["a", "b"]);
    });

    it("filters by URL when provided as string", async () => {
      const cdpCookies = [
        toCdpCookie(makeCookie({ name: "a", domain: "example.com" })),
        toCdpCookie(makeCookie({ name: "b", domain: "other.com" })),
      ];
      const ctx = makeContext({
        "Storage.getCookies": () => ({ cookies: cdpCookies }),
      });

      const result = await ctx.cookies("http://example.com/");
      expect(result).toHaveLength(1);
      expect(result[0]!.name).toBe("a");
    });

    it("filters by URL when provided as array", async () => {
      const cdpCookies = [
        toCdpCookie(makeCookie({ name: "a", domain: "example.com" })),
        toCdpCookie(makeCookie({ name: "b", domain: "other.com" })),
      ];
      const ctx = makeContext({
        "Storage.getCookies": () => ({ cookies: cdpCookies }),
      });

      const result = await ctx.cookies(["http://other.com/"]);
      expect(result).toHaveLength(1);
      expect(result[0]!.name).toBe("b");
    });

    it("defaults sameSite to Lax when CDP returns undefined", async () => {
      // Override sameSite after conversion to simulate CDP omitting the field.
      const cdpCookie = {
        ...toCdpCookie(makeCookie()),
        sameSite: undefined as string | undefined,
      };
      const ctx = makeContext({
        "Storage.getCookies": () => ({ cookies: [cdpCookie] }),
      });

      const result = await ctx.cookies();
      expect(result[0]!.sameSite).toBe("Lax");
    });

    it("returns empty array when browser has no cookies", async () => {
      const ctx = makeContext({
        "Storage.getCookies": () => ({ cookies: [] }),
      });
      const result = await ctx.cookies();
      expect(result).toEqual([]);
    });

    it("maps all CDP cookie fields to our Cookie type", async () => {
      const cdpCookie = toCdpCookie(
        makeCookie({
          name: "full",
          value: "v",
          domain: ".test.com",
          path: "/p",
          expires: 1700000000,
          httpOnly: true,
          secure: true,
          sameSite: "Strict",
        }),
      );
      const ctx = makeContext({
        "Storage.getCookies": () => ({ cookies: [cdpCookie] }),
      });

      const result = await ctx.cookies();
      // toEqual against the exact 8-field shape: none of the values may change.
      expect(result[0]).toEqual({
        name: "full",
        value: "v",
        domain: ".test.com",
        path: "/p",
        expires: 1700000000,
        httpOnly: true,
        secure: true,
        sameSite: "Strict",
      });
    });

    it("strips extra CDP fields (size, priority, etc.) from result", async () => {
      const cdpCookie = toCdpCookie(makeCookie({ name: "stripped" }));
      const ctx = makeContext({
        "Storage.getCookies": () => ({ cookies: [cdpCookie] }),
      });

      const result = await ctx.cookies();
      const keys = Object.keys(result[0]!);
      expect(keys).not.toContain("size");
      expect(keys).not.toContain("priority");
      expect(keys).not.toContain("sourceScheme");
      expect(keys).not.toContain("sourcePort");
    });

    it("calls Storage.getCookies exactly once per invocation", async () => {
      const ctx = makeContext({
        "Storage.getCookies": () => ({ cookies: [] }),
      });

      await ctx.cookies();
      await ctx.cookies("http://example.com");

      // Two cookies() invocations → two recorded CDP calls in total.
      const calls = getMockConn(ctx).callsFor("Storage.getCookies");
      expect(calls).toHaveLength(2);
    });
  });

  describe("addCookies()", () => {
    it("sends all cookies in a single Storage.setCookies call", async () => {
      const ctx = makeContext({
        "Storage.setCookies": () => ({}),
      });

      await ctx.addCookies([
        { name: "a", value: "1", domain: "example.com", path: "/" },
        { name: "b", value: "2", domain: "other.com", path: "/" },
      ]);

      const calls = getMockConn(ctx).callsFor("Storage.setCookies");
      expect(calls).toHaveLength(1);
      expect(calls[0]!.params).toMatchObject({
        cookies: [
          { name: "a", domain: "example.com" },
          { name: "b", domain: "other.com" },
        ],
      });
    });

    it("derives domain/path/secure from url", async () => {
      const ctx = makeContext({
        "Storage.setCookies": () => ({}),
      });

      await ctx.addCookies([
        { name: "a", value: "1", url: "https://example.com/app/page" },
      ]);

      const calls = getMockConn(ctx).callsFor("Storage.setCookies");
      expect(calls[0]!.params).toMatchObject({
        cookies: [
          { name: "a", domain: "example.com", path: "/app/", secure: true },
        ],
      });
    });

    it("throws when Storage.setCookies fails", async () => {
      const ctx = makeContext({
        "Storage.setCookies": () => {
          throw new Error("CDP failure");
        },
      });

      await expect(
        ctx.addCookies([
          { name: "bad", value: "x", domain: "example.com", path: "/" },
        ]),
      ).rejects.toThrow(/Failed to set cookies \["bad"\]/);
    });

    it("throws for sameSite None without secure", async () => {
      const ctx = makeContext({
        "Storage.setCookies": () => ({}),
      });

      await expect(
        ctx.addCookies([
          {
            name: "x",
            value: "1",
            domain: "example.com",
            path: "/",
            sameSite: "None",
            secure: false,
          },
        ]),
      ).rejects.toThrow(/sameSite: "None" without secure: true/);
    });

    // An empty batch must not produce any Storage.setCookies call.
    it("does nothing when passed an empty array", async () => {
      const context = makeContext({ "Storage.setCookies": () => ({}) });

      await context.addCookies([]);

      const setCalls = getMockConn(context).callsFor("Storage.setCookies");
      expect(setCalls).toHaveLength(0);
    });

    // Every field of a fully specified cookie must be forwarded unchanged.
    it("sends all cookie fields to CDP (including optional ones)", async () => {
      // Builds a fresh object per call so the input and the expectation never
      // share a reference.
      const fullCookie = () => ({
        name: "full",
        value: "val",
        domain: "x.com",
        path: "/p",
        expires: 9999999999,
        httpOnly: true,
        secure: true,
        sameSite: "Strict" as const,
      });
      const context = makeContext({ "Storage.setCookies": () => ({}) });

      await context.addCookies([fullCookie()]);

      const [firstCall] = getMockConn(context).callsFor("Storage.setCookies");
      expect(firstCall!.params).toEqual({ cookies: [fullCookie()] });
    });

    // When the batch fails, the rejection must list every cookie name in it.
    it("error message includes all cookie names when batch fails", async () => {
      const failingSetCookies = () => {
        throw new Error("CDP failure");
      };
      const context = makeContext({ "Storage.setCookies": failingSetCookies });

      const pending = context.addCookies([
        { name: "alpha", value: "1", domain: "a.com", path: "/" },
        { name: "beta", value: "2", domain: "b.com", path: "/" },
      ]);

      await expect(pending).rejects.toThrow(
        /Failed to set cookies \["alpha", "beta"\]/,
      );
    });
  });

  // Covers both clearCookies() paths asserted below: the unfiltered call that
  // only sends Storage.clearCookies, and the filtered call that reads the jar,
  // clears it, and re-adds the cookies that did not match the filter.
  describe("clearCookies()", () => {
    // Jar contents served by the mocked Storage.getCookies in most tests.
    const cdpCookies = [
      { name: "session", domain: "example.com", path: "/" },
      { name: "_ga", domain: ".example.com", path: "/" },
      { name: "pref", domain: "other.com", path: "/settings" },
    ].map((fields) => toCdpCookie(makeCookie(fields)));

    type Ctx = ReturnType<typeof makeContext>;

    // Handlers for a jar holding `cdpCookies` in which every CDP call succeeds.
    const workingJar = () => ({
      "Storage.getCookies": () => ({ cookies: [...cdpCookies] }),
      "Storage.clearCookies": () => ({}),
      "Storage.setCookies": () => ({}),
    });

    // Recorded calls to one CDP method on the context's mock connection.
    const callsTo = (ctx: Ctx, method: string) =>
      getMockConn(ctx).callsFor(method);

    // Names of the cookies passed to the first Storage.setCookies call.
    const reAddedNames = (ctx: Ctx) =>
      (
        callsTo(ctx, "Storage.setCookies")[0]!.params?.cookies as Array<{
          name: string;
        }>
      ).map((cookie) => cookie.name);

    it("uses atomic Storage.clearCookies when called with no options", async () => {
      const ctx = makeContext({ "Storage.clearCookies": () => ({}) });

      await ctx.clearCookies();

      expect(callsTo(ctx, "Storage.clearCookies")).toHaveLength(1);

      // Should NOT have fetched or re-set anything
      expect(callsTo(ctx, "Storage.getCookies")).toHaveLength(0);
      expect(callsTo(ctx, "Storage.setCookies")).toHaveLength(0);
    });

    it("clears and re-adds only non-matching cookies (name filter)", async () => {
      const ctx = makeContext(workingJar());

      await ctx.clearCookies({ name: "_ga" });

      expect(callsTo(ctx, "Storage.clearCookies")).toHaveLength(1);
      expect(callsTo(ctx, "Storage.setCookies")).toHaveLength(1);
      expect(reAddedNames(ctx)).toEqual(["session", "pref"]);
    });

    it("clears and re-adds only non-matching cookies (domain filter)", async () => {
      const ctx = makeContext(workingJar());

      await ctx.clearCookies({ domain: "other.com" });

      expect(reAddedNames(ctx)).toEqual(["session", "_ga"]);
    });

    it("clears and re-adds only non-matching cookies (regex name)", async () => {
      const ctx = makeContext(workingJar());

      await ctx.clearCookies({ name: /^_ga/ });

      expect(reAddedNames(ctx)).toEqual(["session", "pref"]);
    });

    it("applies AND logic across multiple filters", async () => {
      const ctx = makeContext(workingJar());

      await ctx.clearCookies({ name: "session", domain: "example.com" });

      expect(reAddedNames(ctx)).toEqual(["_ga", "pref"]);
    });

    it("does nothing when filter matches no cookies", async () => {
      const ctx = makeContext(workingJar());

      await ctx.clearCookies({ name: "nonexistent" });

      expect(callsTo(ctx, "Storage.clearCookies")).toHaveLength(0);
      expect(callsTo(ctx, "Storage.setCookies")).toHaveLength(0);
    });

    it("clears without re-adding when filter matches all cookies", async () => {
      const ctx = makeContext(workingJar());

      await ctx.clearCookies({ name: /.*/ });

      expect(callsTo(ctx, "Storage.clearCookies")).toHaveLength(1);
      expect(callsTo(ctx, "Storage.setCookies")).toHaveLength(0);
    });

    it("handles regex that matches multiple cookies", async () => {
      const ctx = makeContext({
        ...workingJar(),
        // This test needs its own jar with several `_ga*` cookies.
        "Storage.getCookies": () => ({
          cookies: ["_ga_ABC", "_ga_DEF", "_gid", "session"].map((name) =>
            toCdpCookie(makeCookie({ name, domain: "example.com", path: "/" })),
          ),
        }),
      });

      await ctx.clearCookies({ name: /^_ga/ });

      const kept = reAddedNames(ctx);
      expect(kept).toContain("_gid");
      expect(kept).toContain("session");
      expect(kept).not.toContain("_ga_ABC");
      expect(kept).not.toContain("_ga_DEF");
    });

    it("regex domain filter combined with path filter", async () => {
      const ctx = makeContext(workingJar());

      await ctx.clearCookies({ domain: /example/, path: "/settings" });

      expect(callsTo(ctx, "Storage.clearCookies")).toHaveLength(0);
      expect(callsTo(ctx, "Storage.setCookies")).toHaveLength(0);
    });

    it("clearCookies with empty options object uses atomic clear (same as no args)", async () => {
      const ctx = makeContext({ "Storage.clearCookies": () => ({}) });

      await ctx.clearCookies({});

      expect(callsTo(ctx, "Storage.clearCookies")).toHaveLength(1);
    });

    it("clears and re-adds only non-matching cookies (path filter)", async () => {
      const ctx = makeContext(workingJar());

      await ctx.clearCookies({ path: "/settings" });

      expect(callsTo(ctx, "Storage.clearCookies")).toHaveLength(1);
      expect(callsTo(ctx, "Storage.setCookies")).toHaveLength(1);

      const kept = reAddedNames(ctx);
      expect(kept).toEqual(["session", "_ga"]);
      expect(kept).not.toContain("pref");
    });

    it("throws when Storage.getCookies fails during filtered clear", async () => {
      const ctx = makeContext({
        ...workingJar(),
        "Storage.getCookies": () => {
          throw new Error("CDP getCookies failure");
        },
      });

      await expect(ctx.clearCookies({ name: "session" })).rejects.toThrow(
        /CDP getCookies failure/,
      );

      // clearCookies and setCookies should never have been called
      expect(callsTo(ctx, "Storage.clearCookies")).toHaveLength(0);
      expect(callsTo(ctx, "Storage.setCookies")).toHaveLength(0);
    });

    it("throws when Storage.clearCookies fails during filtered clear", async () => {
      const ctx = makeContext({
        ...workingJar(),
        "Storage.clearCookies": () => {
          throw new Error("CDP clearCookies failure");
        },
      });

      await expect(ctx.clearCookies({ name: "session" })).rejects.toThrow(
        /CDP clearCookies failure/,
      );

      // setCookies should never have been called — cookies are untouched
      expect(callsTo(ctx, "Storage.setCookies")).toHaveLength(0);
    });

    it("throws when Storage.setCookies fails during re-add, cookies are already wiped", async () => {
      const ctx = makeContext({
        ...workingJar(),
        "Storage.setCookies": () => {
          throw new Error("CDP setCookies failure");
        },
      });

      await expect(ctx.clearCookies({ name: "session" })).rejects.toThrow(
        /cookie jar is now empty/,
      );

      // clearCookies WAS called — cookies are gone
      expect(callsTo(ctx, "Storage.clearCookies")).toHaveLength(1);
    });
  });

  // Pins how cookies() reports the sameSite value it receives from
  // Storage.getCookies.
  describe("cookies() sameSite mapping", () => {
    // Serves a single cookie carrying `sameSite` from the mocked
    // Storage.getCookies and returns the sameSite that cookies() reports.
    const sameSiteReadBack = async (sameSite: string) => {
      const cdpCookie = { ...toCdpCookie(makeCookie()), sameSite };
      const context = makeContext({
        "Storage.getCookies": () => ({ cookies: [cdpCookie] }),
      });
      const [first] = await context.cookies();
      return first!.sameSite;
    };

    it("passes through valid sameSite values as-is", async () => {
      for (const sameSite of ["Strict", "Lax", "None"] as const) {
        expect(await sameSiteReadBack(sameSite)).toBe(sameSite);
      }
    });

    it("does not normalize lowercase sameSite values from CDP", async () => {
      // CDP may return lowercase values; the current implementation casts
      // without normalizing, so "none" passes through as-is.
      // This documents the current behavior: lowercase is NOT normalized.
      expect(await sameSiteReadBack("none")).toBe("none");
    });
  });
});


================================================
FILE: packages/core/tests/unit/flowlogger-capturing-cdp.test.ts
================================================
import { EventEmitter } from "node:events";
import { describe, it, expect } from "vitest";
import { CdpConnection } from "../../lib/v3/understudy/cdp.js";
import { InMemoryEventSink } from "../../lib/v3/flowlogger/EventSink.js";
import { EventEmitterWithWildcardSupport } from "../../lib/v3/flowlogger/EventEmitter.js";
import { EventStore } from "../../lib/v3/flowlogger/EventStore.js";
import { FlowEvent, FlowLogger } from "../../lib/v3/flowlogger/FlowLogger.js";

/**
 * Subscribes to the `"*"` channel of `bus` and passes every received
 * `FlowEvent` instance to `store.emit`; other payloads are ignored.
 *
 * @returns a function that removes the listener again.
 */
function attachEventStoreToBus(
  store: EventStore,
  bus: EventEmitterWithWildcardSupport,
): () => void {
  function forwardToStore(candidate: unknown): void {
    if (!(candidate instanceof FlowEvent)) {
      return;
    }
    // The result of store.emit is intentionally not awaited here.
    void store.emit(candidate);
  }

  bus.on("*", forwardToStore);

  return function detach(): void {
    bus.off("*", forwardToStore);
  };
}

/**
 * In-memory socket double: records what is sent and emits a `close` event
 * when closed, without touching the network.
 */
class FakeSocket extends EventEmitter {
  /** Every payload passed to `send`, in call order. */
  sentPayloads: string[] = [];
  /** Starts at 1 and becomes 3 once `close` has run (the WebSocket OPEN / CLOSED values). */
  readyState = 1;

  /** Records the payload instead of transmitting it. */
  send(payload: string): void {
    this.sentPayloads.push(payload);
  }

  /** Marks the socket closed, then notifies `close` listeners with code 1000 and an empty reason. */
  close(): void {
    const closedState = 3;
    const closeCode = 1000;
    const closeReason = "";

    this.readyState = closedState;
    this.emit("close", closeCode, closeReason);
  }
}

/**
 * Builds a `CdpConnection` on top of a `FakeSocket`.
 *
 * The production constructor is private, so the class is re-typed as a
 * publicly constructible one. This lets tests drive raw websocket messages
 * without a real browser.
 */
function createConnection(socket: FakeSocket): CdpConnection {
  type ConstructibleConnection = new (ws: FakeSocket) => CdpConnection;

  const Constructible = CdpConnection as unknown as ConstructibleConnection;
  return new Constructible(socket);
}

/**
 * Returns the first event accepted by `predicate`.
 *
 * When nothing matches, the `expect` assertion fails with a message built
 * from `description`.
 */
function requireEvent(
  events: FlowEvent[],
  predicate: (event: FlowEvent) => boolean,
  description: string,
): FlowEvent {
  let found: FlowEvent | undefined;
  for (const candidate of events) {
    if (predicate(candidate)) {
      found = candidate;
      break;
    }
  }

  expect(found, `missing ${description}`).toBeDefined();
  return found as FlowEvent;
}

// Regression test: a CDP call issued from a session event handler must still
// be recorded under the flow event that was active when the original call was
// made.
describe("flow logger cdp context", () => {
  it("preserves the active parent chain when a session event handler issues a nested CDP call", async () => {
    const sessionId = "session-test";
    const socket = new FakeSocket();
    const eventBus = new EventEmitterWithWildcardSupport();
    const sink = new InMemoryEventSink();
    const eventStore = new EventStore(sessionId, undefined, sink);

    const detachBus = attachEventStoreToBus(eventStore, eventBus);

    // Cleanup lives in `finally` so that a failed assertion still detaches
    // the bus listener and destroys the store.
    try {
      const conn = createConnection(socket);
      conn.flowLoggerContext = FlowLogger.init(sessionId, eventBus);

      // `onMessage` is not publicly accessible, so the connection is re-typed
      // to feed it raw protocol messages as if they had arrived on the socket.
      const deliver = (message: Record<string, unknown>): void => {
        (conn as unknown as { onMessage(json: string): void }).onMessage(
          JSON.stringify(message),
        );
      };

      // Seed the target/session mapping the same way a real attach flow would
      // before any session-scoped messages are dispatched.
      deliver({
        method: "Target.attachedToTarget",
        params: {
          sessionId: "target-session",
          targetInfo: { targetId: "target-1" },
        },
      });

      const session = conn.getSession("target-session");
      expect(session).toBeDefined();

      session!.on("Runtime.consoleAPICalled", () => {
        // This nested send used to lose its parent chain because the callback ran
        // after the original ALS scope had already unwound.
        void session!.send("Runtime.evaluate", {
          expression: "2 + 2",
        });
      });

      await FlowLogger.runWithLogging(
        {
          context: conn.flowLoggerContext,
          eventType: "SyntheticParentEvent",
        },
        async () => {
          // Not awaited: the fake socket never answers, so only the act of
          // sending matters here.
          void session!.send("Page.navigate", {
            url: "https://example.com",
          });
        },
        [],
      );

      deliver({
        method: "Runtime.consoleAPICalled",
        sessionId: "target-session",
        params: { type: "log" },
      });

      // The nested Runtime.evaluate call should still attach under the synthetic
      // parent event even though it was triggered by a later session callback.
      const events = await eventStore.query({});
      const parentEvent = requireEvent(
        events,
        (event) => event.eventType === "SyntheticParentEvent",
        "SyntheticParentEvent",
      );
      const nestedCallEvent = requireEvent(
        events,
        (event) =>
          event.eventType === "CdpCallEvent" &&
          String(event.data.method) === "Runtime.evaluate",
        "nested Runtime.evaluate CdpCallEvent",
      );

      expect(nestedCallEvent.eventParentIds).toEqual([parentEvent.eventId]);
    } finally {
      detachBus();
      await eventStore.destroy();
    }
  });
});


================================================
FILE: packages/core/tests/unit/flowlogger-capturing-llm.test.ts
================================================
import { describe, expect, it } from "vitest";
import { FlowLogger } from "../../lib/v3/flowlogger/FlowLogger.js";

// The LLM logging entry points must be safe to call when no flow context is
// active.
describe("flow logger llm logging", () => {
  it("no-ops direct llm logging calls when no flow context is active", () => {
    // These helpers are called from multiple model adapters, so they must stay
    // safe even when a test or utility invokes them outside any ALS flow scope.
    const logRequest = () =>
      FlowLogger.logLlmRequest({
        requestId: "req-1",
        model: "mock-model",
        prompt: "hello",
      });
    const logResponse = () =>
      FlowLogger.logLlmResponse({
        requestId: "req-1",
        model: "mock-model",
        output: "world",
        inputTokens: 1,
        outputTokens: 1,
      });

    expect(logRequest).not.toThrow();
    expect(logResponse).not.toThrow();
  });

  it("does not throw from llm middleware when no flow context is active", async () => {
    const middleware = FlowLogger.createLlmLoggingMiddleware("mock-model");

    // Only the fields this test relies on are supplied, hence the `never` cast.
    const generateArgs = {
      doGenerate: async () => ({
        text: "done",
        usage: {
          inputTokens: 1,
          outputTokens: 1,
          totalTokens: 2,
        },
      }),
      params: {
        prompt: [],
      },
    } as never;

    // Missing flow context should degrade to a silent no-op and preserve the
    // underlying model result.
    const generated = middleware.wrapGenerate(generateArgs);
    await expect(generated).resolves.toMatchObject({
      text: "done",
    });
  });
});


================================================
FILE: packages/core/tests/unit/flowlogger-eventstore.test.ts
================================================
import { afterEach, describe, expect, it } from "vitest";
import { EventStore } from "../../lib/v3/flowlogger/EventStore.js";
import { EventEmitterWithWildcardSupport } from "../../lib/v3/flowlogger/EventEmitter.js";
import { FlowEvent } from "../../lib/v3/flowlogger/FlowLogger.js";

/**
 * Subscribes to the `"*"` channel of `bus` and passes every received
 * `FlowEvent` instance to `store.emit`; other payloads are ignored.
 *
 * @returns a function that removes the listener again.
 */
function attachEventStoreToBus(
  store: EventStore,
  bus: EventEmitterWithWildcardSupport,
): () => void {
  function forwardToStore(candidate: unknown): void {
    if (!(candidate instanceof FlowEvent)) {
      return;
    }
    // The result of store.emit is intentionally not awaited here.
    void store.emit(candidate);
  }

  bus.on("*", forwardToStore);

  return function detach(): void {
    bus.off("*", forwardToStore);
  };
}

/**
 * Replaces `process.stderr.write` with a recorder, then builds an
 * `EventStore` for "session-test" that is fed from a fresh event bus.
 *
 * This function does not restore the original `process.stderr.write`; the
 * caller is responsible for that.
 *
 * @returns `writes` (every chunk written to stderr, stringified), the `store`,
 *   the `bus`, and `detachBus`, which removes the bus-to-store forwarding.
 */
function createVerboseStoreHarness(): {
  writes: string[];
  store: EventStore;
  bus: EventEmitterWithWildcardSupport;
  detachBus: () => void;
} {
  const writes: string[] = [];
  process.stderr.write = ((
    chunk: unknown,
    encodingOrCallback?: unknown,
    maybeCallback?: unknown,
  ) => {
    writes.push(String(chunk));

    // `write` accepts both (chunk, callback) and (chunk, encoding, callback).
    // Pick whichever argument is the callback so the three-argument form
    // neither throws on the encoding string nor drops the real callback.
    const callback =
      typeof encodingOrCallback === "function"
        ? encodingOrCallback
        : maybeCallback;
    if (typeof callback === "function") {
      (callback as (error?: Error | null) => void)(null);
    }
    return true;
  }) as typeof process.stderr.write;

  const store = new EventStore("session-test");
  const bus = new EventEmitterWithWildcardSupport();
  const detachBus = attachEventStoreToBus(store, bus);

  return { writes, store, bus, detachBus };
}

// Exercises EventStore querying and the lines it writes to stderr. Tests that
// inspect stderr replace `process.stderr.write` through
// createVerboseStoreHarness; the afterEach hook restores it.
describe("flow logger event store", () => {
  const stderrWrite = process.stderr.write.bind(process.stderr);

  afterEach(() => {
    process.stderr.write = stderrWrite;
  });

  // Emits `event` on `bus` under its own event type.
  const publish = (bus: EventEmitterWithWildcardSupport, event: FlowEvent) =>
    bus.emit(event.eventType, event);

  // Yields to the timer queue once so pending bus-to-store work can finish.
  const flushBus = () => new Promise((resolve) => setTimeout(resolve, 0));

  // Puts an environment variable back to a previously captured value.
  const restoreEnv = (
    key: "FORCE_COLOR" | "NO_COLOR",
    previous: string | undefined,
  ): void => {
    if (previous === undefined) {
      delete process.env[key];
    } else {
      process.env[key] = previous;
    }
  };

  it("queries recent events from the default in-memory sink", async () => {
    const store = new EventStore("session-test");
    const extractEvent = new FlowEvent({
      eventType: "StagehandExtractEvent",
      sessionId: "session-test",
      eventId: "stagehand-1234",
      eventCreatedAt: "2026-03-16T21:45:00.000Z",
      data: { params: ["grab title"] },
    });

    await store.emit(extractEvent);

    const events = await store.query({});
    expect(events).toHaveLength(1);
    expect(events[0].eventType).toBe("StagehandExtractEvent");

    await store.destroy();
  });

  it("drops payloads from the default in-memory sink", async () => {
    const store = new EventStore("session-test");
    const llmEvent = new FlowEvent({
      eventType: "LlmRequestEvent",
      sessionId: "session-test",
      eventId: "llm-1234",
      eventCreatedAt: "2026-03-16T21:45:00.000Z",
      data: {
        prompt: [{ type: "image_url", image_url: { url: "huge" } }],
        output: "huge",
      },
    });

    await store.emit(llmEvent);

    const [event] = await store.query({});
    expect(event.eventType).toBe("LlmRequestEvent");
    expect(event.eventId).toBe("llm-1234");
    expect(event.data).toEqual({});

    await store.destroy();
  });

  it("renders semantic hierarchy tags for non-cdp stderr events only", async () => {
    // Intercept stderr so the pretty sink can be asserted without polluting the
    // real test runner output.
    const { writes, store, bus, detachBus } = createVerboseStoreHarness();

    const stepEvent = new FlowEvent({
      eventType: "StagehandExtractEvent",
      sessionId: "session-test",
      eventId: "stagehand-1234",
      eventCreatedAt: "2026-03-16T21:45:00.000Z",
      data: { params: ["grab title"] },
    });
    const cdpEvent = new FlowEvent({
      eventType: "CdpCallEvent",
      sessionId: "session-test",
      eventId: "cdp-call-5678",
      eventCreatedAt: "2026-03-16T21:45:00.100Z",
      eventParentIds: [stepEvent.eventId],
      data: {
        method: "Runtime.evaluate",
        params: { expression: "2 + 2" },
        targetId: "1234567890ABCDEF1234567890ABCDEF",
      },
    });

    // The stderr sink intentionally suppresses CDP noise even though the event
    // still exists for in-memory and file-backed sinks.
    publish(bus, stepEvent);
    publish(bus, cdpEvent);
    await flushBus();

    expect(writes).toHaveLength(1);
    const [onlyLine] = writes;
    expect(onlyLine).toContain("[🆂 #1234 EXTRACT]");
    expect(onlyLine).toContain("Stagehand.extract");
    expect(onlyLine).not.toContain("Runtime.evaluate");

    detachBus();
    await store.destroy();
  });

  it("renders generic stagehand events without crashing the stderr sink", async () => {
    const { writes, store, bus, detachBus } = createVerboseStoreHarness();

    // `StagehandEvent` has no action suffix, so this guards the formatter path
    // that cannot assume a method name exists.
    const genericEvent = new FlowEvent({
      eventType: "StagehandEvent",
      sessionId: "session-test",
      eventId: "stagehand-0001",
      eventCreatedAt: "2026-03-16T21:45:00.000Z",
      data: { params: ["noop"] },
    });
    publish(bus, genericEvent);
    await flushBus();

    expect(writes).toHaveLength(1);
    const [onlyLine] = writes;
    expect(onlyLine).toContain("[🆂 #0001");
    expect(onlyLine).toContain("Stagehand(");

    detachBus();
    await store.destroy();
  });

  it("colorizes pretty stderr output with ansi escapes when enabled", async () => {
    // Capture the colour-related environment first so it can be put back.
    const previousForceColor = process.env.FORCE_COLOR;
    const previousNoColor = process.env.NO_COLOR;
    delete process.env.NO_COLOR;
    process.env.FORCE_COLOR = "1";

    const { writes, store, bus, detachBus } = createVerboseStoreHarness();

    try {
      const actEvent = new FlowEvent({
        eventType: "StagehandActEvent",
        sessionId: "session-test",
        eventId: "stagehand-0002",
        eventCreatedAt: "2026-03-16T21:45:00.000Z",
        data: { params: ["click submit"] },
      });
      publish(bus, actEvent);
      await flushBus();

      expect(writes).toHaveLength(1);
      expect(writes[0]).toContain("\u001B[");
    } finally {
      restoreEnv("NO_COLOR", previousNoColor);
      restoreEnv("FORCE_COLOR", previousForceColor);

      detachBus();
      await store.destroy();
    }
  });

  it("keeps agent ancestry and start ids for completion events after many child events", async () => {
    const { writes, store, bus, detachBus } = createVerboseStoreHarness();

    const agentEvent = new FlowEvent({
      eventType: "AgentExecuteEvent",
      sessionId: "session-test",
      eventId: "agent-1234",
      eventCreatedAt: "2026-03-16T21:45:00.000Z",
      data: { params: [{ instruction: "click the button" }] },
    });
    const actEvent = new FlowEvent({
      eventType: "StagehandActEvent",
      sessionId: "session-test",
      eventId: "stagehand-2222",
      eventCreatedAt: "2026-03-16T21:45:00.001Z",
      eventParentIds: [agentEvent.eventId],
      data: { params: ["click the button"] },
    });
    const clickEvent = new FlowEvent({
      eventType: "UnderstudyClickEvent",
      sessionId: "session-test",
      eventId: "action-3333",
      eventCreatedAt: "2026-03-16T21:45:00.002Z",
      eventParentIds: [agentEvent.eventId, actEvent.eventId],
      data: { target: "xpath=/button[1]" },
    });

    // Parent chains for events nested at each level; a fresh array is built
    // on every call so no two events share one.
    const underAgent = () => [agentEvent.eventId];
    const underAct = () => [agentEvent.eventId, actEvent.eventId];
    const underClick = () => [
      agentEvent.eventId,
      actEvent.eventId,
      clickEvent.eventId,
    ];

    publish(bus, agentEvent);
    publish(bus, actEvent);
    publish(bus, clickEvent);

    // Flood the retained history with child events so the completion lines have
    // to recover their displayed ancestry from the queryable sink.
    for (let n = 0; n < 150; n++) {
      publish(
        bus,
        new FlowEvent({
          eventType: "CdpCallEvent",
          sessionId: "session-test",
          eventId: `cdp-${String(n).padStart(4, "0")}`,
          eventCreatedAt: `2026-03-16T21:45:00.${String(n + 10).padStart(3, "0")}Z`,
          eventParentIds: underClick(),
          data: {
            method: "Runtime.evaluate",
            params: { expression: `${n}` },
            targetId: "1234567890ABCDEF1234567890ABCDEF",
          },
        }),
      );
    }

    publish(
      bus,
      new FlowEvent({
        eventType: "UnderstudyClickCompletedEvent",
        sessionId: "session-test",
        eventId: "done-4444",
        eventCreatedAt: "2026-03-16T21:45:01.000Z",
        eventParentIds: underClick(),
        data: { durationMs: 250 },
      }),
    );
    publish(
      bus,
      new FlowEvent({
        eventType: "StagehandActCompletedEvent",
        sessionId: "session-test",
        eventId: "done-5555",
        eventCreatedAt: "2026-03-16T21:45:01.001Z",
        eventParentIds: underAct(),
        data: { durationMs: 500 },
      }),
    );
    publish(
      bus,
      new FlowEvent({
        eventType: "AgentExecuteCompletedEvent",
        sessionId: "session-test",
        eventId: "done-6666",
        eventCreatedAt: "2026-03-16T21:45:01.002Z",
        eventParentIds: underAgent(),
        data: { durationMs: 750 },
      }),
    );
    await flushBus();

    // Completion lines should reference the original started-event ids, not the
    // synthetic completed-event ids emitted at the end of the lifecycle.
    const lineContaining = (needle: string) =>
      writes.find((line) => line.includes(needle));

    const clickCompletedLine = lineContaining("CLICK completed");
    const actCompletedLine = lineContaining("ACT completed");
    const agentCompletedLine = lineContaining("Agent.execute() completed");

    expect(clickCompletedLine).toContain("[🅰 #1234]");
    expect(clickCompletedLine).toContain("[🆂 #2222 ACT]");
    expect(clickCompletedLine).toContain("[🆄 #3333 CLICK]");
    expect(clickCompletedLine).not.toContain("#4444");

    expect(actCompletedLine).toContain("[🅰 #1234]");
    expect(actCompletedLine).toContain("[🆂 #2222 ACT]");
    expect(actCompletedLine).not.toContain("#5555");

    expect(agentCompletedLine).toContain("[🅰 #1234]");
    expect(agentCompletedLine).not.toContain("#6666");

    detachBus();
    await store.destroy();
  });
});


================================================
FILE: packages/core/tests/unit/helpers/mockCDPSession.ts
================================================
import type { CDPSessionLike } from "../../../lib/v3/understudy/cdp.js";

/** Canned responder for one CDP method; may answer synchronously or with a promise. */
type Handler = (params?: Record<string, unknown>) => Promise<unknown> | unknown;

/**
 * Test double for a CDP session. It records every `send` call and answers
 * from a per-method handler table instead of talking to a browser.
 */
export class MockCDPSession implements CDPSessionLike {
  public readonly id: string;
  /** Every `send` invocation, in call order. */
  public readonly calls: Array<{
    method: string;
    params?: Record<string, unknown>;
  }> = [];

  /**
   * @param handlers - responders keyed by CDP method name; methods without an
   *   entry resolve to an empty object.
   * @param sessionId - value exposed as `id`.
   */
  constructor(
    private readonly handlers: Record<string, Handler> = {},
    sessionId = "mock-session",
  ) {
    this.id = sessionId;
  }

  /**
   * Records the call, then resolves with the matching handler's result, or
   * with `{}` when no handler is registered for `method`. Anything the
   * handler throws, or rejects with, becomes this promise's rejection.
   */
  async send<R = unknown>(
    method: string,
    params: Record<string, unknown> = {},
  ): Promise<R> {
    this.calls.push({ method, params });

    // Only own entries count as handlers. A plain `handlers[method]` lookup
    // would also find inherited members such as `toString` or `valueOf` and
    // invoke them as if they were registered responders.
    const registered = Object.prototype.hasOwnProperty.call(
      this.handlers,
      method,
    );
    const handler = registered ? this.handlers[method] : undefined;
    if (!handler) return {} as R;
    return (await handler(params)) as R;
  }

  // Event subscription and teardown are no-ops in this mock.
  on(): void {}
  off(): void {}
  async close(): Promise<void> {}

  /** Recorded calls for `method`, reduced to their `params`. */
  callsFor(method: string): Array<{ params?: Record<string, unknown> }> {
    return this.calls
      .filter((call) => call.method === method)
      .map(({ params }) => ({ params }));
  }
}


================================================
FILE: packages/core/tests/unit/llm-provider.test.ts
================================================
import { describe, expect, it } from "vitest";
import { getAISDKLanguageModel } from "../../lib/v3/llm/LLMProvider.js";

// Smoke tests: every supported clientOptions shape must yield a defined model.
describe("getAISDKLanguageModel", () => {
  type ClientOptionsArg = Parameters<typeof getAISDKLanguageModel>[2];

  // Resolves the ollama model used throughout with the given client options.
  const ollamaModel = (clientOptions: ClientOptionsArg) =>
    getAISDKLanguageModel("ollama", "llama3.2", clientOptions);

  describe("ollama provider", () => {
    it("works without clientOptions", () => {
      // Called directly so that no third argument is passed at all.
      expect(getAISDKLanguageModel("ollama", "llama3.2")).toBeDefined();
    });

    it("works with empty clientOptions", () => {
      expect(ollamaModel({})).toBeDefined();
    });

    it("works with clientOptions containing only undefined values", () => {
      expect(ollamaModel({ apiKey: undefined })).toBeDefined();
    });

    it("works with clientOptions containing only null values", () => {
      expect(ollamaModel({ apiKey: null as unknown as string })).toBeDefined();
    });

    it("works with custom baseURL", () => {
      expect(
        ollamaModel({ baseURL: "http://custom-ollama:11434" }),
      ).toBeDefined();
    });

    it("works even when apiKey is mistakenly provided", () => {
      // Ollama doesn't need an API key, but users might set one anyway
      expect(ollamaModel({ apiKey: "unnecessary-key" })).toBeDefined();
    });
  });

  describe("providers with API keys", () => {
    it("openai requires valid clientOptions for custom configuration", () => {
      // Without clientOptions, uses default provider
      expect(getAISDKLanguageModel("openai", "gpt-4o")).toBeDefined();

      // With valid apiKey, uses custom provider
      expect(
        getAISDKLanguageModel("openai", "gpt-4o", { apiKey: "test-key" }),
      ).toBeDefined();
    });
  });

  describe("hasValidOptions logic", () => {
    it("treats undefined apiKey as no options", () => {
      // This should use the default provider path (AISDKProviders)
      // not the custom provider path (AISDKProvidersWithAPIKey)
      expect(ollamaModel({ apiKey: undefined })).toBeDefined();
    });
  });
});


================================================
FILE: packages/core/tests/unit/model-deprecation.test.ts
================================================
import { describe, expect, it } from "vitest";
import { LLMProvider } from "../../lib/v3/llm/LLMProvider.js";
import {
  UnsupportedModelError,
  UnsupportedAISDKModelProviderError,
} from "../../lib/v3/types/public/sdkErrors.js";
import type { LogLine } from "../../lib/v3/types/public/logs.js";

// Shared client options carrying a placeholder API key. Every
// provider.getClient(...) call in this file passes this object.
const mockClientOptions = { apiKey: "test-api-key-for-testing" };

describe("Model format deprecation", () => {
  describe("UnsupportedModelError", () => {
    // Documentation link the error message is expected to embed.
    const MODELS_DOCS_URL =
      "https://docs.stagehand.dev/v3/configuration/models";

    it("includes guidance to use provider/model format for unknown model names", () => {
      const { message } = new UnsupportedModelError([
        "gpt-4o",
        "gemini-2.0-flash",
      ]);

      // Both the new format and the docs link have to be mentioned.
      expect(message).toContain("provider/model");
      expect(message).toContain(MODELS_DOCS_URL);
    });

    it("includes example of provider/model format", () => {
      const { message } = new UnsupportedModelError(["gpt-4o"]);

      // Concrete examples of the new format must appear in the text.
      for (const example of ["openai/gpt-4o", "anthropic/claude-sonnet-4"]) {
        expect(message).toContain(example);
      }
    });

    it("works with feature parameter", () => {
      const { message } = new UnsupportedModelError(["gpt-4o"], "extract");

      // The feature name is reported alongside the usual guidance.
      for (const fragment of ["extract", "provider/model", MODELS_DOCS_URL]) {
        expect(message).toContain(fragment);
      }
    });
  });

  describe("LLMProvider.getClient deprecation warning", () => {
    // Creates a provider whose logger appends every emitted line to `captured`.
    const createLoggedProvider = () => {
      const captured: LogLine[] = [];
      const provider = new LLMProvider((line: LogLine) => captured.push(line));
      return { captured, provider };
    };

    // True when a log message contains "deprecated" or "deprecation",
    // compared case-insensitively.
    const mentionsDeprecation = (entry: LogLine): boolean => {
      const text = entry.message.toLowerCase();
      return text.includes("deprecated") || text.includes("deprecation");
    };

    it("logs deprecation warning for legacy model names", () => {
      const { captured, provider } = createLoggedProvider();

      // A bare legacy name ("gpt-4o" rather than "openai/gpt-4o") must not
      // throw: it should yield a client and log a deprecation warning.
      expect(provider.getClient("gpt-4o", mockClientOptions)).toBeDefined();

      // The warning is expected at log level 0.
      const warning = captured.find(mentionsDeprecation);
      expect(warning).toBeDefined();
      expect(warning!.level).toBe(0);
    });

    it("deprecation warning mentions provider/model format", () => {
      const { captured, provider } = createLoggedProvider();

      provider.getClient("gpt-4o", mockClientOptions);

      const warning = captured.find(mentionsDeprecation);
      expect(warning).toBeDefined();

      // The text must name the new format and give a concrete example.
      const { message } = warning!;
      expect(message).toContain("provider/model");
      expect(message).toContain("openai/gpt-5");
    });

    it("returns OpenAIClient for legacy OpenAI model names", () => {
      const { provider } = createLoggedProvider();

      const resolved = provider.getClient("gpt-4o", mockClientOptions);

      expect(resolved).toBeDefined();
      // The concrete client class is identified by its constructor name.
      expect(resolved.constructor.name).toBe("OpenAIClient");
    });

    it("returns GoogleClient for legacy Google model names", () => {
      const { provider } = createLoggedProvider();

      const resolved = provider.getClient(
        "gemini-2.0-flash",
        mockClientOptions,
      );

      expect(resolved).toBeDefined();
      // The concrete client class is identified by its constructor name.
      expect(resolved.constructor.name).toBe("GoogleClient");
    });
  });

  describe("LLMProvider.getClient error handling", () => {
    it("throws UnsupportedModelError for unknown model without slash", () => {
      const logs: LogLine[] = [];
      const logger = (line: LogLine) => logs.push(line);
      const provider = new LLMProvider(logger);

      // Unknown model without slash should throw UnsupportedModelError
      expect(() => {
        provider.getClient("some-unknown-model", mockClientOptions);
      }).toThrow(UnsupportedModelError);
    });

    it("UnsupportedModelError includes provider/model format guidance", () => {
      const logs: LogLine[] = [];
      const logger = (line: LogLine) => logs.push(line);
      const provider = new LLMProvider(logger);

      // Capture the error and assert on it outside the try block. Asserting
      // only inside `catch` would let the test pass if nothing were thrown.
      let caughtError: unknown;
      try {
        provider.getClient("some-unknown-model", mockClientOptions);
      } catch (error) {
        caughtError = error;
      }

      expect(caughtError).toBeInstanceOf(UnsupportedModelError);
      expect((caughtError as Error).message).toContain("provider/model");
    });

    it("throws UnsupportedAISDKModelProviderError for invalid provider in provider/model format", () => {
      const logs: LogLine[] = [];
      const logger = (line: LogLine) => logs.push(line);
      const provider = new LLMProvider(logger);

      // Invalid provider but correct format
      expect(() => {
        provider.getClient("invalid-provider/some-model", mockClientOptions);
      }).toThrow(UnsupportedAISDKModelProviderError);
    });

    it("UnsupportedAISDKModelProviderError lists valid providers", () => {
      const logs: LogLine[] = [];
      const logger = (line: LogLine) => logs.push(line);
      const provider = new LLMProvider(logger);

      // Capture the error and assert on it outside the try block. Asserting
      // only inside `catch` would let the test pass if nothing were thrown.
      let caughtError: unknown;
      try {
        provider.getClient("invalid-provider/some-model", mockClientOptions);
      } catch (error) {
        caughtError = error;
      }

      expect(caughtError).toBeInstanceOf(UnsupportedAISDKModelProviderError);
      const message = (caughtError as Error).message;
      // Should list valid providers
      expect(message).toContain("openai");
      expect(message).toContain("anthropic");
      expect(message).toContain("google");
    });
  });

  describe("new provider/model format", () => {
    it("does not log deprecation warning for provider/model format", () => {
      const emitted: LogLine[] = [];
      const provider = new LLMProvider((line: LogLine) => emitted.push(line));

      // Fully-qualified "provider/model" name.
      expect(
        provider.getClient("openai/gpt-4o", mockClientOptions),
      ).toBeDefined();

      // No emitted line may mention deprecation in either spelling.
      const offendingLine = emitted.find((entry) => {
        const text = entry.message.toLowerCase();
        return text.includes("deprecated") || text.includes("deprecation");
      });
      expect(offendingLine).toBeUndefined();
    });
  });
});


================================================
FILE: packages/core/tests/unit/model-utils.test.ts
================================================
import { describe, expect, it } from "vitest";
import { extractModelName, resolveModel } from "../../lib/modelUtils.js";

describe("extractModelName", () => {
  it("returns undefined for undefined input", () => {
    const extracted = extractModelName(undefined);
    expect(extracted).toBeUndefined();
  });

  it("returns the string as-is for a string input", () => {
    const extracted = extractModelName("openai/gpt-4o");
    expect(extracted).toBe("openai/gpt-4o");
  });

  it("returns modelName from an object input", () => {
    const extracted = extractModelName({
      modelName: "anthropic/claude-sonnet-4-20250514",
    });
    expect(extracted).toBe("anthropic/claude-sonnet-4-20250514");
  });

  it("returns modelName from an object with extra properties", () => {
    // Fields other than modelName must not affect the extracted name.
    const extracted = extractModelName({
      modelName: "openai/gpt-4o-mini",
      apiKey: "sk-test",
      baseURL: "https://custom.endpoint",
    });
    expect(extracted).toBe("openai/gpt-4o-mini");
  });
});

describe("resolveModel", () => {
  it("extracts provider and modelName from a string", () => {
    const { provider, modelName, clientOptions } =
      resolveModel("openai/gpt-4o");

    expect(provider).toBe("openai");
    expect(modelName).toBe("gpt-4o");
    expect(clientOptions).toEqual({});
  });

  it("extracts clientOptions from an object config", () => {
    const { provider, modelName, clientOptions } = resolveModel({
      modelName: "openai/gpt-4o" as never,
      apiKey: "sk-test",
    });

    expect(provider).toBe("openai");
    expect(modelName).toBe("gpt-4o");
    expect(clientOptions).toMatchObject({ apiKey: "sk-test" });
    // The model name itself must not be copied into the client options.
    expect(clientOptions).not.toHaveProperty("modelName");
  });
});


================================================
FILE: packages/core/tests/unit/openai-cua-client.test.ts
================================================
import { describe, expect, it, vi } from "vitest";
import { OpenAICUAClient } from "../../lib/v3/agent/OpenAICUAClient.js";

/**
 * Builds the OpenAICUAClient used by every test in this file: "openai" type,
 * a fixed computer-use preview model, `undefined` as the third constructor
 * argument, and a placeholder API key.
 */
function createClient() {
  const modelName = "computer-use-preview-2025-03-11";
  const clientOptions = { apiKey: "test-key" };

  return new OpenAICUAClient("openai", modelName, undefined, clientOptions);
}

describe("OpenAICUAClient", () => {
  it("exposes captchaSolvedProceed tool after a captcha context note", () => {
    const client = createClient();
    // Reads the captchaSolvedToolActive flag through a structural cast.
    const isCaptchaToolActive = () =>
      (client as unknown as { captchaSolvedToolActive: boolean })
        .captchaSolvedToolActive;

    // No captcha note has been added yet, so the tool starts inactive.
    expect(isCaptchaToolActive()).toBe(false);

    // Mimic the CUA handler adding a captcha context note.
    client.addContextNote(
      "A captcha was automatically detected and solved — no further interaction needed.",
    );

    expect(isCaptchaToolActive()).toBe(true);
  });

  it("does NOT activate captcha tool for non-captcha context notes", () => {
    const client = createClient();
    const internals = client as unknown as {
      captchaSolvedToolActive: boolean;
    };

    // A note with no captcha wording must leave the flag untouched.
    client.addContextNote("The page has finished loading.");

    expect(internals.captchaSolvedToolActive).toBe(false);
  });

  it("deactivates captcha tool after takeAction handles the function call", async () => {
    // Structural view of the client members this test reaches into.
    type ClientInternals = {
      captchaSolvedToolActive: boolean;
      takeAction: (
        output: unknown[],
        logger: (msg: unknown) => void,
      ) => Promise<unknown[]>;
    };

    const client = createClient();
    const internals = client as unknown as ClientInternals;

    client.addContextNote("A captcha was solved.");
    expect(internals.captchaSolvedToolActive).toBe(true);

    // Stand in for the model calling the captchaSolvedProceed tool.
    const proceedCall = {
      type: "function_call",
      name: "captchaSolvedProceed",
      call_id: "call-1",
      arguments: "{}",
    };
    const outputs = await internals.takeAction([proceedCall], vi.fn());

    // Handling the call must switch the tool back off.
    expect(internals.captchaSolvedToolActive).toBe(false);

    // The only output is a function_call_output confirming that work continues.
    expect(outputs).toEqual([
      {
        type: "function_call_output",
        call_id: "call-1",
        output: expect.stringContaining("Continue completing"),
      },
    ]);
  });

  it("does NOT auto-continue follow-up questions without a captcha context", async () => {
    // Shape of the value the stubbed executeStep resolves with.
    type StepOutcome = {
      actions: Array<{ type: string }>;
      message: string;
      completed: boolean;
      nextInputItems: unknown[];
      responseId: string;
      usage: {
        input_tokens: number;
        output_tokens: number;
        inference_time_ms: number;
      };
    };

    // Structural view exposing executeStep so it can be spied on.
    type ExecuteStepHost = {
      executeStep: (
        inputItems: unknown[],
        previousResponseId: string | undefined,
        logger: (message: { message: string }) => void,
      ) => Promise<StepOutcome>;
    };

    // No captcha context note is added, so no tool should be exposed.
    const client = createClient();
    const stepSpy = vi.spyOn(
      client as unknown as ExecuteStepHost,
      "executeStep",
    );

    // The first (and only stubbed) step ends with a follow-up question.
    const followUpStep: StepOutcome = {
      actions: [],
      message:
        "I've located the Submit button. Should I go ahead and submit it?",
      completed: true,
      nextInputItems: [],
      responseId: "response-1",
      usage: { input_tokens: 1, output_tokens: 1, inference_time_ms: 1 },
    };
    stepSpy.mockResolvedValueOnce(followUpStep);

    const outcome = await client.execute({
      options: { instruction: "Submit the form.", maxSteps: 10 } as never,
      logger: vi.fn(),
    });

    // The follow-up question counts as completion: exactly one step ran.
    expect(stepSpy).toHaveBeenCalledTimes(1);
    expect(outcome.completed).toBe(true);
  });
});


================================================
FILE: packages/core/tests/unit/page-extra-http-headers.test.ts
================================================
import { describe, expect, it } from "vitest";
import { Page } from "../../lib/v3/understudy/page.js";
import { MockCDPSession } from "./helpers/mockCDPSession.js";
import { StagehandSetExtraHTTPHeadersError } from "../../lib/v3/types/public/sdkErrors.js";

// Structural stand-in for a Page, used as `this` when invoking Page.prototype
// methods in these tests (presumably the members setExtraHTTPHeaders touches;
// verify against page.ts).
type PageStub = {
  // Session that makePage falls back to creating when no sessions are given.
  mainSession: MockCDPSession;
  // Sessions keyed by their id.
  sessions: Map<string, MockCDPSession>;
  // Header map; tests read it back to replay headers onto a later session.
  extraHTTPHeaders: Record<string, string>;
  // Helper borrowed from Page.prototype; applies headers to one session.
  applyExtraHTTPHeadersToSession: (
    session: MockCDPSession,
    headers: Record<string, string>,
  ) => Promise<void>;
};

/**
 * Builds a PageStub around the given sessions.
 *
 * The first session becomes `mainSession`; when the list is empty a fresh
 * mock with id "main" is used instead (and is NOT added to the sessions map).
 */
const makePage = (sessions: MockCDPSession[]): PageStub => {
  const mainSession = sessions[0] ?? new MockCDPSession({}, "main");

  const sessionsById = new Map<string, MockCDPSession>();
  for (const session of sessions) {
    sessionsById.set(session.id, session);
  }

  // Borrow the private helper from Page.prototype so setExtraHTTPHeaders can
  // call it on the stub.
  const { applyExtraHTTPHeadersToSession } =
    Page.prototype as unknown as PageStub;

  return {
    mainSession,
    sessions: sessionsById,
    extraHTTPHeaders: {},
    applyExtraHTTPHeadersToSession,
  };
};

describe("Page.setExtraHTTPHeaders", () => {
  // Page.prototype.setExtraHTTPHeaders re-typed so it can be invoked through
  // `.call` with a PageStub as `this` instead of a real Page instance.
  const setExtraHTTPHeaders = Page.prototype.setExtraHTTPHeaders as (
    this: PageStub,
    headers: Record<string, string>,
  ) => Promise<void>;

  it("sends headers to all sessions owned by the page", async () => {
    const ownedSessions = [
      new MockCDPSession({}, "session-a"),
      new MockCDPSession({}, "session-b"),
    ];
    const page = makePage(ownedSessions);

    await setExtraHTTPHeaders.call(page, { "x-stagehand-test": "hello" });

    // Each session gets one Network.enable and the header payload.
    ownedSessions.forEach((session) => {
      expect(session.callsFor("Network.enable").length).toBe(1);

      const firstHeaderCall = session.callsFor(
        "Network.setExtraHTTPHeaders",
      )[0];
      expect(firstHeaderCall?.params).toEqual({
        headers: { "x-stagehand-test": "hello" },
      });
    });
  });

  it("applies headers to mainSession even when sessions map is empty", async () => {
    // With no sessions given, makePage creates a main session that is absent
    // from the sessions map.
    const page = makePage([]);
    const { mainSession } = page;

    await setExtraHTTPHeaders.call(page, { "x-test": "value" });

    // The main session must still be enabled and receive the headers.
    expect(mainSession.callsFor("Network.enable").length).toBe(1);

    const firstHeaderCall = mainSession.callsFor(
      "Network.setExtraHTTPHeaders",
    )[0];
    expect(firstHeaderCall?.params).toEqual({
      headers: { "x-test": "value" },
    });
  });

  it("throws StagehandSetExtraHTTPHeadersError with session failure details", async () => {
    // session-a throws on the header command; session-b has no overrides.
    const failingSession = new MockCDPSession(
      {
        "Network.setExtraHTTPHeaders": () => {
          throw new Error("connection closed");
        },
      },
      "session-a",
    );
    const healthySession = new MockCDPSession({}, "session-b");
    const page = makePage([failingSession, healthySession]);

    // Capture the error so the assertions run even if nothing is thrown.
    let thrown: StagehandSetExtraHTTPHeadersError | undefined;
    try {
      await setExtraHTTPHeaders.call(page, { "x-stagehand-test": "yes" });
    } catch (err) {
      thrown = err as StagehandSetExtraHTTPHeadersError;
    }

    expect(thrown).toBeInstanceOf(StagehandSetExtraHTTPHeadersError);
    expect(thrown?.failures).toHaveLength(1);

    // The single failure names the session and carries the underlying message.
    const firstFailure = thrown?.failures[0];
    expect(firstFailure).toContain("session=session-a");
    expect(firstFailure).toContain("connection closed");

    // One failing session must not prevent the other from being updated.
    expect(healthySession.callsFor("Network.setExtraHTTPHeaders").length).toBe(
      1,
    );
  });

  it("applies headers to sessions adopted after the call", async () => {
    const page = makePage([new MockCDPSession({}, "session-a")]);

    await setExtraHTTPHeaders.call(page, { "x-before": "yes" });

    // Register a second session only after the headers were set.
    const lateSession = new MockCDPSession({}, "session-b");
    page.sessions.set(lateSession.id, lateSession);

    // Mirror what adoptOopifSession does: replay the stored headers onto the
    // newly adopted session.
    await page.applyExtraHTTPHeadersToSession.call(
      page,
      lateSession,
      page.extraHTTPHeaders,
    );

    // The late session must be enabled and carry the earlier headers.
    expect(lateSession.callsFor("Network.enable").length).toBe(1);

    const firstHeaderCall = lateSession.callsFor(
      "Network.setExtraHTTPHeaders",
    )[0];
    expect(firstHeaderCall?.params).toEqual({
      headers: { "x-before": "yes" },
    });
  });

  it("does not mutate the original headers object", async () => {
    const page = makePage([new MockCDPSession({}, "session-a")]);

    const original = { "x-custom": "value" };
    // Shallow copy taken up front, compared against after the call.
    const snapshotBefore = { ...original };

    await setExtraHTTPHeaders.call(page, original);

    expect(original).toEqual(snapshotBefore);
  });
});


================================================
FILE: packages/core/tests/unit/page-snapshot.test.ts
================================================
import { afterEach, describe, expect, it, vi } from "vitest";
import { promises as fs } from "fs";
import { Page } from "../../lib/v3/understudy/page.js";
import * as snapshotModule from "../../lib/v3/understudy/a11y/snapshot/index.js";
import type { HybridSnapshot } from "../../lib/v3/types/private/index.js";

// Minimal HybridSnapshot fixture: a placeholder tree string with empty maps
// and no per-frame entries. Used as the resolved value of the mocked
// captureHybridSnapshot.
const baseSnapshot: HybridSnapshot = {
  combinedTree: "tree",
  combinedXpathMap: {},
  combinedUrlMap: {},
  perFrame: [],
};

describe("Page.snapshot", () => {
  afterEach(() => {
    vi.restoreAllMocks();
  });

  // Stubs fs.writeFile and captureHybridSnapshot, then returns the capture
  // spy so a test can inspect the arguments it was called with.
  const stubSnapshotDependencies = () => {
    vi.spyOn(fs, "writeFile").mockResolvedValue();
    return vi
      .spyOn(snapshotModule, "captureHybridSnapshot")
      .mockResolvedValue(baseSnapshot);
  };

  it("forwards the includeIframes flag to captureHybridSnapshot", async () => {
    const captureSpy = stubSnapshotDependencies();
    const pageStandIn = {} as Page;

    await Page.prototype.snapshot.call(pageStandIn, { includeIframes: false });

    // The explicit flag is passed through alongside pierceShadow: true.
    expect(captureSpy).toHaveBeenCalledWith(pageStandIn, {
      pierceShadow: true,
      includeIframes: false,
    });
  });

  it("falls back to default iframe inclusion when option is omitted", async () => {
    const captureSpy = stubSnapshotDependencies();
    const pageStandIn = {} as Page;

    await Page.prototype.snapshot.call(pageStandIn);

    // With no options the flag is forwarded as undefined.
    expect(captureSpy).toHaveBeenCalledWith(pageStandIn, {
      pierceShadow: true,
      includeIframes: undefined,
    });
  });
});


================================================
FILE: packages/core/tests/unit/public-api/export-surface.test.ts
================================================
import { describe, expect, it } from "vitest";
import StagehandDefaultExport, * as Stagehand from "@browserbasehq/stagehand";
import { publicErrorTypes } from "./public-error-types.test.js";

// Type matcher guidelines:
//
// toEqualTypeOf – Default. Assert full, deep type equality; any type change should fail.
//   e.g. expectTypeOf<ReturnType<typeof foo>>().toEqualTypeOf<FooResult>()
//
// toMatchObjectType – Assert (part of) an object's shape while allowing extra fields.
//   e.g. expectTypeOf(user).toMatchObjectType<{ id: string; email: string }>()
//
// toExtend – Assert that a type is compatible with a broader contract (assignable/extends).
//   e.g. expectTypeOf<User>().toExtend<BaseUser>()

// Expected set of runtime exports of "@browserbasehq/stagehand": each key is
// mapped to the corresponding export, plus the default export and every entry
// of publicErrorTypes. The tests below compare the keys of this object with
// the module's actual keys, so adding or removing a public export requires
// updating this list.
const publicApiShape = {
  __internalMaybeRunShutdownSupervisorFromArgv:
    Stagehand.__internalMaybeRunShutdownSupervisorFromArgv,
  __internalCreateInMemoryAgentCacheHandle:
    Stagehand.__internalCreateInMemoryAgentCacheHandle,
  AISdkClient: Stagehand.AISdkClient,
  Api: Stagehand.Api,
  AVAILABLE_CUA_MODELS: Stagehand.AVAILABLE_CUA_MODELS,
  AgentProvider: Stagehand.AgentProvider,
  AnnotatedScreenshotText: Stagehand.AnnotatedScreenshotText,
  ConsoleMessage: Stagehand.ConsoleMessage,
  CustomOpenAIClient: Stagehand.CustomOpenAIClient,
  LLMClient: Stagehand.LLMClient,
  LOG_LEVEL_NAMES: Stagehand.LOG_LEVEL_NAMES,
  Response: Stagehand.Response,
  Stagehand: Stagehand.Stagehand,
  V3: Stagehand.V3,
  V3Evaluator: Stagehand.V3Evaluator,
  V3FunctionName: Stagehand.V3FunctionName,
  connectToMCPServer: Stagehand.connectToMCPServer,
  default: StagehandDefaultExport,
  defaultExtractSchema: Stagehand.defaultExtractSchema,
  getAISDKLanguageModel: Stagehand.getAISDKLanguageModel,
  getZodType: Stagehand.getZodType,
  injectUrls: Stagehand.injectUrls,
  isRunningInBun: Stagehand.isRunningInBun,
  isZod3Schema: Stagehand.isZod3Schema,
  isZod4Schema: Stagehand.isZod4Schema,
  jsonSchemaToZod: Stagehand.jsonSchemaToZod,
  loadApiKeyFromEnv: Stagehand.loadApiKeyFromEnv,
  localBrowserLaunchOptionsSchema: Stagehand.localBrowserLaunchOptionsSchema,
  modelToAgentProviderMap: Stagehand.modelToAgentProviderMap,
  pageTextSchema: Stagehand.pageTextSchema,
  providerEnvVarMap: Stagehand.providerEnvVarMap,
  toGeminiSchema: Stagehand.toGeminiSchema,
  toJsonSchema: Stagehand.toJsonSchema,
  tool: Stagehand.tool,
  transformSchema: Stagehand.transformSchema,
  trimTrailingTextNode: Stagehand.trimTrailingTextNode,
  validateZodSchema: Stagehand.validateZodSchema,
  ...publicErrorTypes,
} as const;

// Type of the module namespace with the default export added under the
// `default` key, so it can be indexed by the keys of publicApiShape.
type StagehandExports = typeof Stagehand & {
  default: typeof StagehandDefaultExport;
};

// For every key listed in publicApiShape, the type the module actually
// exports under that key. Indexing StagehandExports with a key it lacks is a
// compile error, which flags stale entries in publicApiShape.
type PublicAPI = {
  [K in keyof typeof publicApiShape]: StagehandExports[K];
};

describe("Stagehand public API export surface", () => {
  // Own enumerable keys of `value`, sorted.
  const sortedKeys = (value: object): string[] => Object.keys(value).sort();

  it("public API shape matches module exports", () => {
    // Compile-time check only: the assignment fails to type-check when
    // publicApiShape and the module's export types diverge.
    const _assignable: PublicAPI = publicApiShape;
    void _assignable;
  });

  it("does not expose unexpected top-level exports", () => {
    const expectedKeys = sortedKeys(publicApiShape);
    const actualKeys = sortedKeys(Stagehand);

    expect(actualKeys).toStrictEqual(expectedKeys);
  });

  it("default export mirrors the named export surface", () => {
    // Every named export except `default` itself must appear on the default export.
    const namedExportKeys = Object.keys(Stagehand)
      .filter((key) => key !== "default")
      .sort();

    expect(sortedKeys(StagehandDefaultExport)).toStrictEqual(namedExportKeys);
  });
});


================================================
FILE: packages/core/tests/unit/public-api/llm-and-agents.test.ts
================================================
import { describe, expect, expectTypeOf, it } from "vitest";
import * as Stagehand from "@browserbasehq/stagehand";

describe("LLM and Agents public API types", () => {
  describe("ModelConfiguration", () => {
    it("accepts Vertex headers in model config", () => {
      // Compile-time check only: the literal must satisfy ModelConfiguration,
      // including the project, location and headers fields.
      void ({
        modelName: "google/gemini-3-flash-preview",
        project: "test-project",
        location: "global",
        headers: {
          "X-Goog-Priority": "high",
        },
      } satisfies Stagehand.ModelConfiguration);
    });
  });

  describe("AISdkClient", () => {
    type ClientInstance = InstanceType<typeof Stagehand.AISdkClient>;
    type ClientCtorArgs = ConstructorParameters<typeof Stagehand.AISdkClient>;

    it("is exported", () => {
      expect(Stagehand.AISdkClient).toBeDefined();
    });

    it("extends LLMClient", () => {
      expectTypeOf<ClientInstance>().toExtend<Stagehand.LLMClient>();
    });

    it("constructor accepts model parameter", () => {
      // The constructor takes exactly one argument ({ model: LanguageModelV2 }),
      // so its parameter tuple has length 1.
      expectTypeOf<ClientCtorArgs["length"]>().toEqualTypeOf<1>();
    });
  });

  describe("AVAILABLE_CUA_MODELS", () => {
    // Literal model ids the AvailableCuaModel union is expected to consist of.
    const knownCuaModels = [
      "openai/computer-use-preview",
      "openai/computer-use-preview-2025-03-11",
      "anthropic/claude-opus-4-5-20251101",
      "anthropic/claude-opus-4-6",
      "anthropic/claude-sonnet-4-6",
      "anthropic/claude-haiku-4-5-20251001",
      "anthropic/claude-sonnet-4-20250514",
      "anthropic/claude-sonnet-4-5-20250929",
      "google/gemini-2.5-computer-use-preview-10-2025",
      "google/gemini-3-flash-preview",
      "google/gemini-3-pro-preview",
      "microsoft/fara-7b",
    ] as const;

    type KnownCuaModel = (typeof knownCuaModels)[number];

    it("AvailableCuaModel matches the known literals", () => {
      expectTypeOf<Stagehand.AvailableCuaModel>().toEqualTypeOf<KnownCuaModel>();
      void knownCuaModels; // Mark as used to satisfy ESLint
    });
  });

  describe("AgentProvider", () => {
    type ProviderInstance = InstanceType<typeof Stagehand.AgentProvider>;
    type ProviderCtorArgs = ConstructorParameters<
      typeof Stagehand.AgentProvider
    >;
    type LoggerFn = (message: Stagehand.LogLine) => void;

    it("is exported", () => {
      expect(Stagehand.AgentProvider).toBeDefined();
    });

    it("has getClient method", () => {
      // getClient must be callable with just a model name string.
      expectTypeOf<ProviderInstance["getClient"]>().toBeCallableWith(
        "test-model",
      );
    });

    it("constructor accepts logger parameter", () => {
      // The constructor's parameter tuple is exactly one logger function.
      expectTypeOf<ProviderCtorArgs>().toEqualTypeOf<[LoggerFn]>();
    });
  });

  describe("AnnotatedScreenshotText", () => {
    it("is a string literal", () => {
      // Checks that the exported value's type is assignable to `string`.
      expectTypeOf<typeof Stagehand.AnnotatedScreenshotText>().toExtend<string>();
    });
  });

  describe("ConsoleMessage", () => {
    // Accessor methods a ConsoleMessage instance is required to provide.
    type ConsoleMessageContract = {
      type: () => string;
      text: () => string;
      args: () => unknown[];
      location: () => {
        url?: string;
        lineNumber?: number;
        columnNumber?: number;
      };
      page: () => unknown;
      timestamp: () => number | undefined;
      raw: () => unknown;
      toString: () => string;
    };

    type MessageInstance = InstanceType<typeof Stagehand.ConsoleMessage>;

    it("has correct public interface shape", () => {
      expectTypeOf<MessageInstance>().toExtend<ConsoleMessageContract>();
    });
  });

  describe("AgentClient", () => {
    // Type of whatever AgentProvider#getClient returns.
    type ReturnedClient = ReturnType<
      InstanceType<typeof Stagehand.AgentProvider>["getClient"]
    >;

    // Methods the returned client is required to provide.
    type AgentClientContract = {
      execute: (
        options: Stagehand.AgentExecutionOptions,
      ) => Promise<Stagehand.AgentResult>;
      captureScreenshot: (
        options?: Record<string, unknown>,
      ) => Promise<unknown>;
      setViewport: (width: number, height: number) => void;
      setCurrentUrl: (url: string) => void;
      setScreenshotProvider: (provider: () => Promise<string>) => void;
      setActionHandler: (
        handler: (action: Stagehand.AgentAction) => Promise<void>,
      ) => void;
    };

    it("getClient returns object with expected methods", () => {
      expectTypeOf<ReturnedClient>().toExtend<AgentClientContract>();
    });
  });

  // Type-level contract for the exported LLMClient class: instance fields,
  // constructor parameters, and the call shapes createChatCompletion accepts.
  describe("LLMClient", () => {
    // Fields an LLMClient instance must be assignable to.
    type ExpectedShape = {
      type: "openai" | "anthropic" | "cerebras" | "groq" | (string & {});
      modelName: Stagehand.AvailableModel | (string & {});
      hasVision: boolean;
      clientOptions: Stagehand.ClientOptions;
      userProvidedInstructions?: string;
    };

    // Constructor parameter tuple: a model name plus an optional string.
    type ExpectedCtorParams = [Stagehand.AvailableModel, string?];

    // Smallest createChatCompletion argument: messages, a logger, and an
    // optional retry count.
    type ExpectedBasicOptions = {
      options: {
        messages: Array<{
          role: "system" | "user" | "assistant";
          content: string | Array<unknown>;
        }>;
      };
      logger: (message: unknown) => void;
      retries?: number;
    };

    // Basic options extended with a named response_model schema.
    type ExpectedWithResponseModel = ExpectedBasicOptions & {
      options: ExpectedBasicOptions["options"] & {
        response_model: {
          name: string;
          schema: Stagehand.StagehandZodSchema;
        };
      };
    };

    type LLMClientInstance = InstanceType<typeof Stagehand.LLMClient>;

    it("has correct public interface shape", () => {
      expectTypeOf<LLMClientInstance>().toExtend<ExpectedShape>();
    });

    it("constructor parameters match expected signature", () => {
      expectTypeOf<
        ConstructorParameters<typeof Stagehand.LLMClient>
      >().toEqualTypeOf<ExpectedCtorParams>();
    });

    it("createChatCompletion can be called with basic options", () => {
      expectTypeOf<
        LLMClientInstance["createChatCompletion"]
      >().toBeCallableWith({
        options: {
          messages: [
            {
              role: "user",
              content: "Hello",
            },
          ],
        },
        logger: () => {},
      } satisfies ExpectedBasicOptions);
    });

    it("createChatCompletion can be called with response_model", () => {
      // Empty object cast to the schema type; only its type matters here.
      const mockSchema = {} as Stagehand.StagehandZodSchema;
      expectTypeOf<
        LLMClientInstance["createChatCompletion"]
      >().toBeCallableWith({
        options: {
          messages: [
            {
              role: "user",
              content: "Extract data",
            },
          ],
          response_model: {
            name: "extracted",
            schema: mockSchema,
          },
        },
        logger: () => {},
      } satisfies ExpectedWithResponseModel);
    });

    it("createChatCompletion supports generic return type", () => {
      // The method must be assignable to a signature returning a caller-chosen
      // result type.
      type Result = { custom: string };
      type ExpectedSignature = (
        options: Stagehand.CreateChatCompletionOptions,
      ) => Promise<Result>;

      expectTypeOf<
        LLMClientInstance["createChatCompletion"]
      >().toExtend<ExpectedSignature>();
    });

    it("has additional methods", () => {
      // These methods exist on LLMClient but have complex signatures from the 'ai' library
      // We verify they exist by checking they're functions
      expectTypeOf<LLMClientInstance["generateText"]>().toExtend<
        (...args: unknown[]) => unknown
      >();
      expectTypeOf<LLMClientInstance["generateObject"]>().toExtend<
        (...args: unknown[]) => unknown
      >();
      expectTypeOf<LLMClientInstance["streamText"]>().toExtend<
        (...args: unknown[]) => unknown
      >();
      expectTypeOf<LLMClientInstance["streamObject"]>().toExtend<
        (...args: unknown[]) => unknown
      >();
      expectTypeOf<LLMClientInstance["generateImage"]>().toExtend<
        (...args: unknown[]) => unknown
      >();
      expectTypeOf<LLMClientInstance["embed"]>().toExtend<
        (...args: unknown[]) => unknown
      >();
      expectTypeOf<LLMClientInstance["embedMany"]>().toExtend<
        (...args: unknown[]) => unknown
      >();
      expectTypeOf<LLMClientInstance["transcribe"]>().toExtend<
        (...args: unknown[]) => unknown
      >();
      expectTypeOf<LLMClientInstance["generateSpeech"]>().toExtend<
        (...args: unknown[]) => unknown
      >();
    });
  });

  describe("modelToAgentProviderMap", () => {
    it("only stores valid provider types", () => {
      // Every value in the map must be an AgentProviderType.
      type ProviderByModel = Record<string, Stagehand.AgentProviderType>;

      expectTypeOf<
        typeof Stagehand.modelToAgentProviderMap
      >().toExtend<ProviderByModel>();
    });
  });

  describe("Response", () => {
    // Methods a Response instance is required to provide.
    type ResponseContract = {
      url: () => string;
      status: () => number;
      statusText: () => string;
      ok: () => boolean;
      frame: () => unknown;
      fromServiceWorker: () => boolean;
      securityDetails: () => Promise<unknown>;
      serverAddr: () => Promise<unknown>;
      headers: () => Record<string, string>;
      allHeaders: () => Promise<Record<string, string>>;
      headerValue: (name: string) => Promise<string | null>;
      headerValues: (name: string) => Promise<string[]>;
      headersArray: () => Promise<Array<{ name: string; value: string }>>;
      body: () => Promise<Buffer>;
      text: () => Promise<string>;
      json: <T = unknown>() => Promise<T>;
      finished: () => Promise<null | Error>;
      markFinished: (error: Error | null) => void;
      applyExtraInfo: (info: unknown) => void;
    };

    type ExportedResponse = InstanceType<typeof Stagehand.Response>;

    it("has correct public interface shape", () => {
      expectTypeOf<ExportedResponse>().toExtend<ResponseContract>();
    });
  });
});


================================================
FILE: packages/core/tests/unit/public-api/public-error-types.test.ts
================================================
import { describe, expectTypeOf, it } from "vitest";
import * as Stagehand from "@browserbasehq/stagehand";

/**
 * Manifest of the error classes this test file reads from the
 * `@browserbasehq/stagehand` entry point, keyed by export name.
 *
 * The keys of this object are what the parameterised test in this file
 * iterates over, so an error class only gets checked once it is listed here.
 * `as const` keeps the keys as literal types so they can be used to index the
 * `Stagehand` namespace import.
 */
export const publicErrorTypes = {
  AgentAbortError: Stagehand.AgentAbortError,
  CdpConnectionClosedError: Stagehand.CdpConnectionClosedError,
  AgentScreenshotProviderError: Stagehand.AgentScreenshotProviderError,
  BrowserbaseSessionNotFoundError: Stagehand.BrowserbaseSessionNotFoundError,
  CaptchaTimeoutError: Stagehand.CaptchaTimeoutError,
  ConnectionTimeoutError: Stagehand.ConnectionTimeoutError,
  ContentFrameNotFoundError: Stagehand.ContentFrameNotFoundError,
  CookieSetError: Stagehand.CookieSetError,
  CookieValidationError: Stagehand.CookieValidationError,
  CreateChatCompletionResponseError:
    Stagehand.CreateChatCompletionResponseError,
  CuaModelRequiredError: Stagehand.CuaModelRequiredError,
  ElementNotVisibleError: Stagehand.ElementNotVisibleError,
  ExperimentalApiConflictError: Stagehand.ExperimentalApiConflictError,
  ExperimentalNotConfiguredError: Stagehand.ExperimentalNotConfiguredError,
  HandlerNotInitializedError: Stagehand.HandlerNotInitializedError,
  InvalidAISDKModelFormatError: Stagehand.InvalidAISDKModelFormatError,
  LLMResponseError: Stagehand.LLMResponseError,
  MCPConnectionError: Stagehand.MCPConnectionError,
  MissingEnvironmentVariableError: Stagehand.MissingEnvironmentVariableError,
  MissingLLMConfigurationError: Stagehand.MissingLLMConfigurationError,
  PageNotFoundError: Stagehand.PageNotFoundError,
  ResponseBodyError: Stagehand.ResponseBodyError,
  ResponseParseError: Stagehand.ResponseParseError,
  StagehandAPIError: Stagehand.StagehandAPIError,
  StagehandAPIUnauthorizedError: Stagehand.StagehandAPIUnauthorizedError,
  StagehandClickError: Stagehand.StagehandClickError,
  StagehandClosedError: Stagehand.StagehandClosedError,
  StagehandDefaultError: Stagehand.StagehandDefaultError,
  StagehandDomProcessError: Stagehand.StagehandDomProcessError,
  StagehandElementNotFoundError: Stagehand.StagehandElementNotFoundError,
  StagehandEnvironmentError: Stagehand.StagehandEnvironmentError,
  StagehandError: Stagehand.StagehandError,
  StagehandEvalError: Stagehand.StagehandEvalError,
  StagehandHttpError: Stagehand.StagehandHttpError,
  StagehandIframeError: Stagehand.StagehandIframeError,
  StagehandInitError: Stagehand.StagehandInitError,
  StagehandInvalidArgumentError: Stagehand.StagehandInvalidArgumentError,
  StagehandLocatorError: Stagehand.StagehandLocatorError,
  StagehandMissingArgumentError: Stagehand.StagehandMissingArgumentError,
  StagehandNotInitializedError: Stagehand.StagehandNotInitializedError,
  StagehandResponseBodyError: Stagehand.StagehandResponseBodyError,
  StagehandResponseParseError: Stagehand.StagehandResponseParseError,
  StagehandServerError: Stagehand.StagehandServerError,
  StagehandShadowRootMissingError: Stagehand.StagehandShadowRootMissingError,
  StagehandShadowSegmentEmptyError: Stagehand.StagehandShadowSegmentEmptyError,
  StagehandShadowSegmentNotFoundError:
    Stagehand.StagehandShadowSegmentNotFoundError,
  StreamingCallbacksInNonStreamingModeError:
    Stagehand.StreamingCallbacksInNonStreamingModeError,
  StagehandSnapshotError: Stagehand.StagehandSnapshotError,
  TimeoutError: Stagehand.TimeoutError,
  UnsupportedAISDKModelProviderError:
    Stagehand.UnsupportedAISDKModelProviderError,
  UnsupportedModelError: Stagehand.UnsupportedModelError,
  UnsupportedModelProviderError: Stagehand.UnsupportedModelProviderError,
  XPathResolutionError: Stagehand.XPathResolutionError,
  ZodSchemaValidationError: Stagehand.ZodSchemaValidationError,
  ActTimeoutError: Stagehand.ActTimeoutError,
  ObserveTimeoutError: Stagehand.ObserveTimeoutError,
  ExtractTimeoutError: Stagehand.ExtractTimeoutError,
  UnderstudyCommandException: Stagehand.UnderstudyCommandException,
  StagehandSetExtraHTTPHeadersError:
    Stagehand.StagehandSetExtraHTTPHeadersError,
} as const;

// Names of every error class listed in the manifest above; Object.keys()
// only returns string[], so narrow it back to the manifest's literal keys.
type PublicErrorTypeName = keyof typeof publicErrorTypes;
const errorTypes = Object.keys(publicErrorTypes) as PublicErrorTypeName[];

describe("Stagehand public error types", () => {
  describe("errors", () => {
    // One generated case per manifest key: the class exported under that
    // name must produce instances assignable to Error.
    it.each(errorTypes)("%s extends Error", (errorTypeName) => {
      const ExportedError = Stagehand[errorTypeName];
      type ExportedErrorInstance = InstanceType<typeof ExportedError>;
      expectTypeOf<ExportedErrorInstance>().toExtend<Error>();
      void ExportedError; // Mark as used to satisfy ESLint
    });
  });
});


================================================
FILE: packages/core/tests/unit/public-api/public-types.test.ts
================================================
import { describe, expectTypeOf, it } from "vitest";
import * as Stagehand from "@browserbasehq/stagehand";

// Type-level manifest of all expected exported types.
// Types are erased at compile time, so there is nothing to enumerate at runtime:
// every newly exported public type has to be added to this list by hand.
// Unlike export-surface.test.ts, this file will not flag a missing entry automatically.

// eslint-disable-next-line @typescript-eslint/no-unused-vars
type ExpectedExportedTypes = {
  // Types from model.ts
  AvailableModel: Stagehand.AvailableModel;
  AvailableCuaModel: Stagehand.AvailableCuaModel;
  ModelProvider: Stagehand.ModelProvider;
  ClientOptions: Stagehand.ClientOptions;
  ModelConfiguration: Stagehand.ModelConfiguration;
  AnthropicJsonSchemaObject: Stagehand.AnthropicJsonSchemaObject;
  AISDKProvider: Stagehand.AISDKProvider;
  AISDKCustomProvider: Stagehand.AISDKCustomProvider;
  LLMTool: Stagehand.LLMTool;
  // Types from methods.ts
  ActOptions: Stagehand.ActOptions;
  ActResult: Stagehand.ActResult;
  ExtractResult: Stagehand.ExtractResult<Stagehand.StagehandZodSchema>;
  Action: Stagehand.Action;
  HistoryEntry: Stagehand.HistoryEntry;
  ExtractOptions: Stagehand.ExtractOptions;
  ObserveOptions: Stagehand.ObserveOptions;
  ObserveResult: Stagehand.ObserveResult;
  V3FunctionName: Stagehand.V3FunctionName;
  // Types from agent.ts
  Tool: Stagehand.Tool;
  AgentAction: Stagehand.AgentAction;
  AgentResult: Stagehand.AgentResult;
  AgentExecuteOptions: Stagehand.AgentExecuteOptions;
  AgentType: Stagehand.AgentType;
  AgentExecutionOptions: Stagehand.AgentExecutionOptions<Stagehand.AgentExecuteOptions>;
  AgentHandlerOptions: Stagehand.AgentHandlerOptions;
  ActionExecutionResult: Stagehand.ActionExecutionResult;
  ToolUseItem: Stagehand.ToolUseItem;
  AnthropicMessage: Stagehand.AnthropicMessage;
  AnthropicContentBlock: Stagehand.AnthropicContentBlock;
  AnthropicTextBlock: Stagehand.AnthropicTextBlock;
  AnthropicToolResult: Stagehand.AnthropicToolResult;
  ResponseItem: Stagehand.ResponseItem;
  ComputerCallItem: Stagehand.ComputerCallItem;
  FunctionCallItem: Stagehand.FunctionCallItem;
  ResponseInputItem: Stagehand.ResponseInputItem;
  AgentInstance: Stagehand.AgentInstance;
  AgentProviderType: Stagehand.AgentProviderType;
  AgentModelConfig: Stagehand.AgentModelConfig;
  AgentConfig: Stagehand.AgentConfig;
  AgentToolMode: Stagehand.AgentToolMode;
  VariableValue: Stagehand.VariableValue;
  Variables: Stagehand.Variables;
  AgentCallbacks: Stagehand.AgentCallbacks;
  AgentExecuteCallbacks: Stagehand.AgentExecuteCallbacks;
  AgentStreamCallbacks: Stagehand.AgentStreamCallbacks;
  AgentExecuteOptionsBase: Stagehand.AgentExecuteOptionsBase;
  AgentStreamExecuteOptions: Stagehand.AgentStreamExecuteOptions;
  ModelMessage: Stagehand.ModelMessage;
  // Types from agent/tools
  AgentTools: Stagehand.AgentTools;
  AgentToolTypesMap: Stagehand.AgentToolTypesMap;
  AgentUITools: Stagehand.AgentUITools;
  AgentToolCall: Stagehand.AgentToolCall;
  AgentToolResult: Stagehand.AgentToolResult;
  // Types from logs.ts
  LogLevel: Stagehand.LogLevel;
  LogLine: Stagehand.LogLine;
  Logger: Stagehand.Logger;
  // Types from metrics.ts
  StagehandMetrics: Stagehand.StagehandMetrics;
  // Types from options.ts
  V3Env: Stagehand.V3Env;
  LocalBrowserLaunchOptions: Stagehand.LocalBrowserLaunchOptions;
  V3Options: Stagehand.V3Options;
  // Types from page.ts
  AnyPage: Stagehand.AnyPage;
  Page: Stagehand.Page;
  PlaywrightPage: Stagehand.PlaywrightPage;
  PatchrightPage: Stagehand.PatchrightPage;
  PuppeteerPage: Stagehand.PuppeteerPage;
  ConsoleListener: Stagehand.ConsoleListener;
  LoadState: Stagehand.LoadState;
  // Types from LLMClient.ts
  ChatMessage: Stagehand.ChatMessage;
  ChatMessageContent: Stagehand.ChatMessageContent;
  ChatMessageImageContent: Stagehand.ChatMessageImageContent;
  ChatMessageTextContent: Stagehand.ChatMessageTextContent;
  ChatCompletionOptions: Stagehand.ChatCompletionOptions;
  LLMResponse: Stagehand.LLMResponse;
  CreateChatCompletionOptions: Stagehand.CreateChatCompletionOptions;
  LLMUsage: Stagehand.LLMUsage;
  LLMParsedResponse: Stagehand.LLMParsedResponse<Record<string, unknown>>;
  // Types from zodCompat.ts
  StagehandZodSchema: Stagehand.StagehandZodSchema;
  StagehandZodObject: Stagehand.StagehandZodObject;
  InferStagehandSchema: Stagehand.InferStagehandSchema<Stagehand.StagehandZodSchema>;
  JsonSchemaDocument: Stagehand.JsonSchemaDocument;
  // Types from utils.ts
  JsonSchema: Stagehand.JsonSchema;
  JsonSchemaProperty: Stagehand.JsonSchemaProperty;
  // Types from cookies.ts
  Cookie: Stagehand.Cookie;
  CookieParam: Stagehand.CookieParam;
  ClearCookieOptions: Stagehand.ClearCookieOptions;
};

describe("Stagehand public API types", () => {
  describe("AnyPage", () => {
    // AnyPage must be exactly the union of the four exported page types.
    type PageUnion =
      | Stagehand.Page
      | Stagehand.PatchrightPage
      | Stagehand.PlaywrightPage
      | Stagehand.PuppeteerPage;

    it("matches expected type shape", () => {
      expectTypeOf<Stagehand.AnyPage>().toEqualTypeOf<PageUnion>();
    });
  });

  describe("ActOptions", () => {
    // Exact expected shape of ActOptions; every field is optional.
    type ActOptionsShape = {
      model?: Stagehand.ModelConfiguration;
      variables?: Stagehand.Variables;
      timeout?: number;
      page?: Stagehand.AnyPage;
      serverCache?: boolean;
    };

    it("matches expected type shape", () => {
      expectTypeOf<Stagehand.ActOptions>().toEqualTypeOf<ActOptionsShape>();
    });
  });

  describe("ActResult", () => {
    // Exact expected shape of ActResult; only cacheStatus is optional.
    type ActResultShape = {
      success: boolean;
      message: string;
      actionDescription: string;
      actions: Stagehand.Action[];
      cacheStatus?: "HIT" | "MISS";
    };

    it("matches expected type shape", () => {
      expectTypeOf<Stagehand.ActResult>().toEqualTypeOf<ActResultShape>();
    });
  });

  describe("ExtractOptions", () => {
    // Exact expected shape of ExtractOptions; every field is optional.
    type ExtractOptionsShape = {
      model?: Stagehand.ModelConfiguration;
      timeout?: number;
      selector?: string;
      page?: Stagehand.AnyPage;
      serverCache?: boolean;
    };

    it("matches expected type shape", () => {
      expectTypeOf<Stagehand.ExtractOptions>().toEqualTypeOf<ExtractOptionsShape>();
    });
  });

  describe("ObserveOptions", () => {
    // Exact expected shape of ObserveOptions; every field is optional.
    type ObserveOptionsShape = {
      model?: Stagehand.ModelConfiguration;
      timeout?: number;
      selector?: string;
      page?: Stagehand.AnyPage;
      serverCache?: boolean;
    };

    it("matches expected type shape", () => {
      expectTypeOf<Stagehand.ObserveOptions>().toEqualTypeOf<ObserveOptionsShape>();
    });
  });

  describe("ObserveResult", () => {
    it("is an Action array with optional cacheStatus", () => {
      // The result must be usable as a plain Action[] ...
      expectTypeOf<Stagehand.ObserveResult>().toExtend<Stagehand.Action[]>();

      // ... while also carrying an optional cache marker.
      type CacheStatus = Stagehand.ObserveResult["cacheStatus"];
      expectTypeOf<CacheStatus>().toEqualTypeOf<"HIT" | "MISS" | undefined>();
    });
  });

  describe("Action", () => {
    // Exact expected shape of Action: selector and description are required,
    // method and arguments are optional.
    type ActionShape = {
      selector: string;
      description: string;
      method?: string;
      arguments?: string[];
    };

    it("matches expected type shape", () => {
      expectTypeOf<Stagehand.Action>().toEqualTypeOf<ActionShape>();
    });
  });

  describe("AgentAction", () => {
    // AgentAction is a separate type from Action, not an extension
    // It has additional fields like type, reasoning, taskCompleted, etc.
    it("has type field", () => {
      // Index AgentAction directly. Intersecting it with `{ type: string }`
      // first (as this test used to) makes the looked-up property `string`
      // regardless of what AgentAction declares, so the assertion could never
      // fail even if the `type` field were removed.
      expectTypeOf<Stagehand.AgentAction["type"]>().toEqualTypeOf<string>();
    });
  });

  describe("AgentExecuteOptions", () => {
    // Exact expected shape of AgentExecuteOptions: `instruction` is the only
    // required field.
    type AgentExecuteOptionsShape = {
      instruction: string;
      maxSteps?: number;
      page?: Stagehand.AnyPage;
      highlightCursor?: boolean;
      messages?: Stagehand.ModelMessage[];
      signal?: AbortSignal;
      excludeTools?: string[];
      output?: Stagehand.StagehandZodObject;
      callbacks?: Stagehand.AgentExecuteCallbacks;
      variables?: Stagehand.Variables;
      toolTimeout?: number;
      useSearch?: boolean;
    };

    it("matches expected type shape", () => {
      expectTypeOf<Stagehand.AgentExecuteOptions>().toEqualTypeOf<AgentExecuteOptionsShape>();
    });
  });

  describe("AgentStreamExecuteOptions", () => {
    // Exact expected shape of AgentStreamExecuteOptions: `instruction` is the
    // only required field and `callbacks` uses AgentStreamCallbacks.
    type AgentStreamExecuteOptionsShape = {
      instruction: string;
      maxSteps?: number;
      page?: Stagehand.AnyPage;
      highlightCursor?: boolean;
      messages?: Stagehand.ModelMessage[];
      signal?: AbortSignal;
      excludeTools?: string[];
      output?: Stagehand.StagehandZodObject;
      callbacks?: Stagehand.AgentStreamCallbacks;
      variables?: Stagehand.Variables;
      toolTimeout?: number;
      useSearch?: boolean;
    };

    it("matches expected type shape", () => {
      expectTypeOf<Stagehand.AgentStreamExecuteOptions>().toEqualTypeOf<AgentStreamExecuteOptionsShape>();
    });
  });

  describe("AgentExecutionOptions", () => {
    // Expected shape of AgentExecutionOptions once its type parameter is
    // fixed to AgentExecuteOptions.
    type ExecutionOptionsShape = {
      options: Stagehand.AgentExecuteOptions;
      logger: (message: Stagehand.LogLine) => void;
      retries?: number;
    };

    type ActualExecutionOptions =
      Stagehand.AgentExecutionOptions<Stagehand.AgentExecuteOptions>;

    it("matches expected type shape", () => {
      expectTypeOf<ActualExecutionOptions>().toEqualTypeOf<ExecutionOptionsShape>();
    });
  });

  describe("AgentResult", () => {
    // Token and timing accounting nested under AgentResult.usage.
    type UsageShape = {
      input_tokens: number;
      output_tokens: number;
      reasoning_tokens?: number;
      cached_input_tokens?: number;
      inference_time_ms: number;
    };

    // Exact expected shape of AgentResult.
    type AgentResultShape = {
      success: boolean;
      message: string;
      actions: Stagehand.AgentAction[];
      completed: boolean;
      metadata?: Record<string, unknown>;
      usage?: UsageShape;
      messages?: Stagehand.ModelMessage[];
      output?: Record<string, unknown>;
    };

    it("matches expected type shape", () => {
      expectTypeOf<Stagehand.AgentResult>().toEqualTypeOf<AgentResultShape>();
    });
  });

  describe("AgentConfig", () => {
    // Loose contract for AgentConfig: checked with toExtend, so the exported
    // type only has to be assignable to this shape, not identical to it.
    type ModelSetting = string | Stagehand.AgentModelConfig<string>;
    type AgentConfigContract = {
      systemPrompt?: string;
      integrations?: (unknown | string)[];
      tools?: unknown;
      cua?: boolean;
      model?: ModelSetting;
      executionModel?: ModelSetting;
      stream?: boolean;
      mode?: Stagehand.AgentToolMode;
    };

    it("matches expected type shape", () => {
      expectTypeOf<Stagehand.AgentConfig>().toExtend<AgentConfigContract>();
    });
  });

  describe("AgentToolMode", () => {
    it("matches expected type shape", () => {
      // The mode must be exactly this three-member literal union.
      expectTypeOf<Stagehand.AgentToolMode>().toEqualTypeOf<
        "dom" | "hybrid" | "cua"
      >();
    });
  });

  describe("HistoryEntry", () => {
    // Method names a history entry is allowed to carry.
    type RecordedMethod = "act" | "extract" | "observe" | "navigate" | "agent";

    // Exact expected shape of HistoryEntry.
    type HistoryEntryShape = {
      method: RecordedMethod;
      parameters: unknown;
      result: unknown;
      timestamp: string;
    };

    it("matches expected type shape", () => {
      expectTypeOf<Stagehand.HistoryEntry>().toEqualTypeOf<HistoryEntryShape>();
    });
  });

  describe("Cookie", () => {
    // Exact expected shape of Cookie; every field is required.
    type CookieShape = {
      name: string;
      value: string;
      domain: string;
      path: string;
      expires: number;
      httpOnly: boolean;
      secure: boolean;
      sameSite: "Strict" | "Lax" | "None";
    };

    it("matches expected type shape", () => {
      expectTypeOf<Stagehand.Cookie>().toEqualTypeOf<CookieShape>();
    });
  });

  describe("CookieParam", () => {
    // Exact expected shape of CookieParam: only name and value are required.
    type CookieParamShape = {
      name: string;
      value: string;
      url?: string;
      domain?: string;
      path?: string;
      expires?: number;
      httpOnly?: boolean;
      secure?: boolean;
      sameSite?: "Strict" | "Lax" | "None";
    };

    it("matches expected type shape", () => {
      expectTypeOf<Stagehand.CookieParam>().toEqualTypeOf<CookieParamShape>();
    });
  });

  describe("ClearCookieOptions", () => {
    // Each filter is optional and accepts either a string or a RegExp.
    type CookieMatcher = string | RegExp;
    type ClearCookieOptionsShape = {
      name?: CookieMatcher;
      domain?: CookieMatcher;
      path?: CookieMatcher;
    };

    it("matches expected type shape", () => {
      expectTypeOf<Stagehand.ClearCookieOptions>().toEqualTypeOf<ClearCookieOptionsShape>();
    });
  });
});


================================================
FILE: packages/core/tests/unit/public-api/runtime-utils.test.ts
================================================
import { describe, expectTypeOf, it } from "vitest";
import * as Stagehand from "@browserbasehq/stagehand";

describe("Runtime Utils public API types", () => {
  // Each case pins the parameter tuple (or value type) of one exported helper.

  describe("injectUrls", () => {
    it("has correct parameter types", () => {
      expectTypeOf(Stagehand.injectUrls).parameters.branded.toEqualTypeOf<
        [unknown, Array<string | number>, Record<string, string>]
      >();
    });
  });

  describe("isRunningInBun", () => {
    it("has correct parameter types", () => {
      // Takes no arguments at all.
      expectTypeOf(Stagehand.isRunningInBun).parameters.branded.toEqualTypeOf<
        []
      >();
    });
  });

  describe("loadApiKeyFromEnv", () => {
    type LogSink = (logLine: Stagehand.LogLine) => void;

    it("has correct parameter types", () => {
      expectTypeOf(
        Stagehand.loadApiKeyFromEnv,
      ).parameters.branded.toEqualTypeOf<[string | undefined, LogSink]>();
    });
  });

  describe("providerEnvVarMap", () => {
    // A provider maps to either one variable name or a list of them.
    type EnvVarNames = string | Array<string>;
    type EnvVarMapContract = Partial<Record<string, EnvVarNames>>;

    it("maps providers to environment variable names", () => {
      expectTypeOf<
        typeof Stagehand.providerEnvVarMap
      >().toExtend<EnvVarMapContract>();
    });
  });
});


================================================
FILE: packages/core/tests/unit/public-api/schema-utils.test.ts
================================================
import { describe, expectTypeOf, it } from "vitest";
import * as Stagehand from "@browserbasehq/stagehand";

describe("Schema Utils public API types", () => {
  // Most helpers below take a single Stagehand zod schema argument.
  type SingleSchemaParams = [Stagehand.StagehandZodSchema];

  describe("defaultExtractSchema", () => {
    it("infers to the correct type", () => {
      type Inferred = Stagehand.InferStagehandSchema<
        typeof Stagehand.defaultExtractSchema
      >;
      expectTypeOf<Inferred>().toEqualTypeOf<{ extraction: string }>();
    });
  });

  describe("getZodType", () => {
    it("has correct parameter types", () => {
      expectTypeOf(
        Stagehand.getZodType,
      ).parameters.branded.toEqualTypeOf<SingleSchemaParams>();
    });
  });

  describe("isZod3Schema", () => {
    it("has correct parameter types", () => {
      expectTypeOf(
        Stagehand.isZod3Schema,
      ).parameters.branded.toEqualTypeOf<SingleSchemaParams>();
    });
  });

  describe("isZod4Schema", () => {
    it("has correct parameter types", () => {
      expectTypeOf(
        Stagehand.isZod4Schema,
      ).parameters.branded.toEqualTypeOf<SingleSchemaParams>();
    });
  });

  describe("jsonSchemaToZod", () => {
    it("has correct parameter types", () => {
      expectTypeOf(Stagehand.jsonSchemaToZod).parameters.branded.toEqualTypeOf<
        [Stagehand.JsonSchema]
      >();
    });
  });

  describe("pageTextSchema", () => {
    it("infers to the correct type", () => {
      type Inferred = Stagehand.InferStagehandSchema<
        typeof Stagehand.pageTextSchema
      >;
      expectTypeOf<Inferred>().toEqualTypeOf<{ pageText: string }>();
    });
  });

  describe("toGeminiSchema", () => {
    it("has correct parameter types", () => {
      expectTypeOf(
        Stagehand.toGeminiSchema,
      ).parameters.branded.toEqualTypeOf<SingleSchemaParams>();
    });
  });

  describe("toJsonSchema", () => {
    it("has correct parameter types", () => {
      expectTypeOf(
        Stagehand.toJsonSchema,
      ).parameters.branded.toEqualTypeOf<SingleSchemaParams>();
    });
  });

  describe("transformSchema", () => {
    it("has correct parameter types", () => {
      // Schema plus a path made of string and number segments.
      expectTypeOf(Stagehand.transformSchema).parameters.branded.toEqualTypeOf<
        [Stagehand.StagehandZodSchema, Array<string | number>]
      >();
    });
  });

  describe("trimTrailingTextNode", () => {
    it("has correct parameter types", () => {
      expectTypeOf(
        Stagehand.trimTrailingTextNode,
      ).parameters.branded.toEqualTypeOf<[string | undefined]>();
    });
  });

  describe("validateZodSchema", () => {
    it("has correct parameter types", () => {
      // Schema plus the untyped value to validate against it.
      expectTypeOf(
        Stagehand.validateZodSchema,
      ).parameters.branded.toEqualTypeOf<
        [Stagehand.StagehandZodSchema, unknown]
      >();
    });
  });
});


================================================
FILE: packages/core/tests/unit/public-api/timeout-error-types.test.ts
================================================
import { describe, expect, it } from "vitest";
import * as Stagehand from "@browserbasehq/stagehand";

// ============================================================================
// Public Timeout Error Types Runtime Tests
// ============================================================================
// These tests verify the runtime behavior of exported timeout error types,
// complementing the type-level tests in public-error-types.test.ts

describe("Public timeout error types runtime behavior", () => {
  describe("ActTimeoutError", () => {
    it("is exported and extends Error", () => {
      const actTimeout = new Stagehand.ActTimeoutError(1000);
      expect(actTimeout).toBeInstanceOf(Error);
      expect(actTimeout).toBeInstanceOf(Stagehand.ActTimeoutError);
      expect(actTimeout.name).toBe("ActTimeoutError");
    });

    it("contains timeout value in milliseconds in message", () => {
      const { message } = new Stagehand.ActTimeoutError(500);
      expect(message).toContain("500ms");
    });

    it("contains operation name in message", () => {
      const { message } = new Stagehand.ActTimeoutError(100);
      expect(message).toContain("act()");
    });

    it("extends TimeoutError", () => {
      const actTimeout = new Stagehand.ActTimeoutError(1000);
      expect(actTimeout).toBeInstanceOf(Stagehand.TimeoutError);
    });
  });

  describe("ExtractTimeoutError", () => {
    it("is exported and extends Error", () => {
      const extractTimeout = new Stagehand.ExtractTimeoutError(1000);
      expect(extractTimeout).toBeInstanceOf(Error);
      expect(extractTimeout).toBeInstanceOf(Stagehand.ExtractTimeoutError);
      expect(extractTimeout.name).toBe("ExtractTimeoutError");
    });

    it("contains timeout value in milliseconds in message", () => {
      const { message } = new Stagehand.ExtractTimeoutError(1000);
      expect(message).toContain("1000ms");
    });

    it("contains operation name in message", () => {
      const { message } = new Stagehand.ExtractTimeoutError(100);
      expect(message).toContain("extract()");
    });

    it("extends TimeoutError", () => {
      const extractTimeout = new Stagehand.ExtractTimeoutError(1000);
      expect(extractTimeout).toBeInstanceOf(Stagehand.TimeoutError);
    });
  });

  describe("ObserveTimeoutError", () => {
    it("is exported and extends Error", () => {
      const observeTimeout = new Stagehand.ObserveTimeoutError(1000);
      expect(observeTimeout).toBeInstanceOf(Error);
      expect(observeTimeout).toBeInstanceOf(Stagehand.ObserveTimeoutError);
      expect(observeTimeout.name).toBe("ObserveTimeoutError");
    });

    it("contains timeout value in milliseconds in message", () => {
      const { message } = new Stagehand.ObserveTimeoutError(1500);
      expect(message).toContain("1500ms");
    });

    it("contains operation name in message", () => {
      const { message } = new Stagehand.ObserveTimeoutError(100);
      expect(message).toContain("observe()");
    });

    it("extends TimeoutError", () => {
      const observeTimeout = new Stagehand.ObserveTimeoutError(1000);
      expect(observeTimeout).toBeInstanceOf(Stagehand.TimeoutError);
    });
  });

  describe("TimeoutError (base class)", () => {
    // The base class takes the operation label and the timeout in ms.
    it("is exported and extends Error", () => {
      const baseTimeout = new Stagehand.TimeoutError("custom operation", 2000);
      expect(baseTimeout).toBeInstanceOf(Error);
      expect(baseTimeout).toBeInstanceOf(Stagehand.TimeoutError);
    });

    it("contains operation name and timeout in message", () => {
      const { message } = new Stagehand.TimeoutError("custom operation", 2000);
      expect(message).toContain("custom operation");
      expect(message).toContain("2000ms");
    });

    it("extends StagehandError", () => {
      const baseTimeout = new Stagehand.TimeoutError("operation", 1000);
      expect(baseTimeout).toBeInstanceOf(Stagehand.StagehandError);
    });
  });
});


================================================
FILE: packages/core/tests/unit/public-api/tool-type-export.test.ts
================================================
import { describe, expectTypeOf, it, expect } from "vitest";
import * as Stagehand from "@browserbasehq/stagehand";
import { type Tool } from "ai";
import { z } from "zod";

/**
 * Verifies the tool-related exports of Stagehand.
 * The exported `tool` function should be enough for users to define custom
 * tools, so they do not have to install the `ai` package themselves.
 */
describe("Tool exports from AI SDK", () => {
  it("exports Tool type that matches AI SDK Tool type", () => {
    expectTypeOf<Stagehand.Tool>().toEqualTypeOf<Tool>();
  });

  it("exports tool function", () => {
    const exportedKind = typeof Stagehand.tool;
    expect(exportedKind).toBe("function");
  });

  it("tool function can be used to define custom tools", () => {
    const description = "A test tool";
    const inputSchema = z.object({ input: z.string() });

    const customTool = Stagehand.tool({
      description,
      inputSchema,
      execute: async ({ input }) => ({ result: `Processed: ${input}` }),
    });

    expect(customTool).toBeDefined();
    expect(customTool.description).toBe(description);
  });
});


================================================
FILE: packages/core/tests/unit/public-api/v3-core.test.ts
================================================
import { describe, expect, expectTypeOf, it } from "vitest";
import * as Stagehand from "@browserbasehq/stagehand";

describe("V3 Core public API types", () => {
  describe("Stagehand", () => {
    type StagehandInstance = InstanceType<typeof Stagehand.Stagehand>;

    // Structural contract a Stagehand instance must be assignable to.
    type StagehandContract = {
      // Lifecycle
      init: () => Promise<void>;
      close: (opts?: { force?: boolean }) => Promise<void>;
      // Core primitives
      act: (
        input: string | Stagehand.Action,
        options?: Stagehand.ActOptions,
      ) => Promise<Stagehand.ActResult>;
      extract: (...args: unknown[]) => Promise<unknown>;
      observe: (...args: unknown[]) => Promise<Stagehand.Action[]>;
      agent: (config?: Stagehand.AgentConfig) => {
        execute: (
          instructionOrOptions: string | Stagehand.AgentExecuteOptions,
        ) => Promise<Stagehand.AgentResult>;
      };
      // Connection and state accessors
      connectURL: () => string;
      context: unknown;
      metrics: Promise<Stagehand.StagehandMetrics>;
      history: Promise<ReadonlyArray<Stagehand.HistoryEntry>>;
      llmClient: Stagehand.LLMClient;
      browserbaseSessionID: string | undefined;
      browserbaseSessionURL: string | undefined;
      browserbaseDebugURL: string | undefined;
      // Flags and logging
      experimental: boolean;
      logInferenceToFile: boolean;
      verbose: 0 | 1 | 2;
      logger: (logLine: Stagehand.LogLine) => void;
      // Agent replay hooks
      isAgentReplayActive: () => boolean;
      recordAgentReplayStep: (step: unknown) => void;
    };

    it("has correct public interface shape", () => {
      expectTypeOf<StagehandInstance>().toExtend<StagehandContract>();
    });

    it("act accepts Action as first parameter", () => {
      const action = {} as Stagehand.Action;
      const actOptions = {} as Stagehand.ActOptions;
      expectTypeOf<StagehandInstance["act"]>().toBeCallableWith(
        action,
        actOptions,
      );
    });

    it("extract accepts instruction and schema", () => {
      const schema = {} as Stagehand.StagehandZodSchema;
      const extractOptions = {} as Stagehand.ExtractOptions;
      expectTypeOf<StagehandInstance["extract"]>().toBeCallableWith(
        "instruction",
        schema,
        extractOptions,
      );
    });

    it("observe accepts instruction and options", () => {
      const observeOptions = {} as Stagehand.ObserveOptions;
      expectTypeOf<StagehandInstance["observe"]>().toBeCallableWith(
        "instruction",
        observeOptions,
      );
    });

    it("agent execute accepts page option", () => {
      type AgentHandle = ReturnType<StagehandInstance["agent"]>;
      const page = {} as Stagehand.AnyPage;
      expectTypeOf<AgentHandle["execute"]>().toBeCallableWith({
        instruction: "test",
        page,
      } satisfies Stagehand.AgentExecuteOptions);
    });
  });

  describe("StagehandMetrics", () => {
    // Five counters for each of act, extract, observe and agent, plus totals.
    type MetricsShape = {
      actPromptTokens: number;
      actCompletionTokens: number;
      actReasoningTokens: number;
      actCachedInputTokens: number;
      actInferenceTimeMs: number;

      extractPromptTokens: number;
      extractCompletionTokens: number;
      extractReasoningTokens: number;
      extractCachedInputTokens: number;
      extractInferenceTimeMs: number;

      observePromptTokens: number;
      observeCompletionTokens: number;
      observeReasoningTokens: number;
      observeCachedInputTokens: number;
      observeInferenceTimeMs: number;

      agentPromptTokens: number;
      agentCompletionTokens: number;
      agentReasoningTokens: number;
      agentCachedInputTokens: number;
      agentInferenceTimeMs: number;

      totalPromptTokens: number;
      totalCompletionTokens: number;
      totalReasoningTokens: number;
      totalCachedInputTokens: number;
      totalInferenceTimeMs: number;
    };

    it("matches the published metrics shape", () => {
      expectTypeOf<Stagehand.StagehandMetrics>().toEqualTypeOf<MetricsShape>();
    });
  });

  describe("V3", () => {
    // V3 is the same class as Stagehand under a second export name, so its
    // interface shape is already covered by the "Stagehand" cases above.
    it("is exported", () => {
      expect(Stagehand.V3).toBeDefined();
    });
  });

  describe("V3Evaluator", () => {
    type EvaluatorInstance = InstanceType<typeof Stagehand.V3Evaluator>;

    it("is exported", () => {
      expect(Stagehand.V3Evaluator).toBeDefined();
    });

    it("has ask method", () => {
      type AskContract = (options: unknown) => Promise<unknown>;
      expectTypeOf<EvaluatorInstance["ask"]>().toExtend<AskContract>();
    });

    it("has batchAsk method", () => {
      type BatchAskContract = (options: unknown) => Promise<unknown[]>;
      expectTypeOf<
        EvaluatorInstance["batchAsk"]
      >().toExtend<BatchAskContract>();
    });
  });

  describe("V3FunctionName", () => {
    // The function-name type may only contain these literals.
    type KnownFunctionName = "ACT" | "EXTRACT" | "OBSERVE" | "AGENT";

    it("matches the known function name literals", () => {
      expectTypeOf<Stagehand.V3FunctionName>().toExtend<KnownFunctionName>();
    });
  });

  describe("connectToMCPServer", () => {
    // Launch a local server process from a command line.
    type StdioServerConfig = {
      command: string;
      args?: string[];
      env?: Record<string, string>;
    };

    // Connect to a server by URL with optional client/request settings.
    type UrlServerConfig = {
      serverUrl: string | URL;
      clientOptions?: unknown;
      requestOptions?: unknown;
    };

    type ServerConfig = string | URL | StdioServerConfig | UrlServerConfig;

    it("has correct parameter types", () => {
      expectTypeOf(
        Stagehand.connectToMCPServer,
      ).parameters.branded.toEqualTypeOf<[ServerConfig]>();
    });
  });

  describe("LOG_LEVEL_NAMES", () => {
    type LevelNameLookup = Record<Stagehand.LogLevel, string>;

    it("maps numeric levels to strings", () => {
      expectTypeOf<
        typeof Stagehand.LOG_LEVEL_NAMES
      >().toExtend<LevelNameLookup>();
    });
  });
});


================================================
FILE: packages/core/tests/unit/safety-confirmation.test.ts
================================================
import { describe, it, expect, vi } from "vitest";
import { OpenAICUAClient } from "../../lib/v3/agent/OpenAICUAClient.js";
import { GoogleCUAClient } from "../../lib/v3/agent/GoogleCUAClient.js";
import type {
  SafetyCheck,
  SafetyConfirmationHandler,
} from "../../lib/v3/types/public/agent.js";
import type { LogLine } from "../../lib/v3/types/public/logs.js";

// Signature of the logger callback passed to the safety-confirmation methods
// under test; also used as the type argument for `vi.fn` logger mocks.
type LoggerMock = (message: LogLine) => void;

// Shape used to reach `handleSafetyConfirmation` on OpenAICUAClient. The cast
// through `unknown` suggests the method is not on the public type — presumably
// private; confirm against the class.
type OpenAISafetyInternals = {
  handleSafetyConfirmation: (
    this: OpenAICUAClient,
    pendingSafetyChecks: SafetyCheck[],
    logger: LoggerMock,
  ) => Promise<SafetyCheck[] | undefined>;
};

// Unbound method reference; tests invoke it via `.call(client, ...)`.
const openAISafetyInvoker = (
  OpenAICUAClient.prototype as unknown as OpenAISafetyInternals
).handleSafetyConfirmation;

// Shape used to reach `handleSafetyConfirmation` on GoogleCUAClient. The cast
// through `unknown` suggests the method is not on the public type — presumably
// private; confirm against the class.
type GoogleSafetyInternals = {
  handleSafetyConfirmation: (
    this: GoogleCUAClient,
    safetyDecision: unknown,
    logger: LoggerMock,
  ) => Promise<string | undefined>;
};

// Unbound method reference; tests invoke it via `.call(client, ...)`.
const googleSafetyInvoker = (
  GoogleCUAClient.prototype as unknown as GoogleSafetyInternals
).handleSafetyConfirmation;

/**
 * Builds an OpenAICUAClient from fixed placeholder arguments.
 * NOTE(review): the local names below are guesses based on the values —
 * confirm against the OpenAICUAClient constructor signature.
 */
function createOpenAIClient(): OpenAICUAClient {
  const provider = "openai";
  const modelName = "openai/computer-use-preview";
  const instructions = "test instructions";
  const clientOptions = { apiKey: "test" };
  return new OpenAICUAClient(provider, modelName, instructions, clientOptions);
}

/**
 * Builds a GoogleCUAClient from fixed placeholder arguments.
 * NOTE(review): the local names below are guesses based on the values —
 * confirm against the GoogleCUAClient constructor signature.
 */
function createGoogleClient(): GoogleCUAClient {
  const provider = "google";
  const modelName = "google/gemini-2.5-computer-use-preview-10-2025";
  const instructions = "test instructions";
  const clientOptions = { apiKey: "test" };
  return new GoogleCUAClient(provider, modelName, instructions, clientOptions);
}

describe("Safety Confirmation Handler", () => {
  // Spied handler that always resolves with the given `acknowledged` flag.
  const respondWith = (acknowledged: boolean): SafetyConfirmationHandler =>
    vi.fn(async () => ({ acknowledged }));

  describe("OpenAI-style (pending_safety_checks)", () => {
    const pendingChecks: SafetyCheck[] = [
      {
        id: "check-1",
        code: "malicious_instructions",
        message: "Potentially harmful action detected",
      },
    ];

    // Calls the OpenAI client's safety method with the shared checks and a
    // fresh logger mock.
    const invoke = (client: OpenAICUAClient) =>
      openAISafetyInvoker.call(client, pendingChecks, vi.fn<LoggerMock>());

    it("returns checks when handler acknowledges", async () => {
      const handler = respondWith(true);
      const client = createOpenAIClient();
      client.setSafetyConfirmationHandler(handler);

      const outcome = await invoke(client);

      expect(handler).toHaveBeenCalledWith(pendingChecks);
      expect(outcome).toEqual(pendingChecks);
    });

    it("returns undefined when handler rejects", async () => {
      const handler = respondWith(false);
      const client = createOpenAIClient();
      client.setSafetyConfirmationHandler(handler);

      const outcome = await invoke(client);

      expect(handler).toHaveBeenCalledWith(pendingChecks);
      expect(outcome).toBeUndefined();
    });

    it("auto-acknowledges when no handler is set", async () => {
      // No handler registered on this client.
      const outcome = await invoke(createOpenAIClient());
      expect(outcome).toEqual(pendingChecks);
    });
  });

  describe("Google-style (safety_decision)", () => {
    const decisionPayload = {
      decision: "require_confirmation",
      explanation: "Cookie consent dialog detected",
    };

    // Calls the Google client's safety method with the given decision and a
    // fresh logger mock.
    const invoke = (client: GoogleCUAClient, decision: unknown) =>
      googleSafetyInvoker.call(client, decision, vi.fn<LoggerMock>());

    // The single-element check list the handler is expected to receive.
    const checksCarrying = (message: string) => [
      {
        id: "google-safety-decision",
        code: "safety_decision",
        message,
      },
    ];

    it("returns 'true' when handler acknowledges", async () => {
      const handler = respondWith(true);
      const client = createGoogleClient();
      client.setSafetyConfirmationHandler(handler);

      const outcome = await invoke(client, decisionPayload);

      // Object decisions are expected to arrive pretty-printed as JSON.
      expect(handler).toHaveBeenCalledWith(
        checksCarrying(JSON.stringify(decisionPayload, null, 2)),
      );
      expect(outcome).toBe("true");
    });

    it("returns undefined when handler rejects", async () => {
      const handler = respondWith(false);
      const client = createGoogleClient();
      client.setSafetyConfirmationHandler(handler);

      const outcome = await invoke(client, decisionPayload);

      expect(handler).toHaveBeenCalled();
      expect(outcome).toBeUndefined();
    });

    it("auto-acknowledges when no handler is set", async () => {
      // No handler registered on this client.
      const outcome = await invoke(createGoogleClient(), decisionPayload);
      expect(outcome).toBe("true");
    });

    it("handles string safety decisions", async () => {
      const handler = respondWith(true);
      const client = createGoogleClient();
      client.setSafetyConfirmationHandler(handler);

      const outcome = await invoke(client, "Simple string decision");

      // String decisions are expected to be forwarded verbatim.
      expect(handler).toHaveBeenCalledWith(
        checksCarrying("Simple string decision"),
      );
      expect(outcome).toBe("true");
    });
  });
});


================================================
FILE: packages/core/tests/unit/snapshot-a11y-resolvers.test.ts
================================================
import type { Protocol } from "devtools-protocol";
import { beforeEach, describe, expect, it, vi } from "vitest";
import { a11yForFrame } from "../../lib/v3/understudy/a11y/snapshot/a11yTree.js";
import type { AccessibilityTreeResult } from "../../lib/v3/types/private/index.js";
import * as focusSelectors from "../../lib/v3/understudy/a11y/snapshot/focusSelectors.js";
import { MockCDPSession } from "./helpers/mockCDPSession.js";
import { executionContexts } from "../../lib/v3/understudy/executionContextRegistry.js";
import { tryScopedSnapshot } from "../../lib/v3/understudy/a11y/snapshot/capture.js";
import type {
  FrameContext,
  A11yOptions,
} from "../../lib/v3/types/private/index.js";
import type { Page } from "../../lib/v3/understudy/page.js";
import * as domTree from "../../lib/v3/understudy/a11y/snapshot/domTree.js";
import * as a11yTree from "../../lib/v3/understudy/a11y/snapshot/a11yTree.js";
import * as logger from "../../lib/v3/logger.js";

// The "string" literal cast to AXValueType so the AX node fixtures in this
// file can use it as the `type` of their role/name/property values.
const stringType = "string" as Protocol.Accessibility.AXValueType;

/**
 * Returns a fresh two-node accessibility tree: a RootWebArea (node "1") with
 * a single "Docs" link child (node "2") that carries a `url` property.
 */
const baseAxNodes = (): Protocol.Accessibility.AXNode[] => {
  const rootArea: Protocol.Accessibility.AXNode = {
    nodeId: "1",
    role: { type: stringType, value: "RootWebArea" },
    backendDOMNodeId: 100,
    childIds: ["2"],
    ignored: false,
  };

  const docsLink: Protocol.Accessibility.AXNode = {
    nodeId: "2",
    role: { type: stringType, value: "link" },
    name: { type: stringType, value: "Docs" },
    backendDOMNodeId: 101,
    parentId: "1",
    childIds: [],
    properties: [
      {
        name: "url",
        value: { type: stringType, value: "https://example.com" },
      },
    ],
    ignored: false,
  };

  return [rootArea, docsLink];
};

// Handlers for the three CDP `*.enable` commands; each resolves to an empty
// object. Tests spread these into their MockCDPSession handler maps.
const baseHandlers = {
  async "Accessibility.enable"() {
    return {};
  },
  async "Runtime.enable"() {
    return {};
  },
  async "DOM.enable"() {
    return {};
  },
};

describe("a11yForFrame", () => {
  // Builds the options object; only the focus selector and tag-name map vary
  // between the tests in this suite.
  const optionsFor = (
    focusSelector: A11yOptions["focusSelector"],
    tagNameMap: A11yOptions["tagNameMap"],
  ): A11yOptions => ({
    focusSelector,
    experimental: false,
    tagNameMap,
    scrollableMap: {},
    encode: (backend) => `enc-${backend}`,
  });

  beforeEach(() => {
    vi.restoreAllMocks();
  });

  it("returns full outline and url map when no focus selector is provided", async () => {
    const session = new MockCDPSession({
      ...baseHandlers,
      "Accessibility.getFullAXTree": async () => ({ nodes: baseAxNodes() }),
    });
    const opts = optionsFor(undefined, {
      "enc-100": "#document",
      "enc-101": "a",
    });

    const snapshot = await a11yForFrame(session, undefined, opts);

    expect(snapshot.scopeApplied).toBe(false);
    expect(snapshot.urlMap["enc-101"]).toBe("https://example.com");
    expect(snapshot.outline).toContain("Docs");
  });

  it("scopes the tree to the resolved focus selector target", async () => {
    // Base tree with the link (node "2") given a StaticText child (node "3").
    const nodes: Protocol.Accessibility.AXNode[] = [
      ...baseAxNodes().map((node) =>
        node.nodeId === "2" ? { ...node, childIds: ["3"] } : node,
      ),
      {
        nodeId: "3",
        parentId: "2",
        childIds: [],
        role: { type: stringType, value: "StaticText" },
        backendDOMNodeId: 102,
        ignored: false,
      },
    ];

    // The first frame-scoped AX tree request fails once; every other request
    // returns the node list above.
    let frameScopedFailureRaised = false;
    const session = new MockCDPSession({
      ...baseHandlers,
      "Accessibility.getFullAXTree": async (params) => {
        const shouldFail = params?.frameId && !frameScopedFailureRaised;
        if (shouldFail) {
          frameScopedFailureRaised = true;
          throw new Error("does not belong to the target");
        }
        return { nodes };
      },
      "DOM.describeNode": async () => ({
        node: { backendNodeId: 101 },
      }),
    });

    const xpathResolver = vi
      .spyOn(focusSelectors, "resolveObjectIdForXPath")
      .mockResolvedValue("object-1");

    const opts = optionsFor("xpath=//a", { "enc-101": "a" });
    const snapshot = await a11yForFrame(session, "frame-1", opts);

    expect(snapshot.scopeApplied).toBe(true);
    expect(snapshot.outline).not.toContain("RootWebArea");
    expect(xpathResolver).toHaveBeenCalled();
    xpathResolver.mockRestore();
  });

  it("falls back to full tree when resolveObjectId throws", async () => {
    const session = new MockCDPSession({
      ...baseHandlers,
      "Accessibility.getFullAXTree": async () => ({ nodes: baseAxNodes() }),
    });
    // Make the CSS resolver reject.
    vi.spyOn(focusSelectors, "resolveObjectIdForCss").mockRejectedValue(
      new Error("fail"),
    );

    const snapshot = await a11yForFrame(
      session,
      "frame-1",
      optionsFor(".btn", {}),
    );

    expect(snapshot.scopeApplied).toBe(false);
  });
});

describe("resolveObjectIdForXPath", () => {
  beforeEach(() => {
    vi.restoreAllMocks();
  });

  it("evaluates in the target frame's main world when available", async () => {
    // waitForMainWorld resolves to this id; the handler checks it is forwarded
    // as the evaluation's contextId.
    const mainWorldContextId = 42;
    vi.spyOn(executionContexts, "waitForMainWorld").mockResolvedValue(
      mainWorldContextId,
    );
    vi.spyOn(executionContexts, "getMainWorld").mockReturnValue(undefined);

    const session = new MockCDPSession({
      "Runtime.evaluate": async (params) => {
        expect(params?.contextId).toBe(mainWorldContextId);
        return { result: { objectId: "node-obj" } };
      },
    });

    const resolved = await focusSelectors.resolveObjectIdForXPath(
      session,
      "//div",
      "frame-1",
    );

    expect(resolved).toBe("node-obj");
  });

  it("returns null when evaluation throws or reports exception details", async () => {
    // No main world is available, and the evaluation reports an exception.
    vi.spyOn(executionContexts, "waitForMainWorld").mockRejectedValue(
      new Error("missing"),
    );
    vi.spyOn(executionContexts, "getMainWorld").mockReturnValue(undefined);

    const failingEvaluation = {
      result: {},
      exceptionDetails: { exception: { description: "bad" } },
    };
    const session = new MockCDPSession({
      "Runtime.evaluate": async () => failingEvaluation,
    });

    const resolved = await focusSelectors.resolveObjectIdForXPath(
      session,
      "//div",
      "frame-2",
    );

    expect(resolved).toBeNull();
  });
});

describe("resolveObjectIdForCss", () => {
  beforeEach(() => {
    vi.restoreAllMocks();
  });

  it("returns primary evaluation result when available", async () => {
    vi.spyOn(executionContexts, "waitForMainWorld").mockResolvedValue(7);
    const session = new MockCDPSession({
      "Runtime.evaluate": async () => {
        return { result: { objectId: "primary-obj" } };
      },
    });

    const resolved = await focusSelectors.resolveObjectIdForCss(
      session,
      ".btn",
      "frame-1",
    );

    expect(resolved).toBe("primary-obj");
  });

  it("falls back to the pierce selector when the primary lookup fails", async () => {
    // The first evaluation yields no objectId; the second one must carry the
    // pierce helper and produces the final result.
    let attempts = 0;
    const session = new MockCDPSession({
      "Runtime.evaluate": async (params) => {
        attempts += 1;
        const isPrimaryAttempt = attempts === 1;
        if (!isPrimaryAttempt) {
          expect(String(params?.expression)).toContain(
            "resolveCssSelectorPierce",
          );
          return { result: { objectId: "css-obj" } };
        }
        expect(String(params?.expression)).toContain("resolveCssSelector");
        return { result: {} };
      },
    });

    const resolved = await focusSelectors.resolveObjectIdForCss(
      session,
      ".btn",
      undefined,
    );

    expect(resolved).toBe("css-obj");
  });

  it("returns null when both primary and fallback evaluations throw", async () => {
    vi.spyOn(executionContexts, "waitForMainWorld").mockResolvedValue(11);
    vi.spyOn(executionContexts, "getMainWorld").mockReturnValue(undefined);

    // Every evaluation reports exception details and no objectId.
    const failingEvaluation = {
      result: {},
      exceptionDetails: { exception: { description: "fail" } },
    };
    const session = new MockCDPSession({
      "Runtime.evaluate": async () => failingEvaluation,
    });

    const resolved = await focusSelectors.resolveObjectIdForCss(
      session,
      ".missing",
      "frame-1",
    );

    expect(resolved).toBeNull();
  });
});

describe("tryScopedSnapshot", () => {
  // Two-frame layout: frame-2 is a child of the root frame-1.
  const context: FrameContext = {
    rootId: "frame-1",
    frames: ["frame-1", "frame-2"],
    parentByFrame: new Map([
      ["frame-1", null],
      ["frame-2", "frame-1"],
    ]),
  };

  // frame-1 gets ordinal 0; any other frame id gets 1.
  const ordinal = (frameId: string) => {
    return frameId === "frame-1" ? 0 : 1;
  };

  // Minimal Page stand-in whose every frame resolves to the given session.
  const makePage = (
    session: MockCDPSession,
    overrides?: Partial<Page>,
  ): Page => {
    const stub = {
      mainFrameId: () => "frame-1",
      asProtocolFrameTree: () => ({
        frame: { id: "frame-1" as Protocol.Page.FrameId },
        childFrames: [{ frame: { id: "frame-2" as Protocol.Page.FrameId } }],
      }),
      listAllFrameIds: () => ["frame-1", "frame-2"],
      getSessionForFrame: () => session,
      getOrdinal: (fid: string) => ordinal(fid),
      ...overrides,
    };
    return stub as unknown as Page;
  };

  // Stubs domMapsForSession with a single "1-10" div entry.
  const stubDomMaps = () =>
    vi.spyOn(domTree, "domMapsForSession").mockResolvedValue({
      tagNameMap: { "1-10": "div" },
      xpathMap: { "1-10": "/div[1]" },
      scrollableMap: {},
    });

  // Stubs a11yForFrame so it resolves with the supplied result.
  const stubA11y = (result: Partial<AccessibilityTreeResult>) =>
    vi
      .spyOn(a11yTree, "a11yForFrame")
      .mockResolvedValue(result as AccessibilityTreeResult);

  // Silences v3Logger and returns the spy so calls can be asserted.
  const muteLogger = () =>
    vi.spyOn(logger, "v3Logger").mockImplementation(() => {});

  beforeEach(() => {
    vi.restoreAllMocks();
  });

  it("returns scoped snapshot when focus selector resolves via CSS hops", async () => {
    const domMapsSpy = stubDomMaps();
    const a11ySpy = stubA11y({
      outline: "[1-10] div",
      urlMap: { "1-10": "https://example.com" },
      scopeApplied: true,
    });
    vi.spyOn(focusSelectors, "resolveCssFocusFrameAndTail").mockResolvedValue({
      targetFrameId: "frame-2",
      tailSelector: ".btn-inner",
      absPrefix: "/html/body/iframe[1]",
    });
    const page = makePage(new MockCDPSession({}));

    const snapshot = await tryScopedSnapshot(
      page,
      { focusSelector: ".btn" },
      context,
      true,
    );

    expect(snapshot).not.toBeNull();
    // The resolver's absPrefix is expected in front of the frame-local xpath.
    expect(snapshot?.combinedXpathMap["1-10"]).toBe(
      "/html/body/iframe[1]/div[1]",
    );
    expect(domMapsSpy).toHaveBeenCalled();
    expect(a11ySpy).toHaveBeenCalled();
  });

  it("returns null and logs fallback when scope is not applied", async () => {
    stubDomMaps();
    stubA11y({
      outline: "ignored",
      urlMap: {},
      scopeApplied: false,
    });
    const loggerSpy = muteLogger();
    const page = makePage(new MockCDPSession({}));

    const snapshot = await tryScopedSnapshot(
      page,
      { focusSelector: ".btn" },
      context,
      false,
    );

    expect(snapshot).toBeNull();
    expect(loggerSpy).toHaveBeenCalled();
  });

  it("returns null immediately when no focus selector is provided", async () => {
    const page = makePage(new MockCDPSession({}));

    const snapshot = await tryScopedSnapshot(page, {}, context, true);

    expect(snapshot).toBeNull();
  });

  it("supports XPath focus resolution branch", async () => {
    stubDomMaps();
    stubA11y({
      outline: "[1-10] div",
      urlMap: {},
      scopeApplied: true,
    });
    vi.spyOn(focusSelectors, "resolveFocusFrameAndTail").mockResolvedValue({
      targetFrameId: "frame-1",
      tailXPath: "//div[1]",
      absPrefix: "",
    });
    const page = makePage(new MockCDPSession({}));

    const snapshot = await tryScopedSnapshot(
      page,
      { focusSelector: "xpath=//div" },
      context,
      true,
    );

    expect(snapshot).not.toBeNull();
    // With an empty absPrefix the xpath is expected to come through unchanged.
    expect(snapshot?.combinedXpathMap["1-10"]).toBe("/div[1]");
  });

  it("logs and returns null when resolver throws", async () => {
    vi.spyOn(focusSelectors, "resolveCssFocusFrameAndTail").mockRejectedValue(
      new Error("bad selector"),
    );
    const loggerSpy = muteLogger();
    const page = makePage(new MockCDPSession({}));

    const snapshot = await tryScopedSnapshot(
      page,
      { focusSelector: ".bad" },
      context,
      true,
    );

    expect(snapshot).toBeNull();
    expect(loggerSpy).toHaveBeenCalled();
  });
});


================================================
FILE: packages/core/tests/unit/snapshot-a11y-tree-utils.test.ts
================================================
import type { Protocol } from "devtools-protocol";
import { describe, expect, it } from "vitest";
import type {
  A11yNode,
  A11yOptions,
} from "../../lib/v3/types/private/snapshot.js";
import {
  buildHierarchicalTree,
  decorateRoles,
  extractUrlFromAXNode,
  isStructural,
  removeRedundantStaticTextChildren,
} from "../../lib/v3/understudy/a11y/snapshot/a11yTree.js";

/** Wraps a plain string in an AXValue whose `type` is "string". */
const axString = (value: string): Protocol.Accessibility.AXValue => {
  return { type: "string", value };
};

// Baseline options shared by the suites below: no focus selector, empty
// lookup maps, and an encoder that prefixes the backend node id with "enc-".
const defaultOpts: A11yOptions = {
  focusSelector: undefined,
  experimental: false,
  tagNameMap: {},
  scrollableMap: {},
  encode(backendNodeId: number) {
    return "enc-" + String(backendNodeId);
  },
};

/**
 * Builds an AXNode from `overrides`, filling in defaults for missing fields:
 * random `nodeId` / `backendDOMNodeId`, a "generic" role, empty `childIds` and
 * `properties`, and `ignored: false`. The remaining fields are copied as-is.
 */
const makeAxNode = (
  overrides: Partial<Protocol.Accessibility.AXNode> = {},
): Protocol.Accessibility.AXNode => {
  const nodeId = overrides.nodeId ?? String(Math.random());
  const backendDOMNodeId =
    overrides.backendDOMNodeId ?? Math.floor(Math.random() * 1e6);
  const role = overrides.role ?? axString("generic");
  const childIds = overrides.childIds ?? [];
  const properties = overrides.properties ?? [];
  const ignored = overrides.ignored ?? false;
  // These have no default and may stay undefined.
  const { parentId, name, description, value } = overrides;

  return {
    nodeId,
    backendDOMNodeId,
    role,
    childIds,
    parentId,
    properties,
    name,
    description,
    value,
    ignored,
  };
};

describe("decorateRoles", () => {
  it("marks scrollable DOM nodes with tag labels and encoded ids", () => {
    const opts: A11yOptions = {
      ...defaultOpts,
      tagNameMap: {
        "enc-1": "div",
        "enc-2": "html",
        "enc-3": "#document",
        "enc-4": "#svg",
      },
      scrollableMap: { "enc-1": true, "enc-4": true },
    };

    // Backend ids 1..4 in order; only the first node has a non-generic role.
    const rolesByBackendId = ["region", "generic", "generic", "generic"];
    const nodes = rolesByBackendId.map((roleName, index) =>
      makeAxNode({
        backendDOMNodeId: index + 1,
        role: axString(roleName),
      }),
    );

    const decorated = decorateRoles(nodes, opts);

    expect(decorated).toMatchObject([
      { encodedId: "enc-1", role: "scrollable, div" },
      { encodedId: "enc-2", role: "scrollable, html" },
      { encodedId: "enc-3", role: "generic" },
      { encodedId: "enc-4", role: "scrollable, svg" },
    ]);
  });

  it("falls back when encoding fails", () => {
    // An encoder that always throws should leave encodedId unset.
    const throwingEncode = (): never => {
      throw new Error("boom");
    };
    const opts: A11yOptions = { ...defaultOpts, encode: throwingEncode };

    const [first] = decorateRoles([makeAxNode({ backendDOMNodeId: 4 })], opts);

    expect(first?.encodedId).toBeUndefined();
  });
});

describe("buildHierarchicalTree", () => {
  const opts: A11yOptions = {
    ...defaultOpts,
    tagNameMap: { root: "div", child: "span" },
  };

  // Builds an A11yNode fixture. `encodedId` defaults to the node id, and
  // `parentId` is always present (explicitly undefined for roots).
  const a11yNode = (
    role: string,
    name: string,
    nodeId: string,
    links: { parentId?: string; childIds?: string[]; encodedId?: string } = {},
  ): A11yNode => ({
    role,
    name,
    nodeId,
    encodedId: links.encodedId ?? nodeId,
    parentId: links.parentId,
    childIds: links.childIds ?? [],
  });

  // A nameless generic root with a single nameless generic leaf.
  const namelessGenericPair = (): A11yNode[] => [
    a11yNode("generic", "", "root", { childIds: ["child"] }),
    a11yNode("generic", "", "child", { parentId: "root" }),
  ];

  it("drops structural nodes without children or names", async () => {
    const { tree } = await buildHierarchicalTree(namelessGenericPair(), opts);
    expect(tree).toEqual([]);
  });

  it("promotes select/combobox tag names for structural nodes", async () => {
    const nodes: A11yNode[] = [
      a11yNode("combobox", "Select", "root", { childIds: ["child"] }),
      a11yNode("StaticText", "Option", "child", { parentId: "root" }),
    ];
    const selectOpts: A11yOptions = { ...opts, tagNameMap: { root: "select" } };

    const { tree } = await buildHierarchicalTree(nodes, selectOpts);

    expect(tree[0]?.role).toBe("select");
  });

  it("drops structural parents with a single cleaned child while keeping it in place", async () => {
    const nodes: A11yNode[] = [
      a11yNode("generic", "", "root", { childIds: ["child"] }),
      a11yNode("StaticText", "Ok", "child", { parentId: "root" }),
    ];

    const { tree } = await buildHierarchicalTree(nodes, opts);

    expect(tree[0]?.role).toBe("StaticText");
  });

  it("drops structural parents entirely when all descendants are pruned", async () => {
    const { tree } = await buildHierarchicalTree(namelessGenericPair(), opts);
    expect(tree).toEqual([]);
  });

  it("renames structural nodes to their tag names when not combobox", async () => {
    const nodes: A11yNode[] = [
      a11yNode("generic", "Container", "root", {
        childIds: ["child-a", "child-b"],
      }),
      a11yNode("StaticText", "A", "child-a", { parentId: "root" }),
      a11yNode("StaticText", "B", "child-b", { parentId: "root" }),
    ];
    const sectionOpts: A11yOptions = {
      ...opts,
      tagNameMap: { root: "section" },
    };

    const { tree } = await buildHierarchicalTree(nodes, sectionOpts);

    expect(tree[0]?.role).toBe("section");
  });

  it("skips nodes with negative node ids early", async () => {
    const nodes: A11yNode[] = [
      a11yNode("button", "Hidden", "-1", { encodedId: "hidden" }),
    ];

    const { tree } = await buildHierarchicalTree(nodes, opts);

    expect(tree).toEqual([]);
  });
});

describe("isStructural", () => {
  it("marks generic/none/InlineTextBox roles as structural", () => {
    // Role name paired with the verdict isStructural should give for it.
    const expectations: Array<[string, boolean]> = [
      ["generic", true],
      ["none", true],
      ["InlineTextBox", true],
      ["button", false],
    ];

    for (const [role, structural] of expectations) {
      expect(isStructural(role)).toBe(structural);
    }
  });
});

describe("removeRedundantStaticTextChildren", () => {
  // StaticText child fixture.
  const staticText = (name: string, nodeId: string): A11yNode => ({
    role: "StaticText",
    name,
    nodeId,
  });

  it("removes static text children whose concatenated text equals the parent name", () => {
    const parent: A11yNode = { role: "button", name: "HelloWorld", nodeId: "root" };
    // "Hello" + "World" equals the parent name; the button child is unrelated.
    const children: A11yNode[] = [
      staticText("Hello", "c1"),
      staticText("World", "c2"),
      { role: "button", name: "Child", nodeId: "c3" },
    ];

    const remaining = removeRedundantStaticTextChildren(parent, children);

    expect(remaining).toEqual([{ role: "button", name: "Child", nodeId: "c3" }]);
  });

  it("keeps static text when combined text differs", () => {
    const parent: A11yNode = { role: "button", name: "Hello World", nodeId: "root" };
    const children: A11yNode[] = [
      staticText("Hello", "c1"),
      staticText("Mars", "c2"),
    ];

    const remaining = removeRedundantStaticTextChildren(parent, children);

    expect(remaining).toEqual(children);
  });

  it("returns original children when parent name is empty", () => {
    // The parent has no `name` property at all.
    const parent: A11yNode = { role: "button", nodeId: "root" };
    const children: A11yNode[] = [
      staticText("Hello", "c1"),
      staticText("World", "c2"),
    ];

    const remaining = removeRedundantStaticTextChildren(parent, children);

    expect(remaining).toEqual(children);
  });
});

describe("extractUrlFromAXNode", () => {
  it("returns trimmed URL string from node properties", () => {
    // The url value has surrounding spaces and follows an unrelated property.
    const linkNode = makeAxNode({
      properties: [
        { name: "busy", value: axString("bar") },
        { name: "url", value: axString(" https://example.com ") },
      ],
    });

    const url = extractUrlFromAXNode(linkNode);

    expect(url).toBe("https://example.com");
  });

  it("returns undefined when url property missing or invalid", () => {
    const withoutProperties = makeAxNode({ properties: [] });
    // A url property whose value is a number rather than a string.
    const withNumericUrl = makeAxNode({
      properties: [{ name: "url", value: { type: "number", value: 123 } }],
    });

    expect(extractUrlFromAXNode(withoutProperties)).toBeUndefined();
    expect(extractUrlFromAXNode(withNumericUrl)).toBeUndefined();
  });
});


================================================
FILE: packages/core/tests/unit/snapshot-capture-orchestration.test.ts
================================================
import type { Protocol } from "devtools-protocol";
import { beforeEach, describe, expect, it, vi } from "vitest";
import type { CDPSessionLike } from "../../lib/v3/understudy/cdp.js";
import type { Page } from "../../lib/v3/understudy/page.js";
import type {
  FrameContext,
  SessionDomIndex,
} from "../../lib/v3/types/private/index.js";
import * as capture from "../../lib/v3/understudy/a11y/snapshot/capture.js";
import * as a11yTree from "../../lib/v3/understudy/a11y/snapshot/a11yTree.js";
import * as domTree from "../../lib/v3/understudy/a11y/snapshot/domTree.js";
import * as focusSelectors from "../../lib/v3/understudy/a11y/snapshot/focusSelectors.js";
import { MockCDPSession } from "./helpers/mockCDPSession.js";

/**
 * Builds a partial Page.Frame fixture for `id`, with a loader id derived from
 * it and fixed example.com URL, origin and MIME values. It is cast because
 * only these fields are filled in.
 */
const makeProtocolFrame = (id: string): Protocol.Page.Frame => {
  const partialFrame = {
    id,
    loaderId: `${id}-loader`,
    url: "https://example.com",
    securityOrigin: "https://example.com",
    mimeType: "text/html",
  };
  return partialFrame as unknown as Protocol.Page.Frame;
};

/** Builds a FrameTree node for `id` with the given child subtrees (none by default). */
const makeFrameTree = (
  id: string,
  children: Protocol.Page.FrameTree[] = [],
): Protocol.Page.FrameTree => {
  const frame = makeProtocolFrame(id);
  return { frame, childFrames: children };
};

// Names of the Page members that the stubbed pages in this file provide.
type PageStubKey =
  | "mainFrameId"
  | "asProtocolFrameTree"
  | "listAllFrameIds"
  | "getSessionForFrame"
  | "getOrdinal";

// The slice of Page that makePage fills in.
type PageStub = Pick<Page, PageStubKey>;

/**
 * Builds a Page stand-in describing a single-frame page ("frame-1", ordinal 0)
 * backed by one MockCDPSession. Any member listed in `overrides` replaces the
 * default.
 */
const makePage = (overrides: Partial<PageStub> = {}): Page => {
  const fallbackSession = new MockCDPSession({}, "default-session");
  const defaults: PageStub = {
    mainFrameId: () => "frame-1",
    asProtocolFrameTree: () => makeFrameTree("frame-1"),
    listAllFrameIds: () => ["frame-1"],
    getSessionForFrame: () => fallbackSession,
    getOrdinal: () => 0,
  };
  const stub = Object.assign({}, defaults, overrides);
  return stub as unknown as Page;
};

/**
 * Returns a fresh SessionDomIndex fixture describing a main document
 * (backend id 100) that hosts an iframe element (150) whose content document
 * is rooted at 200 and contains one scrollable div (201).
 */
const makeSessionIndex = (): SessionDomIndex => {
  // One row per backend node:
  // [backendNodeId, absolute XPath, tag name, backend id of owning document root]
  const rows: Array<[number, string, string, number]> = [
    [100, "/", "#document", 100],
    [101, "/html[1]", "html", 100],
    [102, "/html[1]/body[1]", "body", 100],
    [150, "/html[1]/body[1]/iframe[1]", "iframe", 100],
    [200, "/html[1]/body[1]/iframe[1]", "#document", 200],
    [201, "/html[1]/body[1]/iframe[1]/div[1]", "div", 200],
  ];

  const absByBe = new Map<number, string>();
  const tagByBe = new Map<number, string>();
  const docRootOf = new Map<number, number>();
  for (const [backendId, absXPath, tag, docRoot] of rows) {
    absByBe.set(backendId, absXPath);
    tagByBe.set(backendId, tag);
    docRootOf.set(backendId, docRoot);
  }

  return {
    rootBackend: 100,
    absByBe,
    tagByBe,
    scrollByBe: new Map([[201, true]]),
    docRootOf,
    contentDocRootByIframe: new Map([[150, 200]]),
  };
};

// Undo every vi.spyOn replacement before each test so stubs installed by one
// test never leak into the next.
beforeEach(() => {
  vi.restoreAllMocks();
});

// buildFrameContext should flatten the protocol frame tree into a root id,
// the list of frame ids, and a child -> parent lookup.
describe("buildFrameContext", () => {
  it("indexes parent relationships from the frame tree", () => {
    // frame-1
    // ├── frame-2
    // │   └── frame-3
    // └── frame-4
    const nestedBranch = makeFrameTree("frame-2", [makeFrameTree("frame-3")]);
    const leafBranch = makeFrameTree("frame-4");
    const tree = makeFrameTree("frame-1", [nestedBranch, leafBranch]);
    const page = makePage({
      asProtocolFrameTree: () => tree,
      listAllFrameIds: () => ["frame-1", "frame-2", "frame-3", "frame-4"],
    });

    const { rootId, frames, parentByFrame } = capture.buildFrameContext(page);

    expect(rootId).toBe("frame-1");
    expect(frames).toEqual(["frame-1", "frame-2", "frame-3", "frame-4"]);
    // The root has no parent; every other frame maps to its direct parent.
    expect(parentByFrame.get("frame-1")).toBeNull();
    expect(parentByFrame.get("frame-2")).toBe("frame-1");
    expect(parentByFrame.get("frame-3")).toBe("frame-2");
    expect(parentByFrame.get("frame-4")).toBe("frame-1");
  });
});

// Exercises capture.buildSessionIndexes with domTree.buildSessionDomIndex
// stubbed out, checking how frames are grouped by the id of their CDP session.
describe("buildSessionIndexes", () => {
  it("deduplicates frames that share the same CDP session id", async () => {
    const session = new MockCDPSession({}, "session-a");
    const page = makePage({
      // Every frame lookup returns the same session instance, so buildSessionIndexes
      // should call buildSessionDomIndex only once and reuse the result.
      getSessionForFrame: () => session,
    });
    const idx = makeSessionIndex();
    // Replace the real index builder so the test can count invocations and
    // control the value that ends up in the result map.
    const spy = vi
      .spyOn(domTree, "buildSessionDomIndex")
      .mockResolvedValue(idx);

    const result = await capture.buildSessionIndexes(
      page,
      ["frame-1", "frame-2"],
      true,
    );

    expect(spy).toHaveBeenCalledTimes(1); // only one DOM.getDocument per session id
    // The boolean passed to buildSessionIndexes is expected to be forwarded as-is.
    expect(spy).toHaveBeenCalledWith(session, true);
    expect(result.get("session-a")).toBe(idx);
  });

  it("builds indexes for sessions without ids using the 'root' key", async () => {
    // Hand-rolled session whose id is undefined; MockCDPSession is not used here
    // because the test needs an explicitly id-less CDPSessionLike.
    const sessionWithoutId: CDPSessionLike = {
      id: undefined,
      async send<R = unknown>(
        _method: string,
        _params?: Record<string, unknown>,
      ): Promise<R> {
        // `void` marks the parameters as intentionally unused.
        void _method;
        void _params;
        return {} as R;
      },
      on() {},
      off() {},
      async close() {},
    };
    const sessionWithId = new MockCDPSession({}, "child-session");
    const page = makePage({
      // frame-1 lives on the id-less session; every other frame on the child session.
      getSessionForFrame: (frameId: string) =>
        frameId === "frame-1" ? sessionWithoutId : sessionWithId,
    });

    const idxA = makeSessionIndex();
    const idxB = makeSessionIndex();
    // First call resolves to idxA, second to idxB, so each result-map entry can
    // be traced back to the call that produced it.
    const spy = vi
      .spyOn(domTree, "buildSessionDomIndex")
      .mockResolvedValueOnce(idxA)
      .mockResolvedValueOnce(idxB);

    const result = await capture.buildSessionIndexes(
      page,
      ["frame-1", "frame-2"],
      false,
    );

    // Verifies the helper invokes buildSessionDomIndex once for each unique session,
    // keying anonymous sessions as "root" so downstream lookups remain stable.
    expect(spy).toHaveBeenNthCalledWith(1, sessionWithoutId, false);
    expect(spy).toHaveBeenNthCalledWith(2, sessionWithId, false);
    expect(result.get("root")).toBe(idxA);
    expect(result.get("child-session")).toBe(idxB);
  });
});

// Exercises capture.collectPerFrameMaps with a11yTree.a11yForFrame stubbed.
// The fixture from makeSessionIndex models a main document (backend id 100)
// with an iframe element (150) whose content document is rooted at 200.
describe("collectPerFrameMaps", () => {
  it("builds per-frame xpath/tag maps and outlines from a shared session index", async () => {
    // Both frames share one session; the frame-owner lookup answers with the
    // iframe element (150) from the fixture.
    const session = new MockCDPSession(
      {
        "DOM.getFrameOwner": async () => ({ backendNodeId: 150 }),
      },
      "session-a",
    );
    const page = makePage({
      getSessionForFrame: () => session,
      // Ordinals show up as the prefix of the map keys asserted below ("0-…", "1-…").
      getOrdinal: (frameId: string) => (frameId === "frame-1" ? 0 : 1),
    });
    const context: FrameContext = {
      rootId: "frame-1",
      frames: ["frame-1", "frame-2"],
      parentByFrame: new Map([
        ["frame-1", null],
        ["frame-2", "frame-1"],
      ]),
    };
    const sessionIndex = makeSessionIndex();
    // Pre-populated index: nothing in this test stubs buildSessionDomIndex.
    const sessionToIndex = new Map([[session.id, sessionIndex]]);

    // Each frame gets a distinguishable outline and url map entry.
    vi.spyOn(a11yTree, "a11yForFrame").mockImplementation(
      async (_sess, frameId) => ({
        outline: `outline-${frameId}`,
        urlMap: { [`url-${frameId}`]: `https://${frameId}.test` },
        scopeApplied: false,
      }),
    );

    const result = await capture.collectPerFrameMaps(
      page,
      context,
      sessionToIndex,
      { experimental: true },
      true,
      context.frames,
    );

    expect(result.perFrameOutlines).toEqual([
      { frameId: "frame-1", outline: "outline-frame-1" },
      { frameId: "frame-2", outline: "outline-frame-2" },
    ]);
    // Root frame: paths are the absolute paths from the session index.
    const rootMaps = result.perFrameMaps.get("frame-1");
    expect(rootMaps?.xpathMap["0-100"]).toBe("/");
    expect(rootMaps?.xpathMap["0-101"]).toBe("/html[1]");
    expect(rootMaps?.xpathMap["0-102"]).toBe("/html[1]/body[1]");
    // Child frame: paths are relative to its own document root (200), so the
    // iframe prefix "/html[1]/body[1]/iframe[1]" is stripped.
    const childMaps = result.perFrameMaps.get("frame-2");
    expect(childMaps?.xpathMap["1-200"]).toBe("/");
    expect(childMaps?.xpathMap["1-201"]).toBe("/div[1]");
    expect(childMaps?.scrollableMap["1-201"]).toBe(true);
    expect(childMaps?.urlMap).toEqual({
      "url-frame-2": "https://frame-2.test",
    });
    // Exactly one owner lookup is expected across the two frames.
    expect(session.callsFor("DOM.getFrameOwner")).toHaveLength(1);
  });

  it("builds a missing session index on demand and memoizes it", async () => {
    const session = new MockCDPSession({}, "new-session");
    const page = makePage({
      getSessionForFrame: () => session,
      getOrdinal: () => 2,
    });
    const context: FrameContext = {
      rootId: "frame-9",
      frames: ["frame-9"],
      parentByFrame: new Map([["frame-9", null]]),
    };
    const idx = makeSessionIndex();
    const buildSpy = vi
      .spyOn(domTree, "buildSessionDomIndex")
      .mockResolvedValue(idx);
    vi.spyOn(a11yTree, "a11yForFrame").mockResolvedValue({
      outline: "outline",
      urlMap: {},
      scopeApplied: false,
    });

    // Starts empty: the index for "new-session" has to be built during the call.
    const sessionToIndex = new Map<string, SessionDomIndex>();
    const result = await capture.collectPerFrameMaps(
      page,
      context,
      sessionToIndex,
      undefined,
      false,
      context.frames,
    );

    expect(buildSpy).toHaveBeenCalledWith(session, false);
    // The freshly built index must have been stored back into the caller's map.
    expect(sessionToIndex.get("new-session")).toBe(idx);
    expect(result.perFrameMaps.get("frame-9")?.xpathMap["2-100"]).toBe("/");
  });

  it("skips frames that are not listed in the frameIds argument", async () => {
    const session = new MockCDPSession({}, "session-a");
    const page = makePage({
      getSessionForFrame: () => session,
      getOrdinal: (frameId: string) => (frameId === "frame-1" ? 0 : 1),
    });
    // The context knows about two frames...
    const context: FrameContext = {
      rootId: "frame-1",
      frames: ["frame-1", "frame-2"],
      parentByFrame: new Map([
        ["frame-1", null],
        ["frame-2", "frame-1"],
      ]),
    };
    const sessionIndex = makeSessionIndex();
    const sessionToIndex = new Map([[session.id, sessionIndex]]);

    const a11ySpy = vi.spyOn(a11yTree, "a11yForFrame").mockResolvedValue({
      outline: "outline",
      urlMap: {},
      scopeApplied: false,
    });

    // ...but only frame-1 is requested via the final frameIds argument.
    const result = await capture.collectPerFrameMaps(
      page,
      context,
      sessionToIndex,
      undefined,
      true,
      ["frame-1"],
    );

    expect(a11ySpy).toHaveBeenCalledTimes(1);
    expect(result.perFrameMaps.has("frame-2")).toBe(false);
    expect(result.perFrameOutlines.map((o) => o.frameId)).toEqual(["frame-1"]);
  });
});

// End-to-end orchestration tests for capture.captureHybridSnapshot with the
// focus-selector, DOM and accessibility helpers replaced by spies.
describe("captureHybridSnapshot", () => {
  it("returns early when the scoped snapshot path succeeds", async () => {
    const session = new MockCDPSession({}, "session-a");
    const page = makePage({
      getSessionForFrame: () => session,
    });
    const options = { focusSelector: "/html" };

    // The focus selector resolves to the main frame with nothing left to walk.
    vi.spyOn(focusSelectors, "resolveFocusFrameAndTail").mockResolvedValue({
      targetFrameId: "frame-1",
      tailXPath: "",
      absPrefix: "",
    });
    const domMapsSpy = vi
      .spyOn(domTree, "domMapsForSession")
      .mockResolvedValue({
        tagNameMap: { "0-100": "#document" },
        xpathMap: { "0-100": "/" },
        scrollableMap: {},
      });
    // scopeApplied: true signals that the scoped accessibility pass succeeded.
    const a11ySpy = vi.spyOn(a11yTree, "a11yForFrame").mockResolvedValue({
      outline: "scoped outline",
      urlMap: { "0-100": "https://frame-1.test" },
      scopeApplied: true,
    });
    // Tripwire: the full per-session index must not be built on the scoped path.
    const buildIndexSpy = vi
      .spyOn(domTree, "buildSessionDomIndex")
      .mockImplementation(() => {
        throw new Error("should not build session index when scoped");
      });

    const result = await capture.captureHybridSnapshot(page, options);

    expect(result.combinedTree).toBe("scoped outline");
    expect(result.combinedUrlMap["0-100"]).toBe("https://frame-1.test");
    expect(domMapsSpy).toHaveBeenCalled();
    expect(a11ySpy).toHaveBeenCalled();
    expect(buildIndexSpy).not.toHaveBeenCalled();
  });

  it("scoped snapshot still succeeds when iframe inclusion is disabled", async () => {
    // Same setup as the previous test, with includeIframes: false added to the
    // options; the scoped path is expected to behave identically.
    const session = new MockCDPSession({}, "session-a");
    const page = makePage({
      getSessionForFrame: () => session,
    });
    const options = { focusSelector: "/html", includeIframes: false };

    vi.spyOn(focusSelectors, "resolveFocusFrameAndTail").mockResolvedValue({
      targetFrameId: "frame-1",
      tailXPath: "",
      absPrefix: "",
    });
    const domMapsSpy = vi
      .spyOn(domTree, "domMapsForSession")
      .mockResolvedValue({
        tagNameMap: { "0-100": "#document" },
        xpathMap: { "0-100": "/" },
        scrollableMap: {},
      });
    const a11ySpy = vi.spyOn(a11yTree, "a11yForFrame").mockResolvedValue({
      outline: "scoped outline",
      urlMap: { "0-100": "https://frame-1.test" },
      scopeApplied: true,
    });
    // Tripwire: the full per-session index must not be built on the scoped path.
    const buildIndexSpy = vi
      .spyOn(domTree, "buildSessionDomIndex")
      .mockImplementation(() => {
        throw new Error("should not build session index when scoped");
      });

    const result = await capture.captureHybridSnapshot(page, options);

    expect(result.combinedTree).toBe("scoped outline");
    expect(result.combinedUrlMap["0-100"]).toBe("https://frame-1.test");
    expect(domMapsSpy).toHaveBeenCalled();
    expect(a11ySpy).toHaveBeenCalled();
    expect(buildIndexSpy).not.toHaveBeenCalled();
  });

  it("collects per-frame data and merges it when no scoped snapshot is available", async () => {
    // The owner of the child frame is the iframe element (150) of the fixture.
    const session = new MockCDPSession(
      {
        "DOM.getFrameOwner": async () => ({ backendNodeId: 150 }),
      },
      "session-a",
    );
    // Two-frame page: frame-1 (ordinal 0) hosts frame-2 (ordinal 1).
    const page = makePage({
      asProtocolFrameTree: () =>
        makeFrameTree("frame-1", [makeFrameTree("frame-2")]),
      listAllFrameIds: () => ["frame-1", "frame-2"],
      getSessionForFrame: () => session,
      getOrdinal: (frameId: string) => (frameId === "frame-1" ? 0 : 1),
    });

    const idx = makeSessionIndex();
    vi.spyOn(domTree, "buildSessionDomIndex").mockResolvedValue(idx);
    // The parent outline mentions the iframe host ("0-150"); the child outline
    // is the text expected to appear in the combined tree.
    vi.spyOn(a11yTree, "a11yForFrame").mockImplementation(
      async (_sess, frameId) => ({
        outline:
          frameId === "frame-1"
            ? "[0-150] iframe host"
            : "[1-200] child subtree",
        urlMap: { [`url-${frameId}`]: `https://${frameId}.test` },
        scopeApplied: false,
      }),
    );

    // No options: there is no focus selector, so the full per-frame path runs.
    const snapshot = await capture.captureHybridSnapshot(page);

    expect(snapshot.combinedTree).toContain("[1-200] child subtree");
    expect(snapshot.combinedXpathMap["0-100"]).toBe("/");
    // In the combined map the child node's path carries the iframe host prefix.
    expect(snapshot.combinedXpathMap["1-201"]).toBe(
      "/html[1]/body[1]/iframe[1]/div[1]",
    );
    expect(snapshot.combinedUrlMap["url-frame-2"]).toBe("https://frame-2.test");
    expect(snapshot.perFrame?.map((pf) => pf.frameId)).toEqual([
      "frame-1",
      "frame-2",
    ]);
  });

  it("omits iframe frames when includeIframes is false", async () => {
    // Same two-frame page as the previous test.
    const session = new MockCDPSession(
      {
        "DOM.getFrameOwner": async () => ({ backendNodeId: 150 }),
      },
      "session-a",
    );
    const page = makePage({
      asProtocolFrameTree: () =>
        makeFrameTree("frame-1", [makeFrameTree("frame-2")]),
      listAllFrameIds: () => ["frame-1", "frame-2"],
      getSessionForFrame: () => session,
      getOrdinal: (frameId: string) => (frameId === "frame-1" ? 0 : 1),
    });

    const idx = makeSessionIndex();
    vi.spyOn(domTree, "buildSessionDomIndex").mockResolvedValue(idx);
    const a11ySpy = vi
      .spyOn(a11yTree, "a11yForFrame")
      .mockImplementation(async (_sess, frameId) => ({
        outline:
          frameId === "frame-1"
            ? "[0-150] iframe host"
            : "[1-200] child subtree",
        urlMap: { [`url-${frameId}`]: `https://${frameId}.test` },
        scopeApplied: false,
      }));

    const snapshot = await capture.captureHybridSnapshot(page, {
      includeIframes: false,
    });

    // Only the main frame is processed: one a11y pass, no frame-owner lookups,
    // and nothing from frame-2 in the combined output.
    expect(a11ySpy).toHaveBeenCalledTimes(1);
    expect(session.callsFor("DOM.getFrameOwner")).toHaveLength(0);
    expect(snapshot.perFrame?.map((pf) => pf.frameId)).toEqual(["frame-1"]);
    expect(snapshot.combinedXpathMap["1-201"]).toBeUndefined();
    expect(snapshot.combinedTree).not.toContain("[1-200] child subtree");
  });
});


================================================
FILE: packages/core/tests/unit/snapshot-cbor.test.ts
================================================
import { describe, expect, it } from "vitest";
import type { Protocol } from "devtools-protocol";

import { captureHybridSnapshot } from "../../lib/v3/understudy/a11y/snapshot/index.js";
import { MockCDPSession } from "./helpers/mockCDPSession.js";
import type { Page } from "../../lib/v3/understudy/page.js";
import { StagehandDomProcessError } from "../../lib/v3/types/public/sdkErrors.js";
import { CDPSessionLike } from "../../lib/v3/understudy/cdp.js";

// Shape of a mocked CDP command handler: receives the command's params (if
// any) and returns the response, either directly or as a promise.
type Handler = (params?: Record<string, unknown>) => Promise<unknown> | unknown;

/**
 * Builds a single-frame Page stand-in whose only frame ("root", ordinal 0)
 * is served by the given session. Only the five members defined below exist
 * on the returned object.
 */
function createFakePage(session: CDPSessionLike): Page {
  const rootFrame: Protocol.Page.Frame = {
    id: "root" as Protocol.Page.FrameId,
    loaderId: "root-loader" as Protocol.Network.LoaderId,
    url: "http://fake",
    domainAndRegistry: "fake",
    securityOrigin: "http://fake",
    mimeType: "text/html",
    secureContextType: "Secure",
    crossOriginIsolatedContextType: "NotIsolated",
    gatedAPIFeatures: [],
  };
  // Created once so every asProtocolFrameTree() call returns the same object.
  const frameTree: Protocol.Page.FrameTree = {
    frame: rootFrame,
    childFrames: [],
  };

  const stub = {
    mainFrameId() {
      return "root";
    },
    asProtocolFrameTree() {
      return frameTree;
    },
    listAllFrameIds() {
      return ["root"];
    },
    getSessionForFrame() {
      return session;
    },
    getOrdinal() {
      return 0;
    },
  };
  return stub as unknown as Page;
}

/**
 * Returns a fully populated DOM fixture: #document > HTML > BODY > DIV.
 * Every node's childNodeCount matches its realized children, and nodeId
 * equals backendNodeId (1 through 4, top to bottom).
 */
function completeDomTree(): Protocol.DOM.Node {
  const div = {
    nodeId: 4,
    backendNodeId: 4,
    nodeType: 1,
    nodeName: "DIV",
    childNodeCount: 0,
    children: [],
  };
  const body = {
    nodeId: 3,
    backendNodeId: 3,
    nodeType: 1,
    nodeName: "BODY",
    childNodeCount: 1,
    children: [div],
  };
  const html = {
    nodeId: 2,
    backendNodeId: 2,
    nodeType: 1,
    nodeName: "HTML",
    childNodeCount: 1,
    children: [body],
  };
  const documentNode = {
    nodeId: 1,
    backendNodeId: 1,
    nodeType: 9,
    nodeName: "#document",
    childNodeCount: 1,
    children: [html],
  };
  return documentNode as Protocol.DOM.Node;
}

/**
 * Returns a DOM fixture cut off below HTML: the HTML node declares one child
 * (childNodeCount: 1) but its children array is empty.
 */
function truncatedDomTree(): Protocol.DOM.Node {
  const htmlWithoutChildren = {
    nodeId: 2,
    backendNodeId: 2,
    nodeType: 1,
    nodeName: "HTML",
    childNodeCount: 1,
    children: [],
  };
  const documentNode = {
    nodeId: 1,
    backendNodeId: 1,
    nodeType: 9,
    nodeName: "#document",
    childNodeCount: 1,
    children: [htmlWithoutChildren],
  };
  return documentNode as Protocol.DOM.Node;
}

/**
 * Returns the HTML subtree (HTML > BODY > DIV) with all children realized;
 * it uses the same ids as the HTML node of truncatedDomTree.
 */
function htmlWithChildren(): Protocol.DOM.Node {
  const div = {
    nodeId: 4,
    backendNodeId: 4,
    nodeType: 1,
    nodeName: "DIV",
    childNodeCount: 0,
    children: [],
  };
  const body = {
    nodeId: 3,
    backendNodeId: 3,
    nodeType: 1,
    nodeName: "BODY",
    childNodeCount: 1,
    children: [div],
  };
  const html = {
    nodeId: 2,
    backendNodeId: 2,
    nodeType: 1,
    nodeName: "HTML",
    childNodeCount: 1,
    children: [body],
  };
  return html as Protocol.DOM.Node;
}

/**
 * Returns a two-node accessibility tree: a RootWebArea bound to backend node 2
 * with one "generic" child named "Content" bound to backend node 4.
 */
function simpleAxNodes(): Protocol.Accessibility.AXNode[] {
  const stringType: Protocol.Accessibility.AXValueType = "string";
  const stringValue = (value: string) => ({ type: stringType, value });

  const rootArea = {
    nodeId: "1",
    role: stringValue("RootWebArea"),
    backendDOMNodeId: 2,
    childIds: ["2"],
    ignored: false,
  };
  const contentNode = {
    nodeId: "2",
    role: stringValue("generic"),
    name: stringValue("Content"),
    backendDOMNodeId: 4,
    parentId: "1",
    childIds: [] as string[],
    ignored: false,
  };
  return [rootArea, contentNode];
}

// Handlers shared by every test in this file: the three enable commands
// answer with an empty object and the accessibility tree is served from
// simpleAxNodes(). Tests spread this map and add their own DOM handlers.
const baseHandlers: Record<string, Handler> = {
  async "DOM.enable"() {
    return {};
  },
  async "Runtime.enable"() {
    return {};
  },
  async "Accessibility.enable"() {
    return {};
  },
  async "Accessibility.getFullAXTree"() {
    const nodes = simpleAxNodes();
    return { nodes };
  },
};

/** Creates a fresh Error carrying the CBOR stack-limit message used by these tests. */
function makeCborError(): Error {
  const message = "CBOR: stack limit exceeded";
  return new Error(message);
}

// Drives captureHybridSnapshot against a mock session whose DOM commands fail
// with a "CBOR: stack limit exceeded" error, and checks the `depth` values
// used on the retries.
describe("captureHybridSnapshot CBOR fallbacks", () => {
  it("retries DOM.getDocument with reduced depths before succeeding", async () => {
    let domCalls = 0;
    const session = new MockCDPSession({
      ...baseHandlers,
      "DOM.getDocument": async (params) => {
        domCalls += 1;
        // First attempt fails with the CBOR error; the retry must use depth 256.
        if (domCalls === 1) throw makeCborError();
        expect(params?.depth).toBe(256);
        return { root: completeDomTree() };
      },
    });

    const page = createFakePage(session);
    const snapshot = await captureHybridSnapshot(page);

    expect(snapshot.combinedTree).toContain("html");
    // Recorded call log: unlimited depth (-1) first, then the 256 fallback.
    const depths = session
      .callsFor("DOM.getDocument")
      .map((c) => c.params?.depth);
    expect(depths).toEqual([-1, 256]);
  });

  it("throws StagehandDomProcessError after all DOM.getDocument attempts fail", async () => {
    // Every attempt fails with the CBOR error, whatever depth is requested.
    const session = new MockCDPSession({
      ...baseHandlers,
      "DOM.getDocument": async () => {
        throw makeCborError();
      },
    });

    const page = createFakePage(session);
    await expect(captureHybridSnapshot(page)).rejects.toThrow(
      StagehandDomProcessError,
    );
  });

  it("hydrates truncated nodes by retrying DOM.describeNode depths", async () => {
    let domAttempts = 0;
    let describeAttempts = 0;

    const session = new MockCDPSession({
      ...baseHandlers,
      "DOM.getDocument": async (params) => {
        domAttempts += 1;
        if (domAttempts === 1) throw makeCborError();
        expect(params?.depth).toBe(256);
        // The successful retry returns a tree whose HTML node has no realized
        // children, which forces the hydration step.
        return { root: truncatedDomTree() };
      },
      "DOM.describeNode": async (params) => {
        describeAttempts += 1;
        // Hydration also fails once before succeeding at depth 64.
        if (describeAttempts === 1) throw makeCborError();
        expect(params?.depth).toBe(64);
        return { node: htmlWithChildren() };
      },
    });

    const page = createFakePage(session);
    const snapshot = await captureHybridSnapshot(page);

    const describeDepths = session
      .callsFor("DOM.describeNode")
      .map((c) => c.params?.depth);
    expect(describeDepths).toEqual([-1, 64]);
    // The DIV only exists in the hydrated subtree, so its presence in the
    // xpath map shows that the describeNode result was merged in.
    expect(snapshot.combinedXpathMap["0-4"]).toBe("/html[1]/body[1]/div[1]");
  });
});


================================================
FILE: packages/core/tests/unit/snapshot-dom-session-builders.test.ts
================================================
import type { Protocol } from "devtools-protocol";
import { describe, expect, it } from "vitest";
import {
  buildSessionDomIndex,
  domMapsForSession,
  getDomTreeWithFallback,
  hydrateDomTree,
} from "../../lib/v3/understudy/a11y/snapshot/domTree.js";
import { StagehandDomProcessError } from "../../lib/v3/types/public/sdkErrors.js";
import { MockCDPSession } from "./helpers/mockCDPSession.js";

// Module-wide counter feeding both nodeId and backendNodeId, so every
// auto-assigned id in this file is unique.
let nextNodeId = 1;

/**
 * Builds a Protocol.DOM.Node with sensible defaults (a childless DIV element).
 *
 * Ids are drawn from the shared counter only when not overridden. localName
 * defaults to the lower-cased nodeName and childNodeCount to the number of
 * supplied children. shadowRoots, contentDocument and isScrollable are
 * copied from `overrides` as-is (possibly undefined).
 */
const makeDomNode = (
  overrides: Partial<Protocol.DOM.Node> = {},
): Protocol.DOM.Node => {
  // nodeId is resolved before backendNodeId so counter values are handed out
  // in that order.
  const ids = {
    nodeId: overrides.nodeId ?? nextNodeId++,
    backendNodeId: overrides.backendNodeId ?? nextNodeId++,
  };
  const tag = overrides.nodeName ?? "DIV";
  const kids = overrides.children ?? [];

  return {
    ...ids,
    nodeName: tag,
    nodeType: overrides.nodeType ?? 1,
    localName: overrides.localName ?? tag.toLowerCase(),
    nodeValue: overrides.nodeValue ?? "",
    childNodeCount: overrides.childNodeCount ?? kids.length,
    children: kids,
    shadowRoots: overrides.shadowRoots,
    contentDocument: overrides.contentDocument,
    isScrollable: overrides.isScrollable,
  };
};

/**
 * Builds the DOM fixture shared by the index/map tests and returns every
 * node by name so tests can look up the generated backend ids:
 *
 *   #document (root)
 *   └── HTML
 *       └── BODY
 *           ├── DIV (scrollable)
 *           └── IFRAME
 *               └── #document (iframeDoc, attached as contentDocument)
 *                   └── HTML
 *                       └── BODY (scrollable)
 *                           └── P
 */
const buildSampleDomTree = () => {
  const element = (
    nodeName: string,
    extra: Partial<Protocol.DOM.Node> = {},
  ): Protocol.DOM.Node => makeDomNode({ nodeName, ...extra });
  const documentNode = (children: Protocol.DOM.Node[]): Protocol.DOM.Node =>
    makeDomNode({ nodeName: "#document", nodeType: 9, children });

  // Nodes are created innermost-first, iframe document before main document.
  const iframeChild = element("P");
  const iframeBody = element("BODY", {
    children: [iframeChild],
    isScrollable: true,
  });
  const iframeHtml = element("HTML", { children: [iframeBody] });
  const iframeDoc = documentNode([iframeHtml]);
  const iframeElement = element("IFRAME", { contentDocument: iframeDoc });

  const scrollDiv = element("DIV", { isScrollable: true });
  const body = element("BODY", { children: [scrollDiv, iframeElement] });
  const html = element("HTML", { children: [body] });
  const root = documentNode([html]);

  return {
    root,
    html,
    body,
    scrollDiv,
    iframeElement,
    iframeDoc,
    iframeHtml,
    iframeBody,
    iframeChild,
  };
};

// hydrateDomTree is given a node that declares one child but has none
// realized, and a mock session that controls what DOM.describeNode returns.
describe("hydrateDomTree", () => {
  it("expands truncated nodes by calling DOM.describeNode", async () => {
    const child = makeDomNode({ nodeName: "DIV" });
    // Truncated: childNodeCount says 1, children is empty.
    const root = makeDomNode({
      nodeName: "HTML",
      childNodeCount: 1,
      children: [],
    });

    // describeNode answers with the same node, now carrying its child.
    const session = new MockCDPSession({
      "DOM.describeNode": async () => ({
        node: {
          ...root,
          children: [child],
          childNodeCount: 1,
        },
      }),
    });

    await hydrateDomTree(session, root, true);
    // The original object is patched in place with the described children.
    expect(root.children).toEqual([child]);
  });

  it("retries describeNode when CBOR errors occur before succeeding", async () => {
    const child = makeDomNode({ nodeName: "DIV" });
    const root = makeDomNode({
      nodeName: "HTML",
      childNodeCount: 1,
      children: [],
    });

    let attempts = 0;
    const session = new MockCDPSession({
      "DOM.describeNode": async () => {
        attempts++;
        // Fail only the first attempt with the CBOR stack-limit message.
        if (attempts === 1) throw new Error("CBOR: stack limit exceeded");
        return { node: { ...root, children: [child], childNodeCount: 1 } };
      },
    });

    await hydrateDomTree(session, root, true);
    expect(attempts).toBe(2);
    expect(root.children).toEqual([child]);
  });

  it("throws StagehandDomProcessError after exhausting describeNode retries", async () => {
    const root = makeDomNode({
      nodeName: "HTML",
      childNodeCount: 1,
      children: [],
    });
    // Every describeNode attempt fails with the CBOR error.
    const session = new MockCDPSession({
      "DOM.describeNode": async () => {
        throw new Error("CBOR: stack limit exceeded");
      },
    });

    await expect(hydrateDomTree(session, root, true)).rejects.toBeInstanceOf(
      StagehandDomProcessError,
    );
  });
});

// getDomTreeWithFallback: retry behaviour of DOM.getDocument when the
// response fails with a CBOR stack-limit error versus any other error.
describe("getDomTreeWithFallback", () => {
  it("retries DOM.getDocument after CBOR errors and returns the hydrated root", async () => {
    const root = makeDomNode({
      nodeName: "#document",
      nodeType: 9,
      children: [],
    });
    // Records the depth of every DOM.getDocument call in order.
    const depths: number[] = [];
    const session = new MockCDPSession({
      "DOM.getDocument": async (params) => {
        const depth = (params?.depth ?? 0) as number;
        depths.push(depth);
        // Only the unlimited-depth request (-1) fails.
        if (depth === -1) throw new Error("CBOR: stack limit exceeded");
        return { root };
      },
      "DOM.describeNode": async () => ({ node: root }),
    });

    const result = await getDomTreeWithFallback(session, true);
    // The very object returned by the mock is handed back to the caller.
    expect(result).toBe(root);
    expect(depths).toEqual([-1, 256]);
  });

  it("propagates non-CBOR DOM.getDocument errors", async () => {
    const session = new MockCDPSession({
      "DOM.getDocument": async () => {
        throw new Error("network fail");
      },
    });
    // The original error message must surface unchanged.
    await expect(getDomTreeWithFallback(session, false)).rejects.toThrow(
      "network fail",
    );
  });

  it("throws StagehandDomProcessError when all depth attempts hit CBOR limits", async () => {
    // Every depth fails with the CBOR error, so no attempt can succeed.
    const session = new MockCDPSession({
      "DOM.getDocument": async () => {
        throw new Error("CBOR: stack limit exceeded");
      },
    });
    await expect(getDomTreeWithFallback(session, false)).rejects.toBeInstanceOf(
      StagehandDomProcessError,
    );
  });
});

// buildSessionDomIndex is run over the buildSampleDomTree fixture (a main
// document containing a scrollable DIV and an IFRAME with its own document).
describe("buildSessionDomIndex", () => {
  it("collects absolute paths, scrollability, and content-document metadata", async () => {
    const tree = buildSampleDomTree();
    // DOM.getDocument serves the whole fixture in one response.
    const session = new MockCDPSession({
      "DOM.enable": async () => ({}),
      "DOM.getDocument": async () => ({ root: tree.root }),
      "DOM.describeNode": async () => ({ node: tree.root }),
    });

    const index = await buildSessionDomIndex(session, true);

    // All lookups are keyed by backendNodeId.
    expect(index.rootBackend).toBe(tree.root.backendNodeId);
    expect(index.absByBe.get(tree.body.backendNodeId)).toBe("/html[1]/body[1]");
    expect(index.absByBe.get(tree.scrollDiv.backendNodeId)).toBe(
      "/html[1]/body[1]/div[1]",
    );
    expect(index.scrollByBe.get(tree.scrollDiv.backendNodeId)).toBe(true);
    // Nodes inside the iframe are attributed to the iframe's document root...
    expect(index.docRootOf.get(tree.iframeHtml.backendNodeId)).toBe(
      tree.iframeDoc.backendNodeId,
    );
    // ...and the iframe element maps to that content document.
    expect(
      index.contentDocRootByIframe.get(tree.iframeElement.backendNodeId),
    ).toBe(tree.iframeDoc.backendNodeId);
  });
});

// domMapsForSession over the buildSampleDomTree fixture; map keys are produced
// by the `encode` callback that each test passes in.
describe("domMapsForSession", () => {
  it("derives frame-relative xpath/tag/scrollable maps for a frame's document root", async () => {
    const tree = buildSampleDomTree();
    const session = new MockCDPSession({
      "DOM.enable": async () => ({}),
      "DOM.getDocument": async () => ({ root: tree.root }),
      // The frame's owner is the fixture's IFRAME element.
      "DOM.getFrameOwner": async () => ({
        backendNodeId: tree.iframeElement.backendNodeId,
      }),
      "DOM.describeNode": async () => ({ node: tree.root }),
    });

    // Key format used for this test: "<frameId>-<backendNodeId>".
    const encode = (frameId: string, backendNodeId: number) =>
      `${frameId}-${backendNodeId}`;
    const maps = await domMapsForSession(
      session,
      "frame-A",
      true,
      encode,
      true,
    );

    const iframeDocKey = `frame-A-${tree.iframeDoc.backendNodeId}`;
    const iframeBodyKey = `frame-A-${tree.iframeBody.backendNodeId}`;
    const iframeChildKey = `frame-A-${tree.iframeChild.backendNodeId}`;

    // Paths are relative to the iframe's own document, not to the main page.
    expect(maps.tagNameMap[iframeDocKey]).toBe("#document");
    expect(maps.xpathMap[iframeDocKey]).toBe("/");
    expect(maps.xpathMap[iframeBodyKey]).toBe("/html[1]/body[1]");
    expect(maps.xpathMap[iframeChildKey]).toBe("/html[1]/body[1]/p[1]");
    expect(maps.scrollableMap[iframeBodyKey]).toBe(true);
    // Nodes of the main document are not part of this frame's maps.
    expect(Object.keys(maps.tagNameMap)).not.toContain(
      `frame-A-${tree.html.backendNodeId}`,
    );
  });

  it("falls back to the root document when frame owner lookup fails", async () => {
    const tree = buildSampleDomTree();
    const session = new MockCDPSession({
      "DOM.enable": async () => ({}),
      "DOM.getDocument": async () => ({ root: tree.root }),
      // Owner lookup rejects, so the frame cannot be tied to an iframe element.
      "DOM.getFrameOwner": async () => {
        throw new Error("owner lookup failed");
      },
      "DOM.describeNode": async () => ({ node: tree.root }),
    });

    const encode = (frameId: string, backendNodeId: number) =>
      `${frameId}-${backendNodeId}`;
    const maps = await domMapsForSession(
      session,
      "frame-B",
      false,
      encode,
      true,
    );

    // With no owner, the maps cover the main document's nodes instead.
    expect(maps.xpathMap[`frame-B-${tree.html.backendNodeId}`]).toBe(
      "/html[1]",
    );
    expect(maps.xpathMap[`frame-B-${tree.scrollDiv.backendNodeId}`]).toBe(
      "/html[1]/body[1]/div[1]",
    );
  });
});


================================================
FILE: packages/core/tests/unit/snapshot-dom-tree-utils.test.ts
================================================
import type { Protocol } from "devtools-protocol";
import { describe, expect, it } from "vitest";
import {
  collectDomTraversalTargets,
  findNodeByBackendId,
  mergeDomNodes,
  shouldExpandNode,
} from "../../lib/v3/understudy/a11y/snapshot/domTree.js";

// Shared counter for auto-assigned nodeId / backendNodeId values.
let nextNodeId = 1;

/**
 * Builds a DIV-like Protocol.DOM.Node and applies `overrides` on top.
 *
 * Two counter values are always consumed (nodeId first, then backendNodeId),
 * even when the overrides replace them. childNodeCount defaults to the
 * number of supplied children, or 0 when none are given. Optional structural
 * fields (children, shadowRoots, contentDocument) exist only when overridden.
 */
const makeNode = (
  overrides: Partial<Protocol.DOM.Node> = {},
): Protocol.DOM.Node => {
  const nodeId = nextNodeId++;
  const backendNodeId = nextNodeId++;
  const impliedChildCount = overrides.children?.length ?? 0;

  const defaults: Protocol.DOM.Node = {
    nodeId,
    backendNodeId,
    nodeType: 1,
    nodeName: "DIV",
    localName: "div",
    nodeValue: "",
    childNodeCount: overrides.childNodeCount ?? impliedChildCount,
  };
  // Overrides win over the defaults, key by key.
  return Object.assign(defaults, overrides);
};

// shouldExpandNode compares a node's declared childNodeCount with the number
// of children actually present on it.
describe("shouldExpandNode", () => {
  it("returns true when declared children exceed realized children", () => {
    // Two children declared, only one present.
    const partiallyLoaded = makeNode({
      childNodeCount: 2,
      children: [makeNode()],
    });

    const needsExpansion = shouldExpandNode(partiallyLoaded);

    expect(needsExpansion).toBe(true);
  });

  it("returns false when all declared children are realized", () => {
    // One child declared, one present.
    const onlyChild = makeNode();
    const fullyLoaded = makeNode({
      childNodeCount: 1,
      children: [onlyChild],
    });

    const needsExpansion = shouldExpandNode(fullyLoaded);

    expect(needsExpansion).toBe(false);
  });
});

// mergeDomNodes(target, source) updates `target` in place with the structural
// fields of `source`.
describe("mergeDomNodes", () => {
  it("overrides structural fields with expanded node data", () => {
    // Target starts with stale children, shadow roots and content document.
    const staleChild = makeNode({ nodeName: "SPAN" });
    const staleShadow = makeNode({ nodeName: "shadow-old" });
    const staleDocument = makeNode({ nodeName: "doc-old" });
    const target = makeNode({
      childNodeCount: 1,
      children: [staleChild],
      shadowRoots: [staleShadow],
      contentDocument: staleDocument,
    });

    // Source carries a replacement for every structural field.
    const freshChildren = [makeNode({ nodeName: "DIV" })];
    const freshDocument = makeNode({ nodeName: "doc-new" });
    const source = makeNode({
      childNodeCount: 3,
      children: freshChildren,
      shadowRoots: [],
      contentDocument: freshDocument,
    });

    mergeDomNodes(target, source);

    expect(target.childNodeCount).toBe(3);
    expect(target.children).toEqual(source.children);
    expect(target.shadowRoots).toEqual([]);
    expect(target.contentDocument?.nodeName).toBe("doc-new");
  });

  it("preserves original structures when source omits them", () => {
    const existingChild = makeNode();
    const target = makeNode({
      childNodeCount: 1,
      children: [existingChild],
    });
    // Source only declares a count; it has no `children` key at all.
    const source = makeNode({ childNodeCount: 5 });

    mergeDomNodes(target, source);

    expect(target.childNodeCount).toBe(5);
    expect(target.children).toEqual([existingChild]);
  });
});

// collectDomTraversalTargets lists every node reachable one hop below a node.
describe("collectDomTraversalTargets", () => {
  it("returns children, shadow roots, and content document in order", () => {
    const firstChild = makeNode({ nodeName: "CHILD-A" });
    const secondChild = makeNode({ nodeName: "CHILD-B" });
    const shadowRoot = makeNode({ nodeName: "SHADOW" });
    const contentDocument = makeNode({ nodeName: "CONTENT" });
    const host = makeNode({
      children: [firstChild, secondChild],
      shadowRoots: [shadowRoot],
      contentDocument,
    });

    // Expected order: light-DOM children, then shadow roots, then the
    // content document.
    const expectedOrder = [
      firstChild,
      secondChild,
      shadowRoot,
      contentDocument,
    ];
    expect(collectDomTraversalTargets(host)).toEqual(expectedOrder);
  });
});

// findNodeByBackendId searches a DOM subtree for a node with a given
// backendNodeId.
describe("findNodeByBackendId", () => {
  it("finds nodes nested within children and shadow roots", () => {
    // The needle sits two levels down, next to an unrelated sibling.
    const needle = makeNode({ backendNodeId: 999, nodeName: "TARGET" });
    const sibling = makeNode();
    const branch = makeNode({ children: [sibling, needle] });
    const shadowRoot = makeNode();
    const haystack = makeNode({
      children: [branch],
      shadowRoots: [shadowRoot],
    });

    const found = findNodeByBackendId(haystack, 999);

    // Identity check: the exact node object must be returned.
    expect(found).toBe(needle);
  });

  it("returns undefined when no node matches the backend id", () => {
    const lightChild = makeNode();
    const shadowRoot = makeNode();
    const haystack = makeNode({
      children: [lightChild],
      shadowRoots: [shadowRoot],
    });

    const found = findNodeByBackendId(haystack, 123456);

    expect(found).toBeUndefined();
  });
});


================================================
FILE: packages/core/tests/unit/snapshot-focus-selectors-utils.test.ts
================================================
import type { Step } from "../../lib/v3/types/private/snapshot.js";
import { describe, expect, it } from "vitest";
import {
  buildXPathFromSteps,
  IFRAME_STEP_RE,
  listChildrenOf,
  parseXPathToSteps,
} from "../../lib/v3/understudy/a11y/snapshot/focusSelectors.js";

// parseXPathToSteps: splitting an XPath string into axis-tagged steps.
describe("parseXPathToSteps", () => {
  it("records axis direction and normalized names", () => {
    // The input mixes surrounding whitespace, "/" and "//" hops, and an upper-case tag.
    const parsed = parseXPathToSteps(" //iframe[1]/div[2]//SPAN ");
    const expected = [
      { axis: "desc", raw: "iframe[1]", name: "iframe" },
      { axis: "child", raw: "div[2]", name: "div" },
      { axis: "desc", raw: "SPAN", name: "span" },
    ];

    expect(parsed).toEqual(expected);
  });

  it("drops empty segments and returns [] for blank input", () => {
    for (const blankish of ["   ", "/ "]) {
      expect(parseXPathToSteps(blankish)).toEqual([]);
    }
  });
});

// buildXPathFromSteps: serialising a step list back into an XPath string.
describe("buildXPathFromSteps", () => {
  it("reconstructs descendant and child hops as a string", () => {
    // "child" hops are expected to render as "/", "desc" hops as "//".
    const hops: ReadonlyArray<Step> = [
      { axis: "child", raw: "iframe[1]", name: "iframe" },
      { axis: "desc", raw: "div[@id='main']", name: "div" },
      { axis: "child", raw: "span", name: "span" },
    ];

    const xpath = buildXPathFromSteps(hops);
    expect(xpath).toBe("/iframe[1]//div[@id='main']/span");
  });

  it("returns '/' for empty sequences", () => {
    const noHops: ReadonlyArray<Step> = [];
    expect(buildXPathFromSteps(noHops)).toBe("/");
  });
});

// IFRAME_STEP_RE must accept iframe/frame steps (with or without an index) and reject frameset.
describe("IFRAME_STEP_RE — frame boundary detection", () => {
  it("matches both iframe and frame with optional index", () => {
    const frameSteps = ["iframe", "iframe[1]", "frame", "frame[4]"];
    for (const step of frameSteps) {
      expect(IFRAME_STEP_RE.test(step)).toBe(true);
    }
  });

  it("does NOT match frameset", () => {
    const framesetSteps = ["frameset", "frameset[1]"];
    for (const step of framesetSteps) {
      expect(IFRAME_STEP_RE.test(step)).toBe(false);
    }
  });
});

// Frameset-era pages: <frame> steps count as frame boundaries, <frameset> steps do not.
describe("parseXPathToSteps — frameset XPaths", () => {
  it("parses a frameset page XPath with frame[N] steps", () => {
    const parsed = parseXPathToSteps(
      "/html[1]/frameset[1]/frame[4]/html[1]/body[1]/table[1]",
    );
    const expected = [
      { axis: "child", raw: "html[1]", name: "html" },
      { axis: "child", raw: "frameset[1]", name: "frameset" },
      { axis: "child", raw: "frame[4]", name: "frame" },
      { axis: "child", raw: "html[1]", name: "html" },
      { axis: "child", raw: "body[1]", name: "body" },
      { axis: "child", raw: "table[1]", name: "table" },
    ];
    expect(parsed).toEqual(expected);

    // Of all six steps only frame[4] may be classified as a frame boundary.
    const boundaries = parsed.filter(({ name }) => IFRAME_STEP_RE.test(name));
    expect(boundaries).toHaveLength(1);
    expect(boundaries[0].raw).toBe("frame[4]");
  });

  it("detects iframe boundaries in standard iframe XPaths", () => {
    const parsed = parseXPathToSteps(
      "/html[1]/body[1]/div[2]/iframe[1]/html[1]/body[1]/p[1]",
    );

    const boundaries = parsed.filter(({ name }) => IFRAME_STEP_RE.test(name));
    expect(boundaries).toHaveLength(1);
    expect(boundaries[0].raw).toBe("iframe[1]");
  });

  it("does NOT detect frameset as a frame boundary", () => {
    const parsed = parseXPathToSteps("/html[1]/frameset[1]/frame[2]");

    const boundaries = parsed.filter(({ name }) => IFRAME_STEP_RE.test(name));
    expect(boundaries).toHaveLength(1);
    // frameset[1] is skipped; the single hit is frame[2].
    expect(boundaries[0].raw).toBe("frame[2]");
  });
});

// listChildrenOf: direct children only, read from a child -> parent frame map.
describe("listChildrenOf", () => {
  it("returns direct children whose parent matches the provided id", () => {
    // frame-1 is the root, frame-2/3 its children, frame-4 a grandchild via frame-2.
    const parents = new Map<string, string | null>()
      .set("frame-1", null)
      .set("frame-2", "frame-1")
      .set("frame-3", "frame-1")
      .set("frame-4", "frame-2");

    const childrenOfRoot = listChildrenOf(parents, "frame-1");
    expect(childrenOfRoot).toEqual(["frame-2", "frame-3"]);

    // A leaf frame has no children at all.
    const childrenOfLeaf = listChildrenOf(parents, "frame-4");
    expect(childrenOfLeaf).toEqual([]);
  });
});


================================================
FILE: packages/core/tests/unit/snapshot-frame-merge.test.ts
================================================
import { describe, expect, it } from "vitest";
import type {
  FrameContext,
  FrameDomMaps,
} from "../../lib/v3/types/private/index.js";
import type { Page } from "../../lib/v3/understudy/page.js";
import { MockCDPSession } from "./helpers/mockCDPSession.js";
import {
  computeFramePrefixes,
  mergeFramesIntoSnapshot,
} from "../../lib/v3/understudy/a11y/snapshot/capture.js";

/**
 * Builds a minimal Page stand-in exposing only the two members these tests use.
 *
 * @param sessions - CDP sessions keyed by frame id; the `root` entry is the
 *   fallback for frame ids that have no entry of their own.
 * @returns An object cast to Page with `getSessionForFrame` and `getOrdinal`.
 */
const makePage = (sessions: Record<string, MockCDPSession>): Page => {
  const stub = {
    getSessionForFrame(frameId: string) {
      return sessions[frameId] ?? sessions.root;
    },
    // Fixed ordinals: frame-1 -> 0, frame-2 -> 1, any other frame -> 2.
    getOrdinal(frameId: string) {
      switch (frameId) {
        case "frame-1":
          return 0;
        case "frame-2":
          return 1;
        default:
          return 2;
      }
    },
  };
  return stub as unknown as Page;
};

describe("computeFramePrefixes", () => {
  it("derives prefixes from parent iframe xpaths within the same session", async () => {
    // A single session serves every frame and reports backend node 200 as the frame owner.
    const sharedSession = new MockCDPSession({
      "DOM.getFrameOwner": async () => ({ backendNodeId: 200 }),
    });
    const page = makePage({
      "frame-1": sharedSession,
      "frame-2": sharedSession,
      root: sharedSession,
    });

    // Only the parent frame carries DOM maps; its "0-200" entry is the iframe
    // host whose xpath should become frame-2's prefix.
    const rootMaps: FrameDomMaps = {
      tagNameMap: {},
      scrollableMap: {},
      urlMap: {},
      xpathMap: { "0-200": "/html[1]/body[1]/iframe[1]" },
    };
    const domMapsByFrame = new Map<string, FrameDomMaps>([
      ["frame-1", rootMaps],
    ]);

    const frameTree: FrameContext = {
      rootId: "frame-1",
      frames: ["frame-1", "frame-2"],
      parentByFrame: new Map([
        ["frame-1", null],
        ["frame-2", "frame-1"],
      ]),
    };

    const prefixes = await computeFramePrefixes(
      page,
      frameTree,
      domMapsByFrame,
      frameTree.frames,
    );

    // Root keeps an empty prefix; the child picks up its host iframe's xpath.
    expect(prefixes.absPrefix.get("frame-1")).toBe("");
    expect(prefixes.absPrefix.get("frame-2")).toBe(
      "/html[1]/body[1]/iframe[1]",
    );
    expect(prefixes.iframeHostEncByChild.get("frame-2")).toBe("0-200");
  });

  it("inherits the parent prefix when frame owner lookups fail (OOPIF)", async () => {
    // Owner lookup succeeds for frame-2, throws for frame-3, and yields nothing otherwise.
    const sharedSession = new MockCDPSession({
      "DOM.getFrameOwner": async (params) => {
        switch (params?.frameId) {
          case "frame-2":
            return { backendNodeId: 200 };
          case "frame-3":
            throw new Error("unavailable");
          default:
            return {};
        }
      },
    });
    const page = makePage({
      "frame-1": sharedSession,
      "frame-2": sharedSession,
      "frame-3": sharedSession,
      root: sharedSession,
    });

    const rootMaps: FrameDomMaps = {
      tagNameMap: {},
      scrollableMap: {},
      urlMap: {},
      xpathMap: { "0-200": "/iframe[1]" },
    };
    const middleMaps: FrameDomMaps = {
      tagNameMap: {},
      scrollableMap: {},
      urlMap: {},
      xpathMap: { "1-300": "/div[1]/iframe[1]" },
    };
    const domMapsByFrame = new Map<string, FrameDomMaps>([
      ["frame-1", rootMaps],
      ["frame-2", middleMaps],
    ]);

    // Three-level chain: frame-1 -> frame-2 -> frame-3.
    const frameTree: FrameContext = {
      rootId: "frame-1",
      frames: ["frame-1", "frame-2", "frame-3"],
      parentByFrame: new Map([
        ["frame-1", null],
        ["frame-2", "frame-1"],
        ["frame-3", "frame-2"],
      ]),
    };

    const { absPrefix } = await computeFramePrefixes(
      page,
      frameTree,
      domMapsByFrame,
      frameTree.frames,
    );

    expect(absPrefix.get("frame-2")).toBe("/iframe[1]");
    // The failed lookup leaves frame-3 with exactly its parent's prefix.
    expect(absPrefix.get("frame-3")).toBe("/iframe[1]");
  });

  it("inherits parent prefix when iframe xpath mapping is missing", async () => {
    // The owner lookup succeeds (backend node 999), but the parent's xpathMap
    // below has no entry for that node.
    const session = new MockCDPSession({
      "DOM.getFrameOwner": async () => ({ backendNodeId: 999 }),
    });
    const page = makePage({
      "frame-1": session,
      "frame-2": session,
      root: session,
    });

    const perFrameMaps = new Map<string, FrameDomMaps>([
      [
        "frame-1",
        {
          tagNameMap: {},
          scrollableMap: {},
          urlMap: {},
          xpathMap: {},
        },
      ],
    ]);

    const context: FrameContext = {
      rootId: "frame-1",
      frames: ["frame-1", "frame-2"],
      parentByFrame: new Map([
        ["frame-1", null],
        ["frame-2", "frame-1"],
      ]),
    };

    // perFrameMaps is already declared as Map<string, FrameDomMaps>, so it is
    // passed as-is (no type assertion), matching the sibling tests.
    const result = await computeFramePrefixes(
      page,
      context,
      perFrameMaps,
      context.frames,
    );

    // With no host xpath to append, the child ends up with the root's empty prefix.
    expect(result.absPrefix.get("frame-2")).toBe("");
  });

  it("does not compute prefixes for frames excluded from the scope", async () => {
    const sharedSession = new MockCDPSession({
      "DOM.getFrameOwner": async () => ({ backendNodeId: 200 }),
    });
    const page = makePage({
      "frame-1": sharedSession,
      "frame-2": sharedSession,
      root: sharedSession,
    });

    const rootMaps: FrameDomMaps = {
      tagNameMap: {},
      scrollableMap: {},
      urlMap: {},
      xpathMap: { "0-200": "/iframe[1]" },
    };
    const domMapsByFrame = new Map<string, FrameDomMaps>([
      ["frame-1", rootMaps],
    ]);

    // frame-2 exists in the frame tree ...
    const frameTree: FrameContext = {
      rootId: "frame-1",
      frames: ["frame-1", "frame-2"],
      parentByFrame: new Map([
        ["frame-1", null],
        ["frame-2", "frame-1"],
      ]),
    };

    // ... but the requested scope names only the root frame.
    const scope = ["frame-1"];
    const prefixes = await computeFramePrefixes(
      page,
      frameTree,
      domMapsByFrame,
      scope,
    );

    expect(prefixes.absPrefix.has("frame-2")).toBe(false);
    expect(prefixes.iframeHostEncByChild.has("frame-2")).toBe(false);
  });
});

describe("mergeFramesIntoSnapshot", () => {
  it("merges root and child maps, prefixing child xpaths and injecting subtrees", () => {
    const frameTree: FrameContext = {
      rootId: "frame-1",
      frames: ["frame-1", "frame-2"],
      parentByFrame: new Map([
        ["frame-1", null],
        ["frame-2", "frame-1"],
      ]),
    };

    const rootMaps: FrameDomMaps = {
      tagNameMap: {},
      scrollableMap: {},
      urlMap: { "0-10": "https://example.com" },
      xpathMap: { "0-10": "/html[1]/body[1]" },
    };
    // Child xpaths are relative to the child's own document.
    const childMaps: FrameDomMaps = {
      tagNameMap: {},
      scrollableMap: {},
      urlMap: { "1-20": "https://child.com" },
      xpathMap: { "1-20": "/div[1]/span[1]" },
    };
    const domMapsByFrame = new Map<string, FrameDomMaps>([
      ["frame-1", rootMaps],
      ["frame-2", childMaps],
    ]);

    // The root outline contains the "[0-200] iframe" line that hosts frame-2.
    const outlines = [
      { frameId: "frame-1", outline: "[0-10] body\n  [0-200] iframe" },
      { frameId: "frame-2", outline: "[1-20] child" },
    ];

    const prefixByFrame = new Map<string, string>([
      ["frame-1", ""],
      ["frame-2", "/html[1]/body[1]/iframe[1]"],
    ]);
    const hostIdByChild = new Map<string, string>([["frame-2", "0-200"]]);

    const { combinedXpathMap, combinedUrlMap, combinedTree } =
      mergeFramesIntoSnapshot(
        frameTree,
        domMapsByFrame,
        outlines,
        prefixByFrame,
        hostIdByChild,
        frameTree.frames,
      );

    // Root entries pass through untouched; child entries gain the iframe prefix.
    expect(combinedXpathMap["0-10"]).toBe("/html[1]/body[1]");
    expect(combinedXpathMap["1-20"]).toBe(
      "/html[1]/body[1]/iframe[1]/div[1]/span[1]",
    );
    expect(combinedUrlMap["1-20"]).toBe("https://child.com");
    expect(combinedTree).toContain("[1-20] child");
  });

  it("skips frames without maps and handles missing iframe mappings", () => {
    const frameTree: FrameContext = {
      rootId: "frame-1",
      frames: ["frame-1", "frame-2"],
      parentByFrame: new Map([
        ["frame-1", null],
        ["frame-2", "frame-1"],
      ]),
    };

    // frame-2 has an outline and a prefix, but neither DOM maps nor an iframe host entry.
    const rootMaps: FrameDomMaps = {
      tagNameMap: {},
      scrollableMap: {},
      urlMap: {},
      xpathMap: { "0-10": "/html[1]" },
    };
    const domMapsByFrame = new Map<string, FrameDomMaps>([
      ["frame-1", rootMaps],
    ]);

    const outlines = [
      { frameId: "frame-1", outline: "[0-10] html" },
      { frameId: "frame-2", outline: "[1-20] orphan" },
    ];

    const prefixByFrame = new Map<string, string>([
      ["frame-1", ""],
      ["frame-2", "/missing"],
    ]);
    const noHosts = new Map<string, string>();

    const merged = mergeFramesIntoSnapshot(
      frameTree,
      domMapsByFrame,
      outlines,
      prefixByFrame,
      noHosts,
      frameTree.frames,
    );

    // Nothing from the orphan frame reaches the merged xpath map or tree.
    expect(merged.combinedXpathMap["1-20"]).toBeUndefined();
    expect(merged.combinedTree).toBe("[0-10] html");
  });

  it("falls back to first outline when root frame outline is missing", () => {
    const frameTree: FrameContext = {
      rootId: "frame-1",
      frames: ["frame-1", "frame-2"],
      parentByFrame: new Map([
        ["frame-1", null],
        ["frame-2", "frame-1"],
      ]),
    };

    // Only the child frame contributes maps and an outline; the root has neither.
    const childMaps: FrameDomMaps = {
      tagNameMap: {},
      scrollableMap: {},
      urlMap: {},
      xpathMap: {},
    };
    const domMapsByFrame = new Map<string, FrameDomMaps>([
      ["frame-2", childMaps],
    ]);
    const outlines = [{ frameId: "frame-2", outline: "[child] frame2" }];

    const prefixByFrame = new Map<string, string>([["frame-2", "/iframe[1]"]]);
    const noHosts = new Map<string, string>();

    const { combinedTree } = mergeFramesIntoSnapshot(
      frameTree,
      domMapsByFrame,
      outlines,
      prefixByFrame,
      noHosts,
      frameTree.frames,
    );

    expect(combinedTree).toBe("[child] frame2");
  });

  it("overwrites duplicate iframe host entries when multiple children map to the same parent", () => {
    // Two sibling frames hang off the same root.
    const frameTree: FrameContext = {
      rootId: "frame-1",
      frames: ["frame-1", "frame-2", "frame-3"],
      parentByFrame: new Map([
        ["frame-1", null],
        ["frame-2", "frame-1"],
        ["frame-3", "frame-1"],
      ]),
    };

    const rootMaps: FrameDomMaps = {
      tagNameMap: {},
      scrollableMap: {},
      urlMap: {},
      xpathMap: {},
    };
    const domMapsByFrame = new Map<string, FrameDomMaps>([
      ["frame-1", rootMaps],
    ]);

    const outlines = [
      { frameId: "frame-1", outline: "[root] frame1\n  [0-200] iframe slot" },
      { frameId: "frame-2", outline: "[child] frame2" },
      { frameId: "frame-3", outline: "[child] frame3" },
    ];

    const prefixByFrame = new Map<string, string>([
      ["frame-1", ""],
      ["frame-2", ""],
      ["frame-3", ""],
    ]);
    // Both children claim the same host slot "0-200".
    const hostIdByChild = new Map<string, string>([
      ["frame-2", "0-200"],
      ["frame-3", "0-200"],
    ]);

    const { combinedTree } = mergeFramesIntoSnapshot(
      frameTree,
      domMapsByFrame,
      outlines,
      prefixByFrame,
      hostIdByChild,
      frameTree.frames,
    );

    // The later child (frame-3) occupies the slot; frame-2's outline is dropped.
    expect(combinedTree).toContain("[child] frame3");
    expect(combinedTree).not.toContain("[child] frame2");
  });

  it("only merges xpath and url maps for frames included in frameIds", () => {
    const frameTree: FrameContext = {
      rootId: "frame-1",
      frames: ["frame-1", "frame-2"],
      parentByFrame: new Map([
        ["frame-1", null],
        ["frame-2", "frame-1"],
      ]),
    };

    const rootMaps: FrameDomMaps = {
      tagNameMap: {},
      scrollableMap: {},
      urlMap: { "0-10": "https://root.test" },
      xpathMap: { "0-10": "/html[1]" },
    };
    // Maps exist for frame-2, yet it is left out of the frameIds argument below.
    const childMaps: FrameDomMaps = {
      tagNameMap: {},
      scrollableMap: {},
      urlMap: { "1-20": "https://child.test" },
      xpathMap: { "1-20": "/div[1]" },
    };
    const domMapsByFrame = new Map<string, FrameDomMaps>([
      ["frame-1", rootMaps],
      ["frame-2", childMaps],
    ]);

    const outlines = [{ frameId: "frame-1", outline: "[root] doc" }];
    const prefixByFrame = new Map<string, string>([["frame-1", ""]]);
    const noHosts = new Map<string, string>();
    const includedFrames = ["frame-1"];

    const { combinedXpathMap, perFrame } = mergeFramesIntoSnapshot(
      frameTree,
      domMapsByFrame,
      outlines,
      prefixByFrame,
      noHosts,
      includedFrames,
    );

    expect(combinedXpathMap["0-10"]).toBe("/html[1]");
    expect(combinedXpathMap["1-20"]).toBeUndefined();
    expect(perFrame?.map((entry) => entry.frameId)).toEqual(["frame-1"]);
  });
});


================================================
FILE: packages/core/tests/unit/snapshot-tree-format-utils.test.ts
================================================
import { describe, expect, it } from "vitest";
import {
  cleanText,
  diffCombinedTrees,
  formatTreeLine,
  indentBlock,
  injectSubtrees,
  normaliseSpaces,
} from "../../lib/v3/understudy/a11y/snapshot/treeFormatUtils.js";

// formatTreeLine: rendering an accessibility node and its children as an outline.
describe("formatTreeLine", () => {
  it("includes encoded ids and indents children", () => {
    // The child has no encodedId, so its nodeId is what the expected outline shows.
    const submitButton = {
      role: "button",
      name: "Submit",
      nodeId: "ax-2",
    };
    // The parent has both ids; the expected outline shows the encodedId.
    const container = {
      role: "section",
      name: "Container",
      encodedId: "frame-1",
      nodeId: "ax-1",
      children: [submitButton],
    };

    const rendered = formatTreeLine(container);

    expect(rendered).toBe(
      "[frame-1] section: Container\n  [ax-2] button: Submit",
    );
  });
});

// injectSubtrees: splicing child-frame outlines beneath their iframe host lines.
describe("injectSubtrees", () => {
  it("nests child outlines under iframe encoded ids", () => {
    const rootOutline = `[root] document\n  [iframe-1] iframe\n  [leaf] item`;
    const iframeOutline = `[child-root] child\n  [nested-frame] iframe`;
    const nestedOutline = `[nested-leaf] nested`;

    // The injected outline itself contains another host id, so nesting is two levels deep.
    const subtreesByHost = new Map<string, string>([
      ["iframe-1", iframeOutline],
      ["nested-frame", nestedOutline],
    ]);

    const merged = injectSubtrees(rootOutline, subtreesByHost);

    expect(merged).toBe(
      `[root] document
  [iframe-1] iframe
    [child-root] child
      [nested-frame] iframe
        [nested-leaf] nested
  [leaf] item`,
    );
  });

  it("injects child outline only once when the same id repeats", () => {
    const rootOutline = `[root] document
  [iframe-1] iframe
  [iframe-1] iframe`;
    const iframeOutline = `[child-root] child`;
    const subtreesByHost = new Map<string, string>([
      ["iframe-1", iframeOutline],
    ]);

    const merged = injectSubtrees(rootOutline, subtreesByHost);

    // Only the first occurrence of the host line receives the subtree.
    expect(merged).toBe(
      `[root] document
  [iframe-1] iframe
    [child-root] child
  [iframe-1] iframe`,
    );
  });

  it("returns the original outline when no encoded ids are matched", () => {
    const outline = `[root] document\n  [leaf] item`;
    const unrelated = new Map<string, string>([["other", "[x] child"]]);

    const merged = injectSubtrees(outline, unrelated);
    expect(merged).toBe(outline);
  });
});

// indentBlock: per-line indentation of a multi-line string.
describe("indentBlock", () => {
  it("prefixes each line with the provided indent", () => {
    const indent = "  ";

    const indented = indentBlock("a\nb", indent);
    expect(indented).toBe("  a\n  b");

    // An empty block stays empty rather than becoming a lone indent.
    const indentedEmpty = indentBlock("", indent);
    expect(indentedEmpty).toBe("");
  });
});

// diffCombinedTrees: reports lines present in the newer outline but not the older one.
describe("diffCombinedTrees", () => {
  it("returns newly-added lines relative to previous outline", () => {
    const before = `[root] document\n  [child] a`;
    const after = `[root] document\n  [child] a\n  [child-2] b`;

    const added = diffCombinedTrees(before, after);
    expect(added).toBe("[child-2] b");
  });

  it("normalizes indentation for added lines with stray spaces", () => {
    // Same shape as above, but with deeper indentation on every nested line.
    const before = `[root] document\n    [child] a`;
    const after = `[root] document\n    [child] a\n        [child-2] b`;

    const added = diffCombinedTrees(before, after);
    expect(added).toBe("[child-2] b");
  });
});

// cleanText: sanitising text that contains NBSP and private-use code points.
describe("cleanText", () => {
  it("removes NBSP and private-use characters while collapsing spaces", () => {
    // Two NBSPs between the words, then a private-use character before " !".
    const raw = `Hello\u00A0\u00A0world\uE000 !`;

    const cleaned = cleanText(raw);
    expect(cleaned).toBe("Hello world !");
  });
});

// normaliseSpaces: collapsing runs of spaces, tabs and newlines.
describe("normaliseSpaces", () => {
  it("replaces whitespace runs with a single space", () => {
    const collapsed = normaliseSpaces("a   b\tc\nd");
    expect(collapsed).toBe("a b c d");
  });
});


================================================
FILE: packages/core/tests/unit/snapshot-xpath-utils.test.ts
================================================
import type { Protocol } from "devtools-protocol";
import { describe, expect, it } from "vitest";
import {
  buildChildXPathSegments,
  joinXPath,
  normalizeXPath,
  prefixXPath,
} from "../../lib/v3/understudy/a11y/snapshot/xpathUtils.js";
import { relativizeXPath } from "../../lib/v3/understudy/a11y/snapshot/domTree.js";

// prefixXPath: prepending a parent XPath to a child XPath.
describe("prefixXPath", () => {
  it("treats root prefixes as no-op", () => {
    // With "/" as the prefix, the child path must come back unchanged.
    for (const child of ["/div[1]", "//div[1]"]) {
      expect(prefixXPath("/", child)).toBe(child);
    }
  });

  it("handles descendant hops and blank children", () => {
    const cases: ReadonlyArray<readonly [string, string, string]> = [
      ["/html/body", "//slot[1]", "/html/body//slot[1]"],
      ["/html/body", "/", "/html/body"],
      ["/html/body/", "", "/html/body"],
    ];

    for (const [prefix, child, expected] of cases) {
      expect(prefixXPath(prefix, child)).toBe(expected);
    }
  });
});

// normalizeXPath: canonicalising user-supplied XPath strings.
describe("normalizeXPath", () => {
  it("strips prefixes, trims whitespace, and enforces absolute roots", () => {
    const cases: ReadonlyArray<readonly [string, string]> = [
      ["   xpath=/html/body/ ", "/html/body"],
      ["div/span", "/div/span"],
      ["", ""],
    ];

    for (const [input, normalized] of cases) {
      expect(normalizeXPath(input)).toBe(normalized);
    }

    // Omitting the argument entirely yields the empty string as well.
    expect(normalizeXPath()).toBe("");
  });
});

// relativizeXPath: expressing an absolute XPath relative to a base document path.
describe("relativizeXPath", () => {
  const base = "/html/body";

  it("returns '/' when paths match exactly", () => {
    const relative = relativizeXPath(base, "/html/body");
    expect(relative).toBe("/");
  });

  it("omits duplicate prefixes and preserves descendant hops", () => {
    const childHop = relativizeXPath(base, "/html/body/div[2]");
    expect(childHop).toBe("/div[2]");

    // The "//" hop after the base must survive relativisation.
    const descendantHop = relativizeXPath(base, "/html/body//shadow-root[1]");
    expect(descendantHop).toBe("//shadow-root[1]");
  });

  it("falls back to absolute paths outside of the base document", () => {
    const outsideBase = relativizeXPath(base, "/head");
    expect(outsideBase).toBe("/head");

    const rootBase = relativizeXPath("/", "/html/body");
    expect(rootBase).toBe("/html/body");
  });
});

// buildChildXPathSegments: positional XPath steps for a list of sibling nodes.
describe("buildChildXPathSegments", () => {
  it("produces positional selectors for each node type", () => {
    // Minimal Protocol.DOM.Node factory. nodeType and nodeName are spread last,
    // so an override can never replace them.
    function domNode(
      nodeType: number,
      nodeName: string,
      override?: Partial<Protocol.DOM.Node>,
    ): Protocol.DOM.Node {
      return {
        nodeId: 1,
        backendNodeId: 1,
        localName: nodeName.toLowerCase(),
        nodeValue: "",
        ...override,
        nodeType,
        nodeName,
      };
    }

    // Two same-named elements, one namespaced element, one text node, one comment node.
    const siblings: Protocol.DOM.Node[] = [
      domNode(1, "DIV"),
      domNode(1, "DIV"),
      domNode(1, "svg:path"),
      domNode(3, "#text"),
      domNode(8, "#comment"),
    ];

    const segments = buildChildXPathSegments(siblings);

    expect(segments).toEqual([
      "div[1]",
      "div[2]",
      "*[name()='svg:path'][1]",
      "text()[1]",
      "comment()[1]",
    ]);
  });
});

// joinXPath: appending a single step to a base XPath.
describe("joinXPath", () => {
  it("joins base and steps while preserving special hops", () => {
    // Each row is [base, step, expected result].
    const cases: ReadonlyArray<readonly [string, string, string]> = [
      ["", "div[1]", "/div[1]"],
      ["/", "span[1]", "/span[1]"],
      ["/html/body", "//", "/html/body//"],
      ["/html//", "slot[1]", "/html//slot[1]"],
      ["/html/body", "", "/html/body"],
    ];

    for (const [base, step, expected] of cases) {
      expect(joinXPath(base, step)).toBe(expected);
    }
  });
});


================================================
FILE: packages/core/tests/unit/timeout-handlers.test.ts
================================================
import { beforeEach, describe, expect, it, vi } from "vitest";
import { ActHandler } from "../../lib/v3/handlers/actHandler.js";
import { ExtractHandler } from "../../lib/v3/handlers/extractHandler.js";
import { ObserveHandler } from "../../lib/v3/handlers/observeHandler.js";
import type { Page } from "../../lib/v3/understudy/page.js";
import type { ClientOptions } from "../../lib/v3/types/public/model.js";
import type { LLMClient } from "../../lib/v3/llm/LLMClient.js";
import { createTimeoutGuard } from "../../lib/v3/handlers/handlerUtils/timeoutGuard.js";
import { waitForDomNetworkQuiet } from "../../lib/v3/handlers/handlerUtils/actHandlerUtils.js";
import { captureHybridSnapshot } from "../../lib/v3/understudy/a11y/snapshot/index.js";
import {
  ActTimeoutError,
  ExtractTimeoutError,
  ObserveTimeoutError,
} from "../../lib/v3/types/public/sdkErrors.js";
import {
  act as actInference,
  extract as extractInference,
  observe as observeInference,
} from "../../lib/inference.js";
import { V3FunctionName } from "../../lib/v3/types/public/methods.js";

// Module mocks for the handler collaborators. Each factory swaps the module's
// exports for bare vi.fn() stubs that individual tests then configure through
// vi.mocked(...).
// NOTE(review): these specifiers omit the ".js" suffix that the import
// statements in this file use — presumably both forms resolve to the same
// modules; confirm if a mock ever fails to apply.

// Timeout guard factory: tests install guards that throw after N checks.
vi.mock("../../lib/v3/handlers/handlerUtils/timeoutGuard", () => ({
  createTimeoutGuard: vi.fn(),
}));

// Act helpers: DOM/network settling and the action executor.
vi.mock("../../lib/v3/handlers/handlerUtils/actHandlerUtils", () => ({
  waitForDomNetworkQuiet: vi.fn(),
  performUnderstudyMethod: vi.fn(),
}));

// Snapshot capture and tree diffing.
vi.mock("../../lib/v3/understudy/a11y/snapshot", () => ({
  captureHybridSnapshot: vi.fn(),
  diffCombinedTrees: vi.fn(),
}));

// LLM inference entry points for act / extract / observe.
vi.mock("../../lib/inference", () => ({
  act: vi.fn(),
  extract: vi.fn(),
  observe: vi.fn(),
}));

describe("ActHandler timeout guard", () => {
  beforeEach(() => {
    vi.clearAllMocks();
  });

  it("throws ActTimeoutError when timeout expires before snapshot", async () => {
    const domQuietMock = vi.mocked(waitForDomNetworkQuiet);
    domQuietMock.mockResolvedValue(undefined);

    const snapshotMock = vi.mocked(captureHybridSnapshot);
    snapshotMock.mockResolvedValue({
      combinedTree: "",
      combinedXpathMap: {},
      combinedUrlMap: {},
    });

    // Every guard tolerates a single check; its second check raises the timeout.
    vi.mocked(createTimeoutGuard).mockImplementation(
      (timeoutMs, errorFactory) => {
        let checks = 0;
        return vi.fn(() => {
          checks += 1;
          if (checks < 2) {
            return;
          }
          throw errorFactory
            ? errorFactory(timeoutMs!)
            : new ActTimeoutError(timeoutMs!);
        });
      },
    );

    const handler = buildActHandler();
    const page = {
      mainFrame: vi.fn().mockReturnValue({}),
    } as unknown as Page;

    const outcome = handler.act({
      instruction: "do something",
      page,
      timeout: 5,
    });
    await expect(outcome).rejects.toThrow(ActTimeoutError);

    // The helper that precedes the timeout ran exactly once ...
    expect(domQuietMock).toHaveBeenCalledTimes(1);
    // ... while the snapshot, which comes after the failing check, never started.
    expect(snapshotMock).not.toHaveBeenCalled();
  });

  it("throws ActTimeoutError when timeout expires before LLM call", async () => {
    const domQuietMock = vi.mocked(waitForDomNetworkQuiet);
    domQuietMock.mockResolvedValue(undefined);

    const snapshotMock = vi.mocked(captureHybridSnapshot);
    snapshotMock.mockResolvedValue({
      combinedTree: "tree content",
      combinedXpathMap: {},
      combinedUrlMap: {},
    });

    const inferenceMock = vi.mocked(actInference);

    // Two checks pass; the third (after the snapshot, before the LLM) raises the timeout.
    vi.mocked(createTimeoutGuard).mockImplementation(
      (timeoutMs, errorFactory) => {
        let checks = 0;
        return vi.fn(() => {
          checks += 1;
          if (checks < 3) {
            return;
          }
          throw errorFactory
            ? errorFactory(timeoutMs!)
            : new ActTimeoutError(timeoutMs!);
        });
      },
    );

    const handler = buildActHandler();
    const page = {
      mainFrame: vi.fn().mockReturnValue({}),
    } as unknown as Page;

    const outcome = handler.act({
      instruction: "do something",
      page,
      timeout: 5,
    });
    await expect(outcome).rejects.toThrow(ActTimeoutError);

    // The snapshot was taken once before the timeout fired ...
    expect(snapshotMock).toHaveBeenCalledTimes(1);
    // ... and inference was never reached.
    expect(inferenceMock).not.toHaveBeenCalled();
  });

  it("throws ActTimeoutError with correct message format", async () => {
    const waitForDomNetworkQuietMock = vi.mocked(waitForDomNetworkQuiet);
    waitForDomNetworkQuietMock.mockResolvedValue(undefined);

    const timeoutMs = 100;

    // Every guard check throws immediately, so act() is expected to fail at
    // its first timeout check.
    vi.mocked(createTimeoutGuard).mockImplementation((ms, errorFactory) => {
      return vi.fn(() => {
        throw errorFactory ? errorFactory(ms!) : new ActTimeoutError(ms!);
      });
    });

    const handler = buildActHandler();
    const fakePage = {
      mainFrame: vi.fn().mockReturnValue({}),
    } as unknown as Page;

    // Capture the rejection first and assert afterwards. Keeping the
    // assertions outside the catch means they always run, and a call that
    // unexpectedly resolves fails on the instanceof check below instead of
    // being masked by a sentinel error thrown into the same catch.
    let caught: unknown;
    try {
      await handler.act({
        instruction: "do something",
        page: fakePage,
        timeout: timeoutMs,
      });
    } catch (error) {
      caught = error;
    }

    expect(caught).toBeInstanceOf(ActTimeoutError);
    // Safe after the instanceof assertion above.
    const timeoutError = caught as ActTimeoutError;
    expect(timeoutError.message).toContain("act()");
    expect(timeoutError.message).toContain(`${timeoutMs}ms`);
    expect(timeoutError.name).toBe("ActTimeoutError");
  });
});

// Two-step act flow: the first inference result carries `twoStep: true`, and
// the timeout guard is rigged to fire once step 1 has finished, so neither a
// second inference call nor a second action may happen.
describe("ActHandler two-step timeout", () => {
  beforeEach(() => {
    // Start every test with clean call records on all mocks.
    vi.clearAllMocks();
  });

  it("throws ActTimeoutError during step 2; step 2 action does not run", async () => {
    const waitForDomNetworkQuietMock = vi.mocked(waitForDomNetworkQuiet);
    waitForDomNetworkQuietMock.mockResolvedValue(undefined);

    // The snapshot maps element id "1-0" to an xpath so step 1's element resolves.
    const captureHybridSnapshotMock = vi.mocked(captureHybridSnapshot);
    captureHybridSnapshotMock.mockResolvedValue({
      combinedTree: "tree content",
      combinedXpathMap: { "1-0": "/html/body/button" },
      combinedUrlMap: {},
    });

    // performUnderstudyMethod is not among the static imports of this file, so
    // it is pulled from the (mocked) module dynamically.
    const { performUnderstudyMethod } = await import(
      "../../lib/v3/handlers/handlerUtils/actHandlerUtils.js"
    );
    const performUnderstudyMethodMock = vi.mocked(performUnderstudyMethod);
    performUnderstudyMethodMock.mockResolvedValue(undefined);

    const actInferenceMock = vi.mocked(actInference);
    // First call returns a two-step action
    actInferenceMock.mockResolvedValueOnce({
      element: {
        elementId: "1-0",
        description: "click button",
        method: "click",
        arguments: [],
      },
      twoStep: true,
      prompt_tokens: 100,
      completion_tokens: 50,
      inference_time_ms: 500,
      // Cast to the resolved value type of actInference's returned promise.
    } as ReturnType<typeof actInference> extends Promise<infer T> ? T : never);

    const diffCombinedTreesMock = vi.mocked(
      (await import("../../lib/v3/understudy/a11y/snapshot/index.js"))
        .diffCombinedTrees,
    );
    diffCombinedTreesMock.mockReturnValue("diff tree");

    // Timeout fires after step 1 completes, during step 2 snapshot
    // ensureTimeRemaining calls: 1=before wait, 2=after wait/before snap1, 3=before LLM1,
    // 4=before action1, 5=inside takeDeterministicAction, 6=performUnderstudy,
    // 7=before snap2 (this one should throw)
    // The counter lives outside the factory, so it is shared by every guard
    // createTimeoutGuard hands out during this test.
    let callCount = 0;
    vi.mocked(createTimeoutGuard).mockImplementation(
      (timeoutMs, errorFactory) => {
        return vi.fn(() => {
          callCount += 1;
          if (callCount >= 7) {
            throw errorFactory
              ? errorFactory(timeoutMs!)
              : new ActTimeoutError(timeoutMs!);
          }
        });
      },
    );

    const handler = buildActHandler();
    const fakePage = {
      mainFrame: vi.fn().mockReturnValue({}),
    } as unknown as Page;

    await expect(
      handler.act({
        instruction: "click then type",
        page: fakePage,
        timeout: 50,
      }),
    ).rejects.toThrow(ActTimeoutError);

    // Step 1 action should have been executed
    expect(performUnderstudyMethodMock).toHaveBeenCalledTimes(1);
    // Step 2 LLM call should NOT have happened
    expect(actInferenceMock).toHaveBeenCalledTimes(1);
  });
});

describe("ActHandler self-heal timeout", () => {
  /** Resolved payload of actInference, unwrapped from its Promise. */
  type ActInferenceResult =
    ReturnType<typeof actInference> extends Promise<infer T> ? T : never;

  beforeEach(() => {
    vi.clearAllMocks();
  });

  /** Minimal page double: only mainFrame() is stubbed. */
  const makeFakePage = (): Page =>
    ({
      mainFrame: vi.fn().mockReturnValue({}),
    }) as unknown as Page;

  /** Builds a fresh single-step "click" inference result for element "1-0". */
  const makeClickInference = (): ActInferenceResult =>
    ({
      element: {
        elementId: "1-0",
        description: "click button",
        method: "click",
        arguments: [],
      },
      twoStep: false,
      prompt_tokens: 100,
      completion_tokens: 50,
      inference_time_ms: 500,
    }) as ActInferenceResult;

  /**
   * Stubs DOM settling and the snapshot, and makes the first
   * performUnderstudyMethod call reject so the handler enters self-heal.
   * Returns the mocks the tests assert against.
   */
  const primeFailingFirstAction = async () => {
    vi.mocked(waitForDomNetworkQuiet).mockResolvedValue(undefined);

    const snapshotMock = vi.mocked(captureHybridSnapshot);
    snapshotMock.mockResolvedValue({
      combinedTree: "tree content",
      combinedXpathMap: { "1-0": "/html/body/button" },
      combinedUrlMap: {},
    });

    const actUtils = await import(
      "../../lib/v3/handlers/handlerUtils/actHandlerUtils.js"
    );
    const performMock = vi.mocked(actUtils.performUnderstudyMethod);
    // First call fails, triggering self-heal
    performMock.mockRejectedValueOnce(new Error("Element not found"));

    return { snapshotMock, performMock };
  };

  /**
   * Installs a createTimeoutGuard mock whose guards share ONE counter:
   * every guard check (from any guard created afterwards) increments it,
   * and checks numbered `firstFailingCall` or later throw.
   */
  const armSharedGuard = (firstFailingCall: number): void => {
    let totalChecks = 0;
    vi.mocked(createTimeoutGuard).mockImplementation(
      (timeoutMs, errorFactory) =>
        vi.fn(() => {
          totalChecks += 1;
          if (totalChecks < firstFailingCall) {
            return;
          }
          throw errorFactory
            ? errorFactory(timeoutMs!)
            : new ActTimeoutError(timeoutMs!);
        }),
    );
  };

  /** Runs act("click button") with self-heal enabled and a 50ms timeout. */
  const actWithSelfHeal = () => {
    const handler = buildActHandler({ selfHeal: true });
    return handler.act({
      instruction: "click button",
      page: makeFakePage(),
      timeout: 50,
    });
  };

  it("throws ActTimeoutError during self-heal snapshot; no retry action executes", async () => {
    const { snapshotMock, performMock } = await primeFailingFirstAction();

    const inferenceMock = vi.mocked(actInference);
    inferenceMock.mockResolvedValue(makeClickInference());

    // Timeout during self-heal snapshot (guard check 7 or later)
    armSharedGuard(7);

    await expect(actWithSelfHeal()).rejects.toThrow(ActTimeoutError);

    // The initial action was attempted exactly once
    expect(performMock).toHaveBeenCalledTimes(1);
    // Only the initial LLM call happened
    expect(inferenceMock).toHaveBeenCalledTimes(1);
    // A snapshot capture was invoked
    expect(snapshotMock).toHaveBeenCalled();
  });

  it("throws ActTimeoutError during self-heal LLM inference; no retry action executes", async () => {
    const { snapshotMock } = await primeFailingFirstAction();

    const inferenceMock = vi.mocked(actInference);
    inferenceMock.mockResolvedValueOnce(makeClickInference());

    // Timeout during self-heal LLM inference (guard check 8)
    armSharedGuard(8);

    await expect(actWithSelfHeal()).rejects.toThrow(ActTimeoutError);

    // Initial snapshot plus the self-heal snapshot
    expect(snapshotMock).toHaveBeenCalledTimes(2);
    // Only one LLM inference (the retry inference was aborted by timeout)
    expect(inferenceMock).toHaveBeenCalledTimes(1);
  });
});

describe("ExtractHandler timeout guard", () => {
  beforeEach(() => {
    vi.clearAllMocks();
  });

  /** Minimal page double: only mainFrame() is stubbed. */
  const makeFakePage = (): Page =>
    ({
      mainFrame: vi.fn().mockReturnValue({}),
    }) as unknown as Page;

  /** Makes captureHybridSnapshot resolve to a snapshot with empty maps. */
  const stubEmptySnapshot = () => {
    const snapshotMock = vi.mocked(captureHybridSnapshot);
    snapshotMock.mockResolvedValue({
      combinedTree: "tree content",
      combinedXpathMap: {},
      combinedUrlMap: {},
    });
    return snapshotMock;
  };

  /**
   * Installs a createTimeoutGuard mock where each created guard keeps its
   * own counter and throws from its `firstFailingCall`-th check onwards.
   * A threshold of 1 therefore throws on every check.
   */
  const expireGuardFromCall = (firstFailingCall: number): void => {
    vi.mocked(createTimeoutGuard).mockImplementation(
      (timeoutMs, errorFactory) => {
        let checks = 0;
        return vi.fn(() => {
          checks += 1;
          if (checks < firstFailingCall) {
            return;
          }
          throw errorFactory
            ? errorFactory(timeoutMs!)
            : new ExtractTimeoutError(timeoutMs!);
        });
      },
    );
  };

  it("throws ExtractTimeoutError when timeout expires before snapshot", async () => {
    const snapshotMock = stubEmptySnapshot();
    const inferenceMock = vi.mocked(extractInference);

    // Throw immediately on first call
    expireGuardFromCall(1);

    const handler = buildExtractHandler();
    const pending = handler.extract({
      instruction: "extract title",
      page: makeFakePage(),
      timeout: 5,
    });
    await expect(pending).rejects.toThrow(ExtractTimeoutError);

    // Neither the snapshot nor the LLM inference was reached
    expect(snapshotMock).not.toHaveBeenCalled();
    expect(inferenceMock).not.toHaveBeenCalled();
  });

  it("throws ExtractTimeoutError when timeout expires before LLM call", async () => {
    const snapshotMock = stubEmptySnapshot();
    const inferenceMock = vi.mocked(extractInference);

    // Throw on call #2 (after snapshot but before LLM)
    expireGuardFromCall(2);

    const handler = buildExtractHandler();
    const pending = handler.extract({
      instruction: "extract title",
      page: makeFakePage(),
      timeout: 5,
    });
    await expect(pending).rejects.toThrow(ExtractTimeoutError);

    // The snapshot ran once; the LLM inference never started
    expect(snapshotMock).toHaveBeenCalledTimes(1);
    expect(inferenceMock).not.toHaveBeenCalled();
  });

  it("throws ExtractTimeoutError with correct message format", async () => {
    const timeoutMs = 200;

    expireGuardFromCall(1);

    const handler = buildExtractHandler();
    const page = makeFakePage();

    try {
      await handler.extract({
        instruction: "extract title",
        page,
        timeout: timeoutMs,
      });
      // Reaching this line means no timeout error was raised; the sentinel
      // below is caught and fails the instance check.
      throw new Error("Expected ExtractTimeoutError to be thrown");
    } catch (error) {
      expect(error).toBeInstanceOf(ExtractTimeoutError);
      const timeoutError = error as ExtractTimeoutError;
      expect(timeoutError.message).toContain("extract()");
      expect(timeoutError.message).toContain(`${timeoutMs}ms`);
      expect(timeoutError.name).toBe("ExtractTimeoutError");
    }
  });

  it("stops LLM and post-processing when timeout expires", async () => {
    vi.mocked(captureHybridSnapshot).mockResolvedValue({
      combinedTree: "tree content",
      combinedXpathMap: {},
      combinedUrlMap: { "1-0": "https://example.com" },
    });
    const inferenceMock = vi.mocked(extractInference);

    // Allow snapshot but timeout before LLM
    expireGuardFromCall(2);

    const handler = buildExtractHandler();
    const pending = handler.extract({
      instruction: "extract links",
      page: makeFakePage(),
      timeout: 5,
    });
    await expect(pending).rejects.toThrow(ExtractTimeoutError);

    // Post-processing (URL injection) never runs because LLM was never called
    expect(inferenceMock).not.toHaveBeenCalled();
  });
});

describe("ObserveHandler timeout guard", () => {
  beforeEach(() => {
    vi.clearAllMocks();
  });

  /** Minimal page double: only mainFrame() is stubbed. */
  const makeFakePage = (): Page =>
    ({
      mainFrame: vi.fn().mockReturnValue({}),
    }) as unknown as Page;

  /** Makes captureHybridSnapshot resolve to a snapshot with empty maps. */
  const stubEmptySnapshot = () => {
    const snapshotMock = vi.mocked(captureHybridSnapshot);
    snapshotMock.mockResolvedValue({
      combinedTree: "tree content",
      combinedXpathMap: {},
      combinedUrlMap: {},
    });
    return snapshotMock;
  };

  /**
   * Installs a createTimeoutGuard mock where each created guard keeps its
   * own counter and throws from its `firstFailingCall`-th check onwards.
   * A threshold of 1 therefore throws on every check.
   */
  const expireGuardFromCall = (firstFailingCall: number): void => {
    vi.mocked(createTimeoutGuard).mockImplementation(
      (timeoutMs, errorFactory) => {
        let checks = 0;
        return vi.fn(() => {
          checks += 1;
          if (checks < firstFailingCall) {
            return;
          }
          throw errorFactory
            ? errorFactory(timeoutMs!)
            : new ObserveTimeoutError(timeoutMs!);
        });
      },
    );
  };

  it("throws ObserveTimeoutError when timeout expires before snapshot", async () => {
    const snapshotMock = stubEmptySnapshot();
    const inferenceMock = vi.mocked(observeInference);

    // Throw immediately on first call
    expireGuardFromCall(1);

    const handler = buildObserveHandler();
    const pending = handler.observe({
      instruction: "find buttons",
      page: makeFakePage(),
      timeout: 5,
    });
    await expect(pending).rejects.toThrow(ObserveTimeoutError);

    // Neither the snapshot nor the LLM inference was reached
    expect(snapshotMock).not.toHaveBeenCalled();
    expect(inferenceMock).not.toHaveBeenCalled();
  });

  it("throws ObserveTimeoutError when timeout expires before LLM call", async () => {
    const snapshotMock = stubEmptySnapshot();
    const inferenceMock = vi.mocked(observeInference);

    // Throw on call #2 (after snapshot but before LLM)
    expireGuardFromCall(2);

    const handler = buildObserveHandler();
    const pending = handler.observe({
      instruction: "find buttons",
      page: makeFakePage(),
      timeout: 5,
    });
    await expect(pending).rejects.toThrow(ObserveTimeoutError);

    // The snapshot ran once; the LLM inference never started
    expect(snapshotMock).toHaveBeenCalledTimes(1);
    expect(inferenceMock).not.toHaveBeenCalled();
  });

  it("throws ObserveTimeoutError with correct message format", async () => {
    const timeoutMs = 150;

    expireGuardFromCall(1);

    const handler = buildObserveHandler();
    const page = makeFakePage();

    try {
      await handler.observe({
        instruction: "find buttons",
        page,
        timeout: timeoutMs,
      });
      // Reaching this line means no timeout error was raised; the sentinel
      // below is caught and fails the instance check.
      throw new Error("Expected ObserveTimeoutError to be thrown");
    } catch (error) {
      expect(error).toBeInstanceOf(ObserveTimeoutError);
      const timeoutError = error as ObserveTimeoutError;
      expect(timeoutError.message).toContain("observe()");
      expect(timeoutError.message).toContain(`${timeoutMs}ms`);
      expect(timeoutError.name).toBe("ObserveTimeoutError");
    }
  });

  it("aborts result processing when timeout expires", async () => {
    vi.mocked(captureHybridSnapshot).mockResolvedValue({
      combinedTree: "tree content",
      combinedXpathMap: { "1-0": "/html/body/button" },
      combinedUrlMap: {},
    });
    const inferenceMock = vi.mocked(observeInference);

    // Timeout before LLM call
    expireGuardFromCall(2);

    const handler = buildObserveHandler();
    const pending = handler.observe({
      instruction: "find all interactive elements",
      page: makeFakePage(),
      timeout: 5,
    });
    await expect(pending).rejects.toThrow(ObserveTimeoutError);

    // Result mapping/processing never happens
    expect(inferenceMock).not.toHaveBeenCalled();
  });
});

describe("No-timeout success paths", () => {
  /** Resolved payload of actInference, unwrapped from its Promise. */
  type ActInferenceResult =
    ReturnType<typeof actInference> extends Promise<infer T> ? T : never;

  beforeEach(() => {
    vi.clearAllMocks();
  });

  /** Minimal page double: only mainFrame() is stubbed. */
  const makeFakePage = (): Page =>
    ({
      mainFrame: vi.fn().mockReturnValue({}),
    }) as unknown as Page;

  /** Makes captureHybridSnapshot resolve to a tree with one button xpath. */
  const stubButtonSnapshot = (): void => {
    vi.mocked(captureHybridSnapshot).mockResolvedValue({
      combinedTree: "tree content",
      combinedXpathMap: { "1-0": "/html/body/button" },
      combinedUrlMap: {},
    });
  };

  /** Installs a createTimeoutGuard mock whose guards never throw. */
  const installNoopGuard = (): void => {
    vi.mocked(createTimeoutGuard).mockImplementation(() =>
      vi.fn(() => {
        // No-op - never throws
      }),
    );
  };

  /**
   * Installs a createTimeoutGuard mock that returns a throwing guard only
   * for a positive timeout; zero, negative or missing timeouts get a no-op.
   */
  const installPositiveOnlyGuard = (): void => {
    vi.mocked(createTimeoutGuard).mockImplementation((timeoutMs) => {
      if (timeoutMs && timeoutMs > 0) {
        return vi.fn(() => {
          throw new ActTimeoutError(timeoutMs);
        });
      }
      return vi.fn(() => {
        // No-op
      });
    });
  };

  /**
   * Stubs everything act() touches so the action succeeds: DOM settling,
   * snapshot, the understudy action itself, and the LLM inference result.
   */
  const primeSuccessfulAct = async (
    inference: ActInferenceResult,
  ): Promise<void> => {
    vi.mocked(waitForDomNetworkQuiet).mockResolvedValue(undefined);
    stubButtonSnapshot();

    const actUtils = await import(
      "../../lib/v3/handlers/handlerUtils/actHandlerUtils.js"
    );
    vi.mocked(actUtils.performUnderstudyMethod).mockResolvedValue(undefined);

    vi.mocked(actInference).mockResolvedValue(inference);
  };

  /** Shared body of the zero/negative timeout tests. */
  const expectActIgnoresTimeout = async (timeout: number): Promise<void> => {
    await primeSuccessfulAct({
      element: {
        elementId: "1-0",
        description: "click button",
        method: "click",
        arguments: [],
      },
      twoStep: false,
      prompt_tokens: 100,
      completion_tokens: 50,
      inference_time_ms: 500,
    } as ActInferenceResult);

    // When timeout is 0 or negative, the mocked guard is a no-op
    installPositiveOnlyGuard();

    const handler = buildActHandler();
    const result = await handler.act({
      instruction: "click button",
      page: makeFakePage(),
      timeout,
    });

    expect(result.success).toBe(true);
  };

  it("act() completes successfully without timeout and records metrics", async () => {
    await primeSuccessfulAct({
      element: {
        elementId: "1-0",
        description: "click button",
        method: "click",
        arguments: [],
      },
      twoStep: false,
      prompt_tokens: 100,
      completion_tokens: 50,
      reasoning_tokens: 10,
      cached_input_tokens: 5,
      inference_time_ms: 500,
    } as ActInferenceResult);

    installNoopGuard();

    const onMetrics = vi.fn();
    const handler = buildActHandler({ onMetrics });

    // No timeout specified
    const result = await handler.act({
      instruction: "click button",
      page: makeFakePage(),
    });

    expect(result.success).toBe(true);
    expect(onMetrics).toHaveBeenCalledWith(
      V3FunctionName.ACT,
      100,
      50,
      10,
      5,
      500,
    );
  });

  it("extract() completes successfully without timeout and records metrics", async () => {
    vi.mocked(captureHybridSnapshot).mockResolvedValue({
      combinedTree: "tree content",
      combinedXpathMap: {},
      combinedUrlMap: {},
    });

    vi.mocked(extractInference).mockResolvedValue({
      title: "Test Title",
      metadata: { completed: true, progress: "100%" },
      prompt_tokens: 200,
      completion_tokens: 100,
      reasoning_tokens: 20,
      cached_input_tokens: 10,
      inference_time_ms: 800,
    } as ReturnType<typeof extractInference> extends Promise<infer T>
      ? T
      : never);

    installNoopGuard();

    const onMetrics = vi.fn();
    const handler = buildExtractHandler({ onMetrics });

    // No timeout specified
    const result = await handler.extract({
      instruction: "extract title",
      page: makeFakePage(),
    });

    expect(result).toHaveProperty("title", "Test Title");
    expect(onMetrics).toHaveBeenCalledWith(
      V3FunctionName.EXTRACT,
      200,
      100,
      20,
      10,
      800,
    );
  });

  it("observe() completes successfully without timeout and records metrics", async () => {
    stubButtonSnapshot();

    vi.mocked(observeInference).mockResolvedValue({
      elements: [
        {
          elementId: "1-0",
          description: "Submit button",
        },
      ],
      prompt_tokens: 150,
      completion_tokens: 75,
      reasoning_tokens: 15,
      cached_input_tokens: 8,
      inference_time_ms: 600,
    } as ReturnType<typeof observeInference> extends Promise<infer T>
      ? T
      : never);

    installNoopGuard();

    const onMetrics = vi.fn();
    const handler = buildObserveHandler({ onMetrics });

    // No timeout specified
    const result = await handler.observe({
      instruction: "find buttons",
      page: makeFakePage(),
    });

    expect(result).toHaveLength(1);
    expect(result[0]).toHaveProperty("description", "Submit button");
    expect(onMetrics).toHaveBeenCalledWith(
      V3FunctionName.OBSERVE,
      150,
      75,
      15,
      8,
      600,
    );
  });

  it("act() with zero timeout behaves as no timeout", () =>
    // Zero timeout should be treated as "no timeout"
    expectActIgnoresTimeout(0));

  it("act() with negative timeout behaves as no timeout", () =>
    // Negative timeout should be treated as "no timeout"
    expectActIgnoresTimeout(-100));
});

/** Optional overrides accepted by the buildActHandler test factory. */
interface BuildActHandlerOptions {
  /** Forwarded to the ActHandler constructor; the factory uses false when omitted. */
  selfHeal?: boolean;
  /**
   * Metrics callback forwarded to the ActHandler constructor. The success-path
   * test expects it to receive the function name followed by the token counts
   * and inference time taken from the mocked inference result.
   */
  onMetrics?: (
    functionName: V3FunctionName,
    promptTokens: number,
    completionTokens: number,
    reasoningTokens: number,
    cachedInputTokens: number,
    inferenceTimeMs: number,
  ) => void;
}

/**
 * Test factory: creates an ActHandler wired to a stub "openai"/"gpt-4o"
 * LLM client and a resolver mock that always returns that same stub.
 *
 * @param options - Optional selfHeal flag (false when omitted) and metrics
 *   callback, both passed straight through to the ActHandler constructor.
 * @returns A freshly constructed ActHandler.
 */
function buildActHandler(options: BuildActHandlerOptions = {}): ActHandler {
  const modelName = "gpt-4o";
  const clientOptions = {} as ClientOptions;

  // Only the fields listed here exist on the stub; the cast covers the rest.
  const stubClient = {
    type: "openai",
    modelName,
    clientOptions,
  } as LLMClient;

  const clientResolver = vi.fn().mockReturnValue(stubClient);
  const selfHealEnabled = options.selfHeal ?? false;

  return new ActHandler(
    stubClient,
    modelName,
    clientOptions,
    clientResolver,
    undefined,
    false,
    selfHealEnabled,
    options.onMetrics,
    undefined,
  );
}

/** Optional overrides accepted by the buildExtractHandler test factory. */
interface BuildExtractHandlerOptions {
  /**
   * Metrics callback forwarded to the ExtractHandler constructor. The
   * success-path test expects it to receive the function name followed by the
   * token counts and inference time taken from the mocked inference result.
   */
  onMetrics?: (
    functionName: V3FunctionName,
    promptTokens: number,
    completionTokens: number,
    reasoningTokens: number,
    cachedInputTokens: number,
    inferenceTimeMs: number,
  ) => void;
}

/**
 * Test factory: creates an ExtractHandler wired to a stub "openai"/"gpt-4o"
 * LLM client and a resolver mock that always returns that same stub.
 *
 * @param options - Optional metrics callback, passed straight through to the
 *   ExtractHandler constructor.
 * @returns A freshly constructed ExtractHandler.
 */
function buildExtractHandler(
  options: BuildExtractHandlerOptions = {},
): ExtractHandler {
  const modelName = "gpt-4o";
  const clientOptions = {} as ClientOptions;

  // Only the fields listed here exist on the stub; the cast covers the rest.
  const stubClient = {
    type: "openai",
    modelName,
    clientOptions,
  } as LLMClient;

  const clientResolver = vi.fn().mockReturnValue(stubClient);

  return new ExtractHandler(
    stubClient,
    modelName,
    clientOptions,
    clientResolver,
    undefined,
    false,
    false,
    options.onMetrics,
  );
}

/** Optional overrides accepted by the buildObserveHandler test factory. */
interface BuildObserveHandlerOptions {
  /**
   * Metrics callback forwarded to the ObserveHandler constructor. The
   * success-path test expects it to receive the function name followed by the
   * token counts and inference time taken from the mocked inference result.
   */
  onMetrics?: (
    functionName: V3FunctionName,
    promptTokens: number,
    completionTokens: number,
    reasoningTokens: number,
    cachedInputTokens: number,
    inferenceTimeMs: number,
  ) => void;
}

/**
 * Test factory: creates an ObserveHandler wired to a stub "openai"/"gpt-4o"
 * LLM client and a resolver mock that always returns that same stub.
 *
 * @param options - Optional metrics callback, passed straight through to the
 *   ObserveHandler constructor.
 * @returns A freshly constructed ObserveHandler.
 */
function buildObserveHandler(
  options: BuildObserveHandlerOptions = {},
): ObserveHandler {
  const modelName = "gpt-4o";
  const clientOptions = {} as ClientOptions;

  // Only the fields listed here exist on the stub; the cast covers the rest.
  const stubClient = {
    type: "openai",
    modelName,
    clientOptions,
  } as LLMClient;

  const clientResolver = vi.fn().mockReturnValue(stubClient);

  return new ObserveHandler(
    stubClient,
    modelName,
    clientOptions,
    clientResolver,
    undefined,
    false,
    false,
    options.onMetrics,
  );
}


================================================
FILE: packages/core/tests/unit/understudy-command-exception.test.ts
================================================
import { describe, expect, it } from "vitest";
import {
  UnderstudyCommandException,
  StagehandError,
} from "../../lib/v3/types/public/sdkErrors.js";

describe("UnderstudyCommandException", () => {
  it("extends StagehandError", () => {
    const exception = new UnderstudyCommandException("test");

    expect(exception).toBeInstanceOf(StagehandError);
    expect(exception).toBeInstanceOf(Error);
  });

  it("has the correct name", () => {
    const { name } = new UnderstudyCommandException("test");

    expect(name).toBe("UnderstudyCommandException");
  });

  it("preserves the message", () => {
    const { message } = new UnderstudyCommandException("something broke");

    expect(message).toBe("something broke");
  });

  it("stores the original error as cause when provided", () => {
    const rootCause = new Error("root cause");
    const wrapper = new UnderstudyCommandException(
      "wrapper message",
      rootCause,
    );

    // Identity first, then the fields reachable through the stored cause.
    expect(wrapper.cause).toBe(rootCause);
    const storedCause = wrapper.cause as Error;
    expect(storedCause.message).toBe("root cause");
    expect(storedCause.stack).toBeDefined();
  });

  it("stores non-Error cause values", () => {
    const exception = new UnderstudyCommandException("failed", "string cause");

    expect(exception.cause).toBe("string cause");
  });

  it("has undefined cause when none is provided", () => {
    const exception = new UnderstudyCommandException("no cause");

    expect(exception.cause).toBeUndefined();
  });

  it("generates its own stack trace", () => {
    const { stack } = new UnderstudyCommandException("test");

    expect(stack).toBeDefined();
    expect(stack).toContain("UnderstudyCommandException");
  });

  it("preserves the original stack via cause for debugging", () => {
    // The function name matters: the final assertion looks for it in the stack.
    function deepFunction() {
      throw new Error("deep error");
    }

    let thrown: unknown;
    try {
      deepFunction();
    } catch (error) {
      thrown = error;
    }
    const rootCause = thrown as Error;

    const wrapped = new UnderstudyCommandException(
      rootCause.message,
      rootCause,
    );

    // The wrapper has its own stack
    expect(wrapped.stack).toBeDefined();
    // The original stack is accessible via cause
    expect((wrapped.cause as Error).stack).toContain("deepFunction");
  });
});


================================================
FILE: packages/core/tests/unit/xpath-parser.test.ts
================================================
import { describe, expect, it } from "vitest";
import {
  applyPredicates,
  parseXPathSteps,
  type XPathPredicate,
} from "../../lib/v3/dom/locatorScripts/xpathParser.js";

describe("parseXPathSteps", () => {
  // Plain `/tag` segments: one step per segment, no predicates.
  describe("basic tag parsing", () => {
    // Expected shape of a predicate-free step on the child axis.
    const childStep = (tag: string) => ({ axis: "child", tag, predicates: [] });

    it("parses a simple absolute path", () => {
      const expected = ["html", "body", "div"].map((tag) => childStep(tag));
      expect(parseXPathSteps("/html/body/div")).toEqual(expected);
    });

    it("lowercases tag names", () => {
      const [first, second] = parseXPathSteps("/HTML/BODY");
      expect(first.tag).toBe("html");
      expect(second.tag).toBe("body");
    });

    it("treats wildcard correctly", () => {
      const wildcard = { axis: "desc", tag: "*", predicates: [] };
      expect(parseXPathSteps("//*")).toEqual([wildcard]);
    });
  });

  // A single slash yields the "child" axis, a double slash yields "desc".
  describe("axes", () => {
    it("distinguishes child (/) from descendant (//)", () => {
      const axisAndTag = [
        ["child", "html"],
        ["desc", "div"],
        ["child", "span"],
      ];
      const expected = axisAndTag.map(([axis, tag]) => ({
        axis,
        tag,
        predicates: [],
      }));

      expect(parseXPathSteps("/html//div/span")).toEqual(expected);
    });

    it("handles leading //", () => {
      const [leading] = parseXPathSteps("//div");
      expect(leading.axis).toBe("desc");
    });
  });

  // Numeric predicates such as `[3]` become `{ type: "index" }` entries.
  describe("positional indices", () => {
    // Expected shape of a positional predicate.
    const indexPredicate = (index: number) => ({ type: "index", index });

    it("parses positional index", () => {
      const [divStep, spanStep] = parseXPathSteps("/div[1]/span[3]");

      expect(divStep).toMatchObject({
        tag: "div",
        predicates: [indexPredicate(1)],
      });
      expect(spanStep).toMatchObject({
        tag: "span",
        predicates: [indexPredicate(3)],
      });
    });

    it("clamps index to minimum 1", () => {
      // `[0]` is expected to come back as index 1.
      const [{ predicates }] = parseXPathSteps("/div[0]");
      expect(predicates[0]).toMatchObject(indexPredicate(1));
    });

    it("keeps multiple positional predicates in order", () => {
      const [{ predicates }] = parseXPathSteps("//div[2][3]");
      expect(predicates).toEqual([indexPredicate(2), indexPredicate(3)]);
    });
  });

  // Attribute-based predicates: equality, existence, contains() and
  // starts-with(), including values that contain bracket characters.
  describe("attribute predicates", () => {
    // Predicate list of the first step parsed from `xpath`.
    const firstStepPredicates = (xpath: string) =>
      parseXPathSteps(xpath)[0].predicates;

    it("parses single attribute predicate with single quotes", () => {
      expect(parseXPathSteps("//img[@alt='Stagehand']")).toEqual([
        {
          axis: "desc",
          tag: "img",
          predicates: [{ type: "attrEquals", name: "alt", value: "Stagehand" }],
        },
      ]);
    });

    it("parses single attribute predicate with double quotes", () => {
      expect(firstStepPredicates('//img[@alt="Stagehand"]')).toEqual([
        { type: "attrEquals", name: "alt", value: "Stagehand" },
      ]);
    });

    it("parses multiple attribute predicates", () => {
      expect(firstStepPredicates("//div[@class='foo'][@id='bar']")).toEqual([
        { type: "attrEquals", name: "class", value: "foo" },
        { type: "attrEquals", name: "id", value: "bar" },
      ]);
    });

    it("parses attribute predicate combined with positional index", () => {
      const [step] = parseXPathSteps("//div[@class='item'][2]");
      expect(step).toMatchObject({
        tag: "div",
        predicates: [
          { type: "attrEquals", name: "class", value: "item" },
          { type: "index", index: 2 },
        ],
      });
    });

    it("parses attribute with hyphenated name", () => {
      expect(firstStepPredicates("//div[@data-testid='submit']")).toEqual([
        { type: "attrEquals", name: "data-testid", value: "submit" },
      ]);
    });

    it("parses attribute with empty value", () => {
      expect(firstStepPredicates("//input[@value='']")).toEqual([
        { type: "attrEquals", name: "value", value: "" },
      ]);
    });

    it("parses attribute value containing closing bracket", () => {
      expect(firstStepPredicates("//div[@title='array[0]']")).toEqual([
        { type: "attrEquals", name: "title", value: "array[0]" },
      ]);
    });

    it("parses attribute value containing multiple brackets", () => {
      expect(firstStepPredicates("//div[@data-json='[1,2,3]']")).toEqual([
        { type: "attrEquals", name: "data-json", value: "[1,2,3]" },
      ]);
    });

    // Retitled: the previous title differed from the bracket test above only
    // by the article "a". This case is about step splitting, not just the
    // predicate value.
    it("splits steps after an attribute value containing a closing bracket", () => {
      // The step splitter should ignore ] characters inside quotes.
      expect(parseXPathSteps("//div[@title='a]b']/span")).toEqual([
        {
          axis: "desc",
          tag: "div",
          predicates: [{ type: "attrEquals", name: "title", value: "a]b" }],
        },
        { axis: "child", tag: "span", predicates: [] },
      ]);
    });

    it("parses attribute existence predicates", () => {
      expect(firstStepPredicates("//iframe[@data-test]")).toEqual([
        { type: "attrExists", name: "data-test" },
      ]);
    });

    it("parses attribute contains predicates", () => {
      expect(
        firstStepPredicates("//iframe[contains(@src,'checkout')]"),
      ).toEqual([{ type: "attrContains", name: "src", value: "checkout" }]);
    });

    it("parses attribute starts-with predicates", () => {
      expect(
        firstStepPredicates("//button[starts-with(@id,'save-')]"),
      ).toEqual([{ type: "attrStartsWith", name: "id", value: "save-" }]);
    });
  });

  // Predicates on text(): equality, contains(), and normalize-space().
  describe("text predicates", () => {
    // Predicate list of the first step parsed from `xpath`.
    const predicatesOf = (xpath: string) =>
      parseXPathSteps(xpath)[0].predicates;

    it("parses text equality", () => {
      const expected = [{ type: "textEquals", value: "Submit" }];
      expect(predicatesOf("//button[text()='Submit']")).toEqual(expected);
    });

    it("parses text contains", () => {
      const expected = [{ type: "textContains", value: "Welcome" }];
      expect(predicatesOf("//div[contains(text(),'Welcome')]")).toEqual(
        expected,
      );
    });

    it("parses normalize-space on text", () => {
      const xpath = "//div[normalize-space(text())='Hello world']";
      expect(predicatesOf(xpath)).toEqual([
        { type: "textEquals", value: "Hello world", normalize: true },
      ]);
    });
  });

  // `and`, `or` and `not(...)` combinators inside a single predicate.
  describe("boolean predicates", () => {
    // Predicate list of the first step parsed from `xpath`.
    const predicatesOf = (xpath: string) =>
      parseXPathSteps(xpath)[0].predicates;

    // Builders for the expected leaf predicates.
    const attrEquals = (name: string, value: string) => ({
      type: "attrEquals",
      name,
      value,
    });
    const attrExists = (name: string) => ({ type: "attrExists", name });

    it("parses and predicates", () => {
      expect(predicatesOf("//div[@a='x' and @b='y']")).toEqual([
        { type: "and", predicates: [attrEquals("a", "x"), attrEquals("b", "y")] },
      ]);
    });

    it("parses operators without surrounding whitespace", () => {
      expect(predicatesOf("//div[not(@x)and@y='z']")).toEqual([
        {
          type: "and",
          predicates: [
            { type: "not", predicate: attrExists("x") },
            attrEquals("y", "z"),
          ],
        },
      ]);
    });

    it("parses or predicates", () => {
      expect(predicatesOf("//div[@a='x' or @b='y']")).toEqual([
        { type: "or", predicates: [attrEquals("a", "x"), attrEquals("b", "y")] },
      ]);
    });

    it("parses not predicates", () => {
      expect(predicatesOf("//button[not(@disabled)]")).toEqual([
        { type: "not", predicate: attrExists("disabled") },
      ]);
    });

    it("does not treat @and as a boolean operator", () => {
      // The first `and` is an attribute name; only the second is the operator.
      expect(predicatesOf("//div[@and='x' and @y='z']")).toEqual([
        {
          type: "and",
          predicates: [attrEquals("and", "x"), attrEquals("y", "z")],
        },
      ]);
    });
  });

  // A longer path mixing both axes with attribute and positional predicates.
  describe("multi-step with predicates", () => {
    it("parses complex path with mixed predicates", () => {
      // Expected shape of a predicate-free step on the child axis.
      const plainChild = (tag: string) => ({
        axis: "child",
        tag,
        predicates: [],
      });
      const xpath = "/html/body//div[@class='container']/ul/li[3]";

      expect(parseXPathSteps(xpath)).toEqual([
        plainChild("html"),
        plainChild("body"),
        {
          axis: "desc",
          tag: "div",
          predicates: [
            { type: "attrEquals", name: "class", value: "container" },
          ],
        },
        plainChild("ul"),
        { axis: "child", tag: "li", predicates: [{ type: "index", index: 3 }] },
      ]);
    });
  });

  // Input normalisation (empty input, `xpath=` prefix, whitespace) and
  // slashes that appear inside quoted attribute values.
  describe("edge cases", () => {
    // Expected parse result for a bare `//div`.
    const descendantDivOnly = () => [
      { axis: "desc", tag: "div", predicates: [] },
    ];

    // Expected parse result for `//a[@<name>='<value>']`.
    const anchorWithAttr = (name: string, value: string) => [
      {
        axis: "desc",
        tag: "a",
        predicates: [{ type: "attrEquals", name, value }],
      },
    ];

    it("returns empty array for empty string", () => {
      expect(parseXPathSteps("")).toEqual([]);
    });

    it("strips xpath= prefix", () => {
      expect(parseXPathSteps("xpath=//div")).toEqual(descendantDivOnly());
    });

    it("strips XPATH= prefix (case-insensitive)", () => {
      expect(parseXPathSteps("XPATH=//div")).toEqual(descendantDivOnly());
    });

    it("handles forward slashes inside attribute values", () => {
      expect(parseXPathSteps("//a[@href='/api/endpoint']")).toEqual(
        anchorWithAttr("href", "/api/endpoint"),
      );
    });

    it("handles URL attribute values with multiple slashes", () => {
      const url = "http://example.com/path/to/page";
      expect(
        parseXPathSteps("//a[@data-url='http://example.com/path/to/page']"),
      ).toEqual(anchorWithAttr("data-url", url));
    });

    it("handles whitespace", () => {
      const parsed = parseXPathSteps("  //div  ");
      expect(parsed.length).toBe(1);
      expect(parsed[0].tag).toBe("div");
    });
  });
});

describe("applyPredicates", () => {
  // Minimal Element stand-in: a "div" whose only attribute is `id`.
  const stubElement = (id: string): Element =>
    ({
      localName: "div",
      getAttribute: (name: string) => (name === "id" ? id : null),
    }) as unknown as Element;

  it("applies positional predicates sequentially", () => {
    const candidates = ["a", "b", "c", "d"].map((id) => stubElement(id));
    const chained: XPathPredicate[] = [
      { type: "index", index: 2 },
      { type: "index", index: 3 },
    ];

    // Four candidates go in and nothing is expected to come out once both
    // positional predicates have been applied one after the other.
    const survivors = applyPredicates(candidates, chained);
    expect(survivors).toEqual([]);
  });
});


================================================
FILE: packages/core/tests/unit/xpath-resolver.test.ts
================================================
import { JSDOM } from "jsdom";
import { afterAll, beforeAll, beforeEach, describe, expect, it } from "vitest";
import {
  countXPathMatches,
  resolveXPathAtIndex,
} from "../../lib/v3/dom/locatorScripts/xpathResolver.js";

/**
 * The DOM-related globals this test file swaps in on `globalThis` and later
 * restores. Each member has the type of the corresponding browser global.
 */
interface DomGlobals {
  window: Window & typeof globalThis;
  document: Document;
  Node: typeof Node;
  NodeFilter: typeof NodeFilter;
  Element: typeof Element;
  HTMLElement: typeof HTMLElement;
  Document: typeof Document;
  DocumentFragment: typeof DocumentFragment;
  ShadowRoot: typeof ShadowRoot;
  XPathResult: typeof XPathResult;
}

// `globalThis` viewed as possibly carrying the DOM globals listed in
// DomGlobals, so they can be read and assigned with their proper types.
const globalRef = globalThis as typeof globalThis & Partial<DomGlobals>;
// Snapshot of each DOM global as it is when this module is evaluated.
// restoreDomGlobals() writes these values back, deleting any key whose
// snapshot value is undefined.
const originalGlobals: Partial<DomGlobals> = {
  window: globalRef.window,
  document: globalRef.document,
  Node: globalRef.Node,
  NodeFilter: globalRef.NodeFilter,
  Element: globalRef.Element,
  HTMLElement: globalRef.HTMLElement,
  Document: globalRef.Document,
  DocumentFragment: globalRef.DocumentFragment,
  ShadowRoot: globalRef.ShadowRoot,
  XPathResult: globalRef.XPathResult,
};

// JSDOM instance backing the installed globals; assigned in beforeAll and
// closed in afterAll.
let dom: JSDOM;

/**
 * Copies the DOM constructors and objects of the current JSDOM window onto
 * `globalThis`, so code that reads bare globals such as `document` or
 * `Node` sees the JSDOM versions.
 */
const installDomGlobals = () => {
  const jsdomWindow = dom.window;

  // The double casts bridge JSDOM's own typings to the lib.dom global types.
  Object.assign(globalRef, {
    window: jsdomWindow as unknown as Window & typeof globalThis,
    document: jsdomWindow.document,
    Node: jsdomWindow.Node as unknown as typeof Node,
    NodeFilter: jsdomWindow.NodeFilter as unknown as typeof NodeFilter,
    Element: jsdomWindow.Element as unknown as typeof Element,
    HTMLElement: jsdomWindow.HTMLElement as unknown as typeof HTMLElement,
    Document: jsdomWindow.Document as unknown as typeof Document,
    DocumentFragment:
      jsdomWindow.DocumentFragment as unknown as typeof DocumentFragment,
    ShadowRoot: jsdomWindow.ShadowRoot as unknown as typeof ShadowRoot,
    XPathResult: jsdomWindow.XPathResult as unknown as typeof XPathResult,
  });
};

/**
 * Puts every global recorded in `originalGlobals` back to its snapshot
 * value. A global whose snapshot is undefined is deleted from `globalThis`
 * instead of being set to undefined.
 */
const restoreDomGlobals = () => {
  const target = globalRef as Record<string, unknown>;

  Object.entries(originalGlobals).forEach(([name, saved]) => {
    if (saved !== undefined) {
      target[name] = saved;
      return;
    }
    delete target[name];
  });
};

describe("xpathResolver composed traversal", () => {
  // Shared fixture: a light-DOM div, a shadow host whose open shadow root
  // holds two divs, then another light-DOM div.
  const mountLightAndShadowDivs = () => {
    document.body.innerHTML = [
      '<div id="light-1"></div>',
      '<shadow-host id="host"></shadow-host>',
      '<div id="light-2"></div>',
    ].join("");

    const host = document.getElementById("host") as HTMLElement;
    const shadowRoot = host.attachShadow({ mode: "open" });
    shadowRoot.innerHTML = '<div id="shadow-1"></div><div id="shadow-2"></div>';
  };

  beforeAll(() => {
    dom = new JSDOM("<!doctype html><html><body></body></html>");
    installDomGlobals();
  });

  afterAll(() => {
    dom.window.close();
    restoreDomGlobals();
  });

  // Every test starts from an empty body.
  beforeEach(() => {
    document.body.innerHTML = "";
  });

  it("counts matches across light + shadow DOM without double counting", () => {
    mountLightAndShadowDivs();

    // Two light divs plus two shadow divs.
    expect(countXPathMatches("//div")).toBe(4);
  });

  it("resolves nth over composed tree in document-order DFS", () => {
    mountLightAndShadowDivs();

    // Shadow content is expected at the host's position, between the two
    // light-DOM divs.
    const idsInOrder = ["light-1", "shadow-1", "shadow-2", "light-2"];
    idsInOrder.forEach((id, index) => {
      expect(resolveXPathAtIndex("//div", index)?.id).toBe(id);
    });
  });
});


================================================
FILE: packages/core/tests/unit/zod-enum-compatibility.test.ts
================================================
import { describe, expect, it } from "vitest";
import * as z3 from "zod/v3";
import { z as z4 } from "zod";
import { SupportedUnderstudyAction } from "../../lib/v3/types/private/handlers.js";

/**
 * Zod v3 / v4 compatibility checks for the SupportedUnderstudyAction enum.
 *
 * In Zod v3, z.enum() only accepts a tuple of string literals; it does NOT
 * accept a TypeScript enum object. Zod v4 additionally accepts the enum object
 * itself. Passing Object.values(enum) works with both versions, so that is the
 * form these tests pin down.
 *
 * See PR #1613: https://github.com/browserbase/stagehand/pull/1613
 */
describe("SupportedUnderstudyAction enum Zod compatibility", () => {
  // Builds a fresh action payload for the given method name.
  const payloadFor = (method: string) => ({
    elementId: "1-2",
    method,
    arguments: [] as string[],
  });

  // The enum's values, viewed as the non-empty string tuple z.enum() expects.
  const listActionValues = () =>
    Object.values(SupportedUnderstudyAction) as unknown as readonly [
      string,
      ...string[],
    ];

  it("Object.values(SupportedUnderstudyAction) produces correct array for z.enum()", () => {
    const values = listActionValues();
    const expectedActions = [
      "click",
      "fill",
      "type",
      "press",
      "scrollTo",
      "nextChunk",
      "prevChunk",
      "selectOptionFromDropdown",
      "hover",
      "doubleClick",
      "dragAndDrop",
    ];

    expectedActions.forEach((action) => {
      expect(values).toContain(action);
    });
    expect(values.length).toBe(11);
  });

  it("Zod v3 z.enum() with Object.values(SupportedUnderstudyAction) works correctly", () => {
    const schema = z3.z.object({
      elementId: z3.z.string(),
      method: z3.z.enum(listActionValues()),
      arguments: z3.z.array(z3.z.string()),
    });

    // Valid input should pass
    const accepted = schema.safeParse(payloadFor("click"));
    expect(accepted.success).toBe(true);
    if (accepted.success) {
      expect(accepted.data.method).toBe("click");
    }

    // Invalid input should fail
    const rejected = schema.safeParse(payloadFor("invalidMethod"));
    expect(rejected.success).toBe(false);
  });

  it("Zod v4 z.enum() with Object.values(SupportedUnderstudyAction) works correctly", () => {
    const schema = z4.object({
      elementId: z4.string(),
      method: z4.enum(listActionValues()),
      arguments: z4.array(z4.string()),
    });

    // Valid input should pass
    const accepted = schema.safeParse(payloadFor("click"));
    expect(accepted.success).toBe(true);
    if (accepted.success) {
      expect(accepted.data.method).toBe("click");
    }

    // Invalid input should fail
    const rejected = schema.safeParse(payloadFor("invalidMethod"));
    expect(rejected.success).toBe(false);
  });

  it("Zod v3 z.enum() with raw TypeScript enum throws error on parse", () => {
    // This demonstrates the bug that PR #1613 would introduce.
    // In Zod v3, z.enum() does NOT accept TypeScript enums directly:
    // building the schema might succeed, but parsing with it fails.
    const schema = z3.z.object({
      elementId: z3.z.string(),
      // eslint-disable-next-line @typescript-eslint/no-explicit-any
      method: z3.z.enum(SupportedUnderstudyAction as any),
      arguments: z3.z.array(z3.z.string()),
    });

    // Parsing should throw because the enum object is not iterable.
    const parseWithRawEnum = () => schema.safeParse(payloadFor("click"));
    expect(parseWithRawEnum).toThrow("object is not iterable");
  });

  it("Zod v4 z.enum() with raw TypeScript enum works (but not v3 compatible)", () => {
    // Zod v4 allows passing TypeScript enums directly to z.enum(),
    // but that form is NOT backwards compatible with v3.
    const schema = z4.object({
      elementId: z4.string(),
      method: z4.enum(SupportedUnderstudyAction),
      arguments: z4.array(z4.string()),
    });

    // In v4, this works fine
    expect(schema.safeParse(payloadFor("click")).success).toBe(true);
  });

  it("All SupportedUnderstudyAction values are valid enum options", () => {
    const values = listActionValues();

    // Every value must be accepted by both the v3 and the v4 schema.
    const v3Schema = z3.z.enum(values);
    const v4Schema = z4.enum(values);

    values.forEach((action) => {
      expect(v3Schema.safeParse(action).success).toBe(true);
      expect(v4Schema.safeParse(action).success).toBe(true);
    });
  });
});


================================================
FILE: packages/core/tsconfig.json
================================================
{
  "extends": "../../tsconfig.base.json",
  "compilerOptions": {
    "baseUrl": "../../",
    "rootDir": ".",
    "outDir": "./dist/esm",
    "allowJs": true,
    "paths": {
      "@browserbasehq/stagehand": ["packages/core/lib/v3/index.ts"],
      "@browserbasehq/stagehand/*": ["packages/core/lib/*"],
      "*": ["node_modules/*", "packages/core/lib/types/*"],
      "@/*": ["./*"]
    }
  },
  "include": [
    "lib/**/*.ts",
    "tests/**/*.ts",
    "lib/v3/cli.js"
  ],
  "exclude": ["node_modules", "dist", "lib/v3/dom/gen*.ts"]
}


================================================
FILE: packages/core/vitest.cjs.config.mjs
================================================
import { defineConfig } from "vitest/config";
import path from "node:path";
import { fileURLToPath } from "node:url";

// Directory that contains this config file.
const configDir = path.dirname(fileURLToPath(import.meta.url));

// Entry point of the CommonJS build that the package name is aliased to.
const cjsEntry = path.join(configDir, "dist", "cjs", "index.js");

// Runs the compiled unit tests of the CJS build in a Node environment.
export default defineConfig({
  test: {
    include: ["**/dist/cjs/tests/unit/**/*.test.js"],
    environment: "node",
  },
  resolve: {
    alias: { "@browserbasehq/stagehand": cjsEntry },
  },
});


================================================
FILE: packages/core/vitest.config.ts
================================================
import { defineConfig } from "vitest/config";
import path from "node:path";
import { fileURLToPath } from "node:url";

// Directory that contains this config file.
const configDir = path.dirname(fileURLToPath(import.meta.url));

// Entry point of the ESM build that the package name is aliased to.
const esmEntry = path.join(configDir, "dist", "esm", "index.js");

// Runs the compiled unit tests of the ESM build in a Node environment.
export default defineConfig({
  test: {
    include: ["**/dist/esm/tests/unit/**/*.test.js"],
    environment: "node",
  },
  resolve: {
    alias: { "@browserbasehq/stagehand": esmEntry },
  },
});


================================================
FILE: packages/core/vitest.esm.config.mjs
================================================
import { defineConfig } from "vitest/config";
import path from "node:path";
import { fileURLToPath } from "node:url";

// Directory that contains this config file.
const configDir = path.dirname(fileURLToPath(import.meta.url));

// Entry point of the ESM build that the package name is aliased to.
const esmEntry = path.join(configDir, "dist", "esm", "index.js");

// Runs the compiled unit tests of the ESM build in a Node environment.
export default defineConfig({
  test: {
    include: ["**/dist/esm/tests/unit/**/*.test.js"],
    environment: "node",
  },
  resolve: {
    alias: { "@browserbasehq/stagehand": esmEntry },
  },
});


================================================
FILE: packages/docs/.gitignore
================================================
node_modules
downloads
.DS_Store

================================================
FILE: packages/docs/README.md
================================================
# Mintlify Starter Kit

Click on `Use this template` to copy the Mintlify starter kit. The starter kit contains examples including:

- Guide pages
- Navigation
- Customizations
- API Reference pages
- Use of popular components

### Development

Install dependencies with pnpm

```
pnpm install
```

Run the following command at the root of your documentation (the directory that contains `docs.json`):

```
pnpm mintlify dev
```

### Publishing Changes

Install our GitHub App to automatically propagate changes from your repo to your deployment. Changes will be deployed to production automatically after pushing to the default branch. Find the link to install on your dashboard.

#### Troubleshooting

- Mintlify dev isn't running - Run `mintlify install`; it will re-install dependencies.
- Page loads as a 404 - Make sure you are running in a folder with `docs.json`.


================================================
FILE: packages/docs/docs.json
================================================
{
  "$schema": "https://mintlify.com/docs.json",
  "theme": "willow",
  "name": "🤘 Stagehand",
  "colors": {
    "primary": "#B88100",
    "light": "#FFC83C",
    "dark": "#FFC83C"
  },
  "favicon": "/images/favicon.svg",
  "seo": {
    "indexing": "all",
    "metatags": {
      "og:type": "website",
      "og:site_name": "Stagehand Docs"
    }
  },
  "openapi": "https://app.stainless.com/api/spec/documented/stagehand/openapi.documented.yml",
  "navigation": {
    "versions": [
      {
        "version": "v3",
        "dropdowns": [
          {
            "dropdown": "TypeScript",
            "icon": "code",
            "pages": [
              "v3/first-steps/introduction"
            ],
            "groups": [
              {
                "group": "First Steps",
                "pages": [
                  "v3/first-steps/introduction",
                  "v3/first-steps/quickstart",
                  "v3/first-steps/installation",
                  "v3/first-steps/ai-rules"
                ]
              },
              {
                "group": "The Basics",
                "pages": [
                  "v3/basics/agent",
                  "v3/basics/act",
                  "v3/basics/extract",
                  "v3/basics/observe",
                  "v3/basics/evals"
                ]
              },
              {
                "group": "Configuration",
                "pages": [
                  "v3/configuration/browser",
                  "v3/configuration/observability",
                  "v3/configuration/logging",
                  "v3/configuration/models"
                ]
              },
              {
                "group": "Best Practices",
                "pages": [
                  "v3/best-practices/caching",
                  "v3/best-practices/cost-optimization",
                  "v3/best-practices/deterministic-agent",
                  "v3/best-practices/using-multiple-tabs",
                  "v3/best-practices/deployments",
                  "v3/best-practices/history",
                  "v3/best-practices/computer-use",
                  "v3/best-practices/agent-fallbacks",
                  "v3/best-practices/prompting-best-practices",
                  "v3/best-practices/mcp-integrations",
                  "v3/best-practices/speed-optimization"
                ]
              },
              {
                "group": "Integrations",
                "pages": [
                  {
                    "group": "MCP Server",
                    "pages": [
                      "v3/integrations/mcp/introduction",
                      "v3/integrations/mcp/setup",
                      "v3/integrations/mcp/tools",
                      "v3/integrations/mcp/configuration"
                    ]
                  },
                  {
                    "group": "CrewAI",
                    "pages": [
                      "v3/integrations/crew-ai/introduction",
                      "v3/integrations/crew-ai/configuration"
                    ]
                  },
                  {
                    "group": "Langchain",
                    "pages": [
                      "v3/integrations/langchain/introduction",
                      "v3/integrations/langchain/configuration"
                    ]
                  },
                  {
                    "group": "Next.js + Vercel",
                    "pages": [
                      "v3/integrations/vercel/introduction",
                      "v3/integrations/vercel/configuration"
                    ]
                  },
                  {
                    "group": "Convex",
                    "pages": [
                      "v3/integrations/convex/introduction",
                      "v3/integrations/convex/configuration"
                    ]
                  },
                  "v3/integrations/playwright",
                  "v3/integrations/puppeteer",
                  "v3/integrations/selenium"
                ]
              },
              {
                "group": "Reference",
                "pages": [
                  "v3/references/stagehand",
                  "v3/references/agent",
                  "v3/references/act",
                  "v3/references/extract",
                  "v3/references/observe",
                  "v3/references/context",
                  "v3/references/page",
                  "v3/references/locator",
                  "v3/references/deeplocator",
                  "v3/references/response"
                ]
              },
              {
                "group": "Migration Guides",
                "pages": [
                  "v3/migrations/v2",
                  "v3/migrations/python"
                ]
              }
            ]
          },
          {
            "dropdown": "Python",
            "icon": "code",
            "pages": [
              "v3/sdk/python"
            ],
            "groups": [
              {
                "group": "SDK Reference",
                "pages": [
                  "v3/sdk/python"
                ]
              },
              {
                "group": "API Reference",
                "openapi": {
                  "source": "https://app.stainless.com/api/spec/documented/stagehand/openapi.documented.yml",
                  "directory": "v3/api-reference/python"
                },
                "pages": [
                  "POST /v1/sessions/start",
                  "POST /v1/sessions/{id}/navigate",
                  "POST /v1/sessions/{id}/act",
                  "POST /v1/sessions/{id}/observe",
                  "POST /v1/sessions/{id}/extract",
                  "POST /v1/sessions/{id}/agentExecute",
                  "POST /v1/sessions/{id}/end",
                  "GET /v1/sessions/{id}/replay"
                ]
              }
            ]
          },
          {
            "dropdown": "Java",
            "icon": "code",
            "pages": [
              "v3/sdk/java"
            ],
            "groups": [
              {
                "group": "SDK Reference",
                "pages": [
                  "v3/sdk/java"
                ]
              },
              {
                "group": "API Reference",
                "openapi": {
                  "source": "https://app.stainless.com/api/spec/documented/stagehand/openapi.documented.yml",
                  "directory": "v3/api-reference/java"
                },
                "pages": [
                  "POST /v1/sessions/start",
                  "POST /v1/sessions/{id}/navigate",
                  "POST /v1/sessions/{id}/act",
                  "POST /v1/sessions/{id}/observe",
                  "POST /v1/sessions/{id}/extract",
                  "POST /v1/sessions/{id}/agentExecute",
                  "POST /v1/sessions/{id}/end",
                  "GET /v1/sessions/{id}/replay"
                ]
              }
            ]
          },
          {
            "dropdown": "Go",
            "icon": "code",
            "pages": [
              "v3/sdk/go"
            ],
            "groups": [
              {
                "group": "SDK Reference",
                "pages": [
                  "v3/sdk/go"
                ]
              },
              {
                "group": "API Reference",
                "openapi": {
                  "source": "https://app.stainless.com/api/spec/documented/stagehand/openapi.documented.yml",
                  "directory": "v3/api-reference/go"
                },
                "pages": [
                  "POST /v1/sessions/start",
                  "POST /v1/sessions/{id}/navigate",
                  "POST /v1/sessions/{id}/act",
                  "POST /v1/sessions/{id}/observe",
                  "POST /v1/sessions/{id}/extract",
                  "POST /v1/sessions/{id}/agentExecute",
                  "POST /v1/sessions/{id}/end",
                  "GET /v1/sessions/{id}/replay"
                ]
              }
            ]
          },
          {
            "dropdown": "Ruby",
            "icon": "code",
            "pages": [
              "v3/sdk/ruby"
            ],
            "groups": [
              {
                "group": "SDK Reference",
                "pages": [
                  "v3/sdk/ruby"
                ]
              },
              {
                "group": "API Reference",
                "openapi": {
                  "source": "https://app.stainless.com/api/spec/documented/stagehand/openapi.documented.yml",
                  "directory": "v3/api-reference/ruby"
                },
                "pages": [
                  "POST /v1/sessions/start",
                  "POST /v1/sessions/{id}/navigate",
                  "POST /v1/sessions/{id}/act",
                  "POST /v1/sessions/{id}/observe",
                  "POST /v1/sessions/{id}/extract",
                  "POST /v1/sessions/{id}/agentExecute",
                  "POST /v1/sessions/{id}/end",
                  "GET /v1/sessions/{id}/replay"
                ]
              }
            ]
          }
        ]
      },
      {
        "version": "v2",
        "groups": [
          {
            "group": "First Steps",
            "pages": [
              "v2/first-steps/introduction",
              "v2/first-steps/quickstart",
              "v2/first-steps/installation",
              "v2/first-steps/ai-rules"
            ]
          },
          {
            "group": "The Basics",
            "pages": [
              "v2/basics/agent",
              "v2/basics/act",
              "v2/basics/extract",
              "v2/basics/observe"
            ]
          },
          {
            "group": "Configuration",
            "pages": [
              "v2/configuration/browser",
              "v2/configuration/observability",
              "v2/configuration/logging",
              "v2/configuration/models",
              "v2/configuration/evals"
            ]
          },
          {
            "group": "Best Practices",
            "pages": [
              "v2/best-practices/caching",
              "v2/best-practices/cost-optimization",
              "v2/best-practices/using-multiple-tabs",
              "v2/best-practices/working-with-iframes",
              "v2/best-practices/deployments",
              "v2/best-practices/computer-use",
              "v2/best-practices/contributing",
              "v2/best-practices/playwright-interop",
              "v2/best-practices/build-agent",
              "v2/best-practices/agent-fallbacks",
              "v2/best-practices/prompting-best-practices",
              "v2/best-practices/mcp-integrations",
              "v2/best-practices/speed-optimization"
            ]
          },
          {
            "group": "Integrations",
            "pages": [
              {
                "group": "MCP Server",
                "pages": [
                  "v2/integrations/mcp/introduction",
                  "v2/integrations/mcp/setup",
                  "v2/integrations/mcp/tools",
                  "v2/integrations/mcp/configuration"
                ]
              },
              {
                "group": "CrewAI",
                "pages": [
                  "v2/integrations/crew-ai/introduction",
                  "v2/integrations/crew-ai/configuration"
                ]
              },
              {
                "group": "Langchain",
                "pages": [
                  "v2/integrations/langchain/introduction",
                  "v2/integrations/langchain/configuration"
                ]
              },
              {
                "group": "Next.js + Vercel",
                "pages": [
                  "v2/integrations/vercel/introduction",
                  "v2/integrations/vercel/configuration"
                ]
              }
            ]
          },
          {
            "group": "Reference",
            "pages": [
              "v2/references/stagehand",
              "v2/references/act",
              "v2/references/extract",
              "v2/references/observe",
              "v2/references/agent"
            ]
          }
        ]
      }
    ],
    "global": {
      "anchors": [
        {
          "anchor": "Discord",
          "href": "https://stagehand.dev/discord",
          "icon": "discord"
        },
        {
          "anchor": "GitHub",
          "href": "https://github.com/browserbase/stagehand",
          "icon": "github"
        },
        {
          "anchor": "Changelog",
          "href": "https://github.com/browserbase/stagehand/releases",
          "icon": "scroll"
        }
      ]
    }
  },
  "logo": {
    "light": "/logo/light_logo.png",
    "dark": "/logo/dark_logo.png",
    "href": "https://stagehand.dev"
  },
  "navbar": {
    "links": [
      {
        "label": "Discord",
        "href": "https://stagehand.dev/discord"
      },
      {
        "label": "Support",
        "href": "mailto:support@browserbase.com"
      }
    ]
  },
  "footer": {
    "socials": {
      "discord": "https://stagehand.dev/discord",
      "x": "https://x.com/stagehanddev",
      "github": "https://github.com/browserbase/stagehand",
      "linkedin": "https://linkedin.com/company/browserbasehq"
    }
  },
  "integrations": {
    "posthog": {
      "apiKey": "phc_hmwkFrlc9UVrdE1jyG8AEKoCQCSr8dScjsRpKoLBEiV",
      "apiHost": "https://us.i.posthog.com"
    }
  },
  "contextual": {
    "options": [
      "copy",
      "chatgpt",
      "claude",
      "view"
    ]
  },
  "redirects": [
    {
      "source": "/first-steps/:slug*",
      "destination": "/v3/first-steps/:slug*"
    },
    {
      "source": "/basics/:slug*",
      "destination": "/v3/basics/:slug*"
    },
    {
      "source": "/configuration/:slug*",
      "destination": "/v3/configuration/:slug*"
    },
    {
      "source": "/best-practices/:slug*",
      "destination": "/v3/best-practices/:slug*"
    },
    {
      "source": "/integrations/mcp/:slug*",
      "destination": "/v3/integrations/mcp/:slug*"
    },
    {
      "source": "/integrations/crew-ai/:slug*",
      "destination": "/v3/integrations/crew-ai/:slug*"
    },
    {
      "source": "/integrations/langchain/:slug*",
      "destination": "/v3/integrations/langchain/:slug*"
    },
    {
      "source": "/integrations/vercel/:slug*",
      "destination": "/v3/integrations/vercel/:slug*"
    },
    {
      "source": "/integrations/convex/:slug*",
      "destination": "/v3/integrations/convex/:slug*"
    },
    {
      "source": "/references/:slug*",
      "destination": "/v3/references/:slug*"
    },
    {
      "source": "/migrations/:slug*",
      "destination": "/v3/migrations/:slug*"
    }
  ]
}


================================================
FILE: packages/docs/language-selector.js
================================================
// Language switcher for Stagehand docs
// Handles: 1) Sidebar language dropdown selection 2) Code block language syncing

(function() {
  // ============================================
  // CONFIGURATION
  // ============================================

  // Labels of the sidebar language dropdown; matched against button and menu item text.
  const DROPDOWN_LANGUAGES = ['TypeScript', 'Python', 'Java', 'Go', 'Ruby'];

  // Sidebar language -> label to select in the code block language selector.
  const LANGUAGE_MAP = {
    'TypeScript': 'Javascript',
    'Python': 'Python',
    'Java': 'Java',
    'Go': 'Go',
    'Ruby': 'Ruby'
  };

  // Labels that identify a <p> as the current value of a code block language selector.
  const CODE_BLOCK_LANGUAGES = ['Javascript', 'Python', 'Go', 'Java', 'Ruby', 'cURL', 'PHP'];

  // Sidebar language -> last path segment of its "/v3/sdk/<segment>" sidebar item id.
  // TypeScript intentionally has no entry.
  const SDK_PATH_MAP = {
    'Python': 'python',
    'Java': 'java',
    'Go': 'go',
    'Ruby': 'ruby'
  };

  // Sidebar language -> page to navigate to when that language is picked from the dropdown.
  const NAVIGATION_MAP = {
    'TypeScript': '/v3/first-steps/introduction',
    'Python': '/v3/sdk/python',
    'Java': '/v3/sdk/java',
    'Go': '/v3/sdk/go',
    'Ruby': '/v3/sdk/ruby'
  };

  // Language currently considered selected; overwritten by menu clicks and by the
  // value restored from sessionStorage.
  let currentSelectedLanguage = 'TypeScript';
  // True while a simulated code block selection is in flight; blocks re-entrant selections.
  let isSelecting = false;

  // ============================================
  // UTILITIES
  // ============================================

  // Run callback on next frame (immediate visual update)
  const onNextFrame = (fn) => requestAnimationFrame(() => requestAnimationFrame(fn));

  // Stylesheet injected into <head> for the classes this script toggles: it hides menus
  // while a selection is being simulated, hides the version switcher when a
  // non-TypeScript language is active, and hides non-matching SDK sidebar entries.
  const dropdownStyle = document.createElement('style');
  dropdownStyle.id = 'stagehand-language-style';
  dropdownStyle.textContent = `
    /* Hide dropdown during programmatic selection */
    .stagehand-selecting [role="menu"],
    .stagehand-selecting [role="listbox"] {
      opacity: 0 !important;
      pointer-events: none !important;
      transition: none !important;
    }
    
    /* Hide version switcher when non-TypeScript language is selected */
    .stagehand-hide-version-switcher .stagehand-version-switcher {
      display: none !important;
    }
    
    /* Hide SDK reference items that don't match the selected language */
    li[id^="/v3/sdk/"].stagehand-sdk-hidden {
      display: none !important;
    }
  `;
  document.head.appendChild(dropdownStyle);
  
  // ============================================
  // SDK REFERENCE FILTERING
  // ============================================
  
  /**
   * Show only the sidebar SDK entry that belongs to the selected language.
   * Every `li` whose id starts with "/v3/sdk/" gets `stagehand-sdk-hidden`
   * unless its last id segment equals the SDK slug of the current language.
   * With TypeScript selected, all SDK entries are hidden.
   */
  function updateSDKReferenceVisibility() {
    const activeSlug = SDK_PATH_MAP[currentSelectedLanguage];
    const typescriptActive = currentSelectedLanguage === 'TypeScript';

    for (const entry of document.querySelectorAll('li[id^="/v3/sdk/"]')) {
      // The last path segment names the SDK, e.g. "/v3/sdk/python" -> "python".
      const slug = (entry.getAttribute('id') || '').split('/').pop();
      const isActiveSdk = !typescriptActive && Boolean(activeSlug) && slug === activeSlug;
      entry.classList.toggle('stagehand-sdk-hidden', !isActiveSdk);
    }
  }

  // ============================================
  // VERSION SWITCHER VISIBILITY
  // ============================================
  
  function getVersionSwitcher() {
    // Find the version switcher button (contains "v3" or "v2" and has chevron-down)
    const buttons = document.querySelectorAll('button');
    for (const btn of buttons) {
      const text = (btn.textContent || '').trim().toLowerCase();
      // Check if it's a version button (v2, v3, etc.) with chevron icon
      if (/^v\d+$/.test(text) && btn.querySelector('.lucide-chevron-down')) {
        return btn;
      }
    }
    return null;
  }
  
  /**
   * Tag the version switcher button and show it only for TypeScript.
   * Does nothing when the button is not currently in the DOM; in particular the
   * body class is left as it was.
   */
  function updateVersionSwitcherVisibility() {
    const switcher = getVersionSwitcher();
    if (!switcher) return;

    // The marker class lets the injected stylesheet target this button.
    switcher.classList.add('stagehand-version-switcher');

    const hideSwitcher = currentSelectedLanguage !== 'TypeScript';
    document.body.classList.toggle('stagehand-hide-version-switcher', hideSwitcher);
  }
  
  // ============================================
  // SIDEBAR DROPDOWN FUNCTIONS
  // ============================================
  
  /**
   * Find the sidebar language dropdown button: the first <button> whose trimmed
   * text is exactly one of DROPDOWN_LANGUAGES. Returns null when none matches.
   */
  function getDropdownButton() {
    const candidates = Array.from(document.querySelectorAll('button'));
    const match = candidates.find((candidate) => {
      const label = (candidate.textContent || '').trim();
      return DROPDOWN_LANGUAGES.includes(label);
    });
    return match || null;
  }
  
  function getDropdownMenu() {
    return document.querySelector('menu[role="menu"], [role="menu"]');
  }
  
  /**
   * Write `newText` into the <p> inside the sidebar language dropdown button.
   * Silently does nothing when the button or its <p> cannot be found.
   */
  function updateButtonText(newText) {
    const button = getDropdownButton();
    const label = button ? button.querySelector('p') : null;
    if (label) {
      label.textContent = newText;
    }
  }
  
  /**
   * Make the check mark in the open dropdown menu follow currentSelectedLanguage.
   * Existing check icons are shown or hidden through inline opacity/visibility.
   * If the selected entry has no icon of its own, a clone of another entry's
   * icon is appended to it (once).
   */
  function updateDropdownCheckIndicator() {
    const menu = getDropdownMenu();
    if (!menu) return;

    const entriesByLanguage = new Map();
    // Last check icon seen in the menu; used as the template for cloning.
    let templateIcon = null;

    menu.querySelectorAll('a, [role="menuitem"]').forEach((entry) => {
      const label = (entry.textContent || '').trim();
      const icon = entry.querySelector('.lucide-check, [class*="lucide-check"], svg[class*="check"]');
      // The first language (in DROPDOWN_LANGUAGES order) contained in the label wins.
      const language = DROPDOWN_LANGUAGES.find((name) => label.includes(name));
      if (language === undefined) return;

      entriesByLanguage.set(language, { item: entry, checkIcon: icon });
      if (icon) {
        templateIcon = icon;
      }
    });

    entriesByLanguage.forEach(({ item, checkIcon }, language) => {
      const isCurrent = language === currentSelectedLanguage;

      if (checkIcon) {
        checkIcon.style.opacity = isCurrent ? '1' : '0';
        checkIcon.style.visibility = isCurrent ? 'visible' : 'hidden';
        return;
      }
      if (!isCurrent || !templateIcon) return;

      const clone = templateIcon.cloneNode(true);
      clone.style.opacity = '1';
      clone.style.visibility = 'visible';

      const host = item.querySelector('span:last-child') || item;
      // Guard against appending a second check mark to the same entry.
      if (host.querySelector('.lucide-check, [class*="lucide-check"]') === null) {
        host.appendChild(clone);
      }
    });
  }
  
  // ============================================
  // CODE BLOCK LANGUAGE SELECTOR FUNCTIONS
  // ============================================
  
  function simulateClick(element) {
    if (!element) return;
    const rect = element.getBoundingClientRect();
    const x = rect.left + rect.width / 2;
    const y = rect.top + rect.height / 2;
    
    ['pointerdown', 'mousedown', 'pointerup', 'mouseup', 'click'].forEach(eventType => {
      const EventClass = eventType.startsWith('pointer') ? PointerEvent : MouseEvent;
      element.dispatchEvent(new EventClass(eventType, {
        view: window, bubbles: true, cancelable: true,
        clientX: x, clientY: y, button: 0, buttons: 1,
        isPrimary: true, pointerType: 'mouse'
      }));
    });
  }
  
  /**
   * Find the first code block language selector on the page.
   * A selector is a <p> whose trimmed text is one of CODE_BLOCK_LANGUAGES and
   * whose closest <div> ancestor contains a `.lucide-chevrons-up-down` icon.
   * Returns `{ element, language }` (the div and the displayed language) or null.
   */
  function getCodeBlockLanguageDropdown() {
    for (const label of document.querySelectorAll('p')) {
      const language = (label.textContent || '').trim();
      if (!CODE_BLOCK_LANGUAGES.includes(language)) continue;

      const container = label.closest('div');
      if (!container || !container.querySelector('.lucide-chevrons-up-down')) continue;

      return { element: container, language: language };
    }
    return null;
  }
  
  /**
   * Poll, one animation frame at a time, for an opened menu option whose text is
   * exactly `targetLanguage`, and click it once found.
   * After more than 30 attempts the selection is abandoned: the body is clicked,
   * the `stagehand-selecting` class is removed and `isSelecting` is reset.
   *
   * @param targetLanguage label of the option to select
   * @param attempts number of polls already performed (internal)
   */
  function waitForCodeBlockMenuAndSelect(targetLanguage, attempts = 0) {
    const retryNextFrame = () => {
      requestAnimationFrame(() => waitForCodeBlockMenuAndSelect(targetLanguage, attempts + 1));
    };

    if (attempts > 30) {
      // Give up and restore the normal (non-hidden) menu state.
      document.body.classList.remove('stagehand-selecting');
      document.body.click();
      isSelecting = false;
      return;
    }

    const options = Array.from(document.querySelectorAll('[role="menuitem"], [role="option"]'));
    const wanted = options.find((option) => (option.textContent || '').trim() === targetLanguage);

    if (!wanted) {
      // Either the menu has not rendered yet or it does not (yet) list the target.
      retryNextFrame();
      return;
    }

    simulateClick(wanted);
    onNextFrame(() => {
      document.body.classList.remove('stagehand-selecting');
      isSelecting = false;
    });
  }

  /**
   * Switch the page's code block language selector to `targetLanguage` by
   * simulating a click on it and then on the matching menu option.
   * Skipped when a selection is already running, when no selector exists, or
   * when the selector already shows the target language.
   */
  function selectCodeBlockLanguage(targetLanguage) {
    if (isSelecting) return;

    const dropdown = getCodeBlockLanguageDropdown();
    const needsChange = Boolean(dropdown) && dropdown.language !== targetLanguage;
    if (!needsChange) return;

    // Mark the selection as in flight; the body class hides the menu while it is driven.
    isSelecting = true;
    document.body.classList.add('stagehand-selecting');
    simulateClick(dropdown.element);
    requestAnimationFrame(() => waitForCodeBlockMenuAndSelect(targetLanguage));
  }

  /**
   * Align the code block language selector with the selected sidebar language,
   * using LANGUAGE_MAP to translate between the two label sets.
   */
  function syncCodeBlockLanguage() {
    const target = LANGUAGE_MAP[currentSelectedLanguage];
    if (!target) return;
    selectCodeBlockLanguage(target);
  }
  
  // ============================================
  // EVENT HANDLERS & OBSERVERS
  // ============================================
  
  /**
   * Watch the whole body for child-list changes and, whenever a menu is present,
   * refresh its check indicator immediately and again two frames later.
   */
  function setupDropdownMenuObserver() {
    const refreshWhenMenuPresent = () => {
      if (!getDropdownMenu()) return;
      updateDropdownCheckIndicator();
      onNextFrame(updateDropdownCheckIndicator);
    };

    const menuObserver = new MutationObserver(refreshWhenMenuPresent);
    menuObserver.observe(document.body, { subtree: true, childList: true });
  }
  
  /**
   * Install a capture-phase click listener that reacts to clicks on language
   * entries of the sidebar dropdown menu. It records the choice, updates the
   * dependent UI, persists the choice in sessionStorage and then either
   * navigates to the language's landing page or syncs the current page.
   */
  function setupMenuClickHandler() {
    const handleClick = (event) => {
      // Only links inside a menu are of interest.
      const link = event.target.closest('[role="menu"] a, menu a');
      if (!link) return;

      const label = (link.textContent || '').trim();
      const chosen = DROPDOWN_LANGUAGES.find((candidate) => label.includes(candidate));
      if (chosen === undefined) return;

      currentSelectedLanguage = chosen;

      // Reflect the choice right away: check mark, version switcher, SDK entries.
      updateDropdownCheckIndicator();
      updateVersionSwitcherVisibility();
      updateSDKReferenceVisibility();

      try {
        sessionStorage.setItem('stagehand-selected-language', chosen);
      } catch (err) {
        // Storage may be unavailable; the selection then lasts for this page only.
      }

      // Navigate unless the current path (trailing slash ignored) already ends
      // with the landing page of the chosen language.
      const landingPath = NAVIGATION_MAP[chosen];
      const currentPath = window.location.pathname.replace(/\/$/, '');
      if (landingPath && !currentPath.endsWith(landingPath)) {
        event.preventDefault();
        event.stopPropagation();
        window.location.href = landingPath;
        return;
      }

      // Staying on this page: fix up the button label and the code block
      // selector once the menu has closed.
      onNextFrame(() => updateButtonText(chosen));
      onNextFrame(syncCodeBlockLanguage);
    };

    document.addEventListener('click', handleClick, true);
  }
  
  /**
   * Re-apply the language stored in sessionStorage, if it is a known one, and
   * in every case refresh version switcher and SDK entry visibility two frames
   * later. Errors raised while restoring are swallowed.
   */
  function restoreLanguageSelection() {
    const applyVisibility = () => {
      updateVersionSwitcherVisibility();
      updateSDKReferenceVisibility();
    };

    try {
      const saved = sessionStorage.getItem('stagehand-selected-language');
      const isKnown = Boolean(saved) && DROPDOWN_LANGUAGES.includes(saved);
      if (isKnown) {
        currentSelectedLanguage = saved;
        updateButtonText(saved);
        applyVisibility();
        onNextFrame(syncCodeBlockLanguage);
      }
    } catch (err) {
      // Best effort only: keep the current language when restoring fails.
    }

    // Runs regardless of whether a stored language was found.
    onNextFrame(applyVisibility);
  }
  
  /**
   * Watch the body for child-list changes and repair state that a re-render
   * may have reset: the dropdown button label, the version switcher marker
   * class and the visibility of SDK sidebar entries.
   */
  function setupPageChangeObserver() {
    // True while an SDK visibility refresh is already scheduled.
    let sdkRefreshQueued = false;

    const syncButtonLabel = () => {
      const button = getDropdownButton();
      if (!button) return;

      const shown = (button.textContent || '').trim();
      if (shown !== currentSelectedLanguage && DROPDOWN_LANGUAGES.includes(currentSelectedLanguage)) {
        updateButtonText(currentSelectedLanguage);
      }
    };

    const retagVersionSwitcher = () => {
      // A switcher without the marker class has not been processed yet.
      const switcher = getVersionSwitcher();
      if (switcher && !switcher.classList.contains('stagehand-version-switcher')) {
        updateVersionSwitcherVisibility();
      }
    };

    const refreshSdkEntries = () => {
      const unprocessed = document.querySelectorAll('li[id^="/v3/sdk/"]:not(.stagehand-sdk-processed)');
      if (unprocessed.length === 0 || sdkRefreshQueued) return;

      // Coalesce bursts of mutations into a single refresh.
      sdkRefreshQueued = true;
      onNextFrame(() => {
        updateSDKReferenceVisibility();
        for (const entry of document.querySelectorAll('li[id^="/v3/sdk/"]')) {
          entry.classList.add('stagehand-sdk-processed');
        }
        sdkRefreshQueued = false;
      });
    };

    const observer = new MutationObserver(() => {
      syncButtonLabel();
      retagVersionSwitcher();
      refreshSdkEntries();
    });

    observer.observe(document.body, { subtree: true, childList: true });
  }
  
  /**
   * Watch the body for child-list changes and, each time a different code block
   * language selector element shows up, switch it to the language mapped from
   * the current sidebar selection.
   */
  function setupCodeBlockObserver() {
    // Selector element seen by the previous handled mutation.
    let syncedDropdown = null;

    const handleMutations = () => {
      const found = getCodeBlockLanguageDropdown();
      if (!found || found.element === syncedDropdown) return;
      syncedDropdown = found.element;

      const desired = LANGUAGE_MAP[currentSelectedLanguage];
      if (desired && found.language !== desired) {
        onNextFrame(() => selectCodeBlockLanguage(desired));
      }
    };

    const observer = new MutationObserver(handleMutations);
    observer.observe(document.body, { subtree: true, childList: true });
  }
  
  // ============================================
  // INITIALIZATION
  // ============================================

  /**
   * Wire up the click handler and the three observers, then restore the stored
   * language and apply the initial visibility state.
   */
  function init() {
    const installers = [
      setupMenuClickHandler,
      setupDropdownMenuObserver,
      setupPageChangeObserver,
      setupCodeBlockObserver
    ];
    installers.forEach((install) => install());

    restoreLanguageSelection();
    updateVersionSwitcherVisibility();
    updateSDKReferenceVisibility();
  }

  // Run init() right away when the document has already been parsed; otherwise
  // wait for DOMContentLoaded.
  if (document.readyState !== 'loading') {
    init();
  } else {
    document.addEventListener('DOMContentLoaded', init);
  }

  // Detect client-side navigation: on any body mutation compare the current URL
  // with the last one seen, and re-apply the language state when it changed.
  let lastUrl = location.href;
  const urlObserver = new MutationObserver(() => {
    if (location.href === lastUrl) return;
    lastUrl = location.href;

    // Clear the processed marker so the SDK entries are evaluated again.
    for (const entry of document.querySelectorAll('li[id^="/v3/sdk/"].stagehand-sdk-processed')) {
      entry.classList.remove('stagehand-sdk-processed');
    }

    onNextFrame(() => {
      restoreLanguageSelection();
      syncCodeBlockLanguage();
      updateVersionSwitcherVisibility();
      updateSDKReferenceVisibility();
    });
  });
  urlObserver.observe(document.body, { subtree: true, childList: true });
})();


================================================
FILE: packages/docs/package.json
================================================
{
  "name": "@browserbasehq/stagehand-docs",
  "version": "1.0.0",
  "description": "",
  "type": "module",
  "main": "index.js",
  "scripts": {
    "dev": "mintlify dev --no-open --port 3002",
    "upgrade": "mintlify upgrade",
    "sync-sdk": "node scripts/sync-sdk-docs.js"
  },
  "keywords": [],
  "author": "",
  "license": "ISC",
  "dependencies": {
    "mintlify": "^4.2.47",
    "zod": "^4.2.1"
  },
  "packageManager": "pnpm@9.15.0+sha512.76e2379760a4328ec4415815bcd6628dee727af3779aaa4c914e3944156c4299921a89f976381ee107d41f12cfa4b66681ca9c718f0668fa0831ed4c6d8ba56c"
}


================================================
FILE: packages/docs/scripts/runtimePaths.js
================================================
/**
 * Keep this file in sync with:
 * - /packages/core/lib/v3/runtimePaths.ts
 * - /packages/server-v3/scripts/runtimePaths.ts
 * - /packages/server-v4/scripts/runtimePaths.ts
 * - /packages/evals/runtimePaths.ts
 * - /packages/docs/scripts/runtimePaths.js
 */
import path from "node:path";
import { fileURLToPath } from "node:url";

// Path fragment that marks a file as belonging to this package. It is matched
// against normalized paths, which always use forward slashes.
const PACKAGE_SEGMENT = "/packages/docs/";
// File names that are never treated as a caller's file.
// NOTE(review): presumably the pseudo file names Node reports for `--eval` code — confirm.
const EVAL_FRAMES = new Set(["[eval]", "[eval]-wrapper"]);
// Names of this module's own functions. Stack frames belonging to them are
// skipped when looking for the caller, so these entries must match the
// function names defined below.
const INTERNAL_FRAME_NAMES = new Set([
  "readCallsites",
  "readCallsitePath",
  "resolveCallerFilePath",
  "getCurrentFilePath",
  "getCurrentDirPath",
  "getRepoRootDir",
  "isMainModule",
]);

const normalizePath = (value) => {
  const input = value.startsWith("file://") ? fileURLToPath(value) : value;
  return path.resolve(input).replaceAll("\\", "/");
};

// Capture the current call stack as the structured callsite array rather than
// as a formatted string.
const readCallsites = () => {
  const previousPrepare = Error.prepareStackTrace;
  try {
    // Returning the second argument unchanged makes `.stack` evaluate to the
    // callsite array itself.
    Error.prepareStackTrace = (_, stack) => stack;
    return new Error().stack ?? [];
  } finally {
    // Always put the previous hook back, even if reading the stack threw.
    Error.prepareStackTrace = previousPrepare;
  }
};

// Return the normalized file path of a callsite, or null when the callsite has
// no usable path (missing, a `node:` built-in, or an eval pseudo file).
const readCallsitePath = (callsite) => {
  const fileName = callsite.getFileName?.();
  const rawPath = fileName ?? callsite.getScriptNameOrSourceURL?.();

  const unusable =
    !rawPath || rawPath.startsWith("node:") || EVAL_FRAMES.has(rawPath);
  return unusable ? null : normalizePath(rawPath);
};

// Decide whether a callsite belongs to one of this module's own functions,
// judged by its function name, its method name, or — as a last resort — by
// the frame's string form mentioning "<name> (".
const isInternalCallsite = (callsite) => {
  const isInternalName = (name) =>
    Boolean(name) && INTERNAL_FRAME_NAMES.has(name);

  if (isInternalName(callsite.getFunctionName?.())) return true;
  if (isInternalName(callsite.getMethodName?.())) return true;

  const rendered = callsite.toString?.() ?? "";
  return [...INTERNAL_FRAME_NAMES].some(
    (frameName) =>
      rendered.includes(`${frameName} (`) ||
      rendered.includes(`.${frameName} (`),
  );
};

// Walk the current call stack and return the file path of the nearest frame
// that is not one of this module's own functions. Frames located inside this
// package are preferred over frames from anywhere else.
// Throws when no frame yields a usable path.
const resolveCallerFilePath = () => {
  const packageCandidates = [];
  const fallbackCandidates = [];

  for (const callsite of readCallsites()) {
    const filePath = readCallsitePath(callsite);
    // Frames without a usable path (built-ins, eval) cannot be the caller.
    if (!filePath) continue;
    // Skip this module's own helper frames; they are filtered by name.
    if (isInternalCallsite(callsite)) continue;
    if (filePath.includes(PACKAGE_SEGMENT)) {
      packageCandidates.push(filePath);
      continue;
    }
    fallbackCandidates.push(filePath);
  }

  // Candidates are collected in stack order, so index 0 is the innermost frame.
  const packageCandidate = packageCandidates[0];
  if (packageCandidate) return packageCandidate;

  const fallbackCandidate = fallbackCandidates[0];
  if (fallbackCandidate) return fallbackCandidate;

  throw new Error("Unable to resolve caller file path.");
};

// Normalized absolute path of the file that called this function, as resolved
// from the call stack.
export const getCurrentFilePath = () => resolveCallerFilePath();

// Directory containing the file that called this function.
export const getCurrentDirPath = () => path.dirname(getCurrentFilePath());

// Repository root, derived from the caller's file path: everything before the
// last occurrence of PACKAGE_SEGMENT. Throws when the caller's path does not
// contain that segment.
export const getRepoRootDir = () => {
  const currentFilePath = getCurrentFilePath();
  const index = currentFilePath.lastIndexOf(PACKAGE_SEGMENT);
  if (index === -1) {
    throw new Error(
      `Unable to determine repo root from ${currentFilePath} (missing ${PACKAGE_SEGMENT}).`,
    );
  }
  return currentFilePath.slice(0, index);
};

// True when the calling file is the script Node was started with, i.e. when its
// path equals the normalized process.argv[1]. False when there is no argv[1].
export const isMainModule = () => {
  const entryScript = process.argv.at(1);
  if (!entryScript) return false;
  return normalizePath(entryScript) === getCurrentFilePath();
};


================================================
FILE: packages/docs/scripts/sync-sdk-docs.js
================================================
#!/usr/bin/env node

/**
 * Script to sync SDK documentation from GitHub READMEs
 * 
 * Usage: node scripts/sync-sdk-docs.js
 * 
 * This script fetches README.md files from each language SDK repo
 * and generates MDX files for the docs.
 */

import fs from "node:fs";
import path from "node:path";
import https from "node:https";
import { getCurrentDirPath } from "./runtimePaths.js";

const currentDir = getCurrentDirPath();

// SDK repos configuration, keyed by language.
//   repo        - GitHub "owner/name" the README is fetched from
//   title       - frontmatter title, also used in the "synced from" note
//   description - frontmatter description
//   outputPath  - generated MDX file, relative to the parent of this script's directory
const SDK_REPOS = {
  java: {
    repo: 'browserbase/stagehand-java',
    title: 'Java SDK',
    description: 'Official Stagehand SDK for Java',
    outputPath: 'v3/sdk/java.mdx'
  },
  python: {
    repo: 'browserbase/stagehand-python',
    title: 'Python SDK',
    description: 'Official Stagehand SDK for Python',
    outputPath: 'v3/sdk/python.mdx'
  },
  ruby: {
    repo: 'browserbase/stagehand-ruby',
    title: 'Ruby SDK',
    description: 'Official Stagehand SDK for Ruby',
    outputPath: 'v3/sdk/ruby.mdx'
  },
  go: {
    repo: 'browserbase/stagehand-go',
    title: 'Go SDK',
    description: 'Official Stagehand SDK for Go',
    outputPath: 'v3/sdk/go.mdx'
  }
};

/**
 * Fetch the body of an HTTPS URL as a UTF-8 string.
 *
 * Redirects (301, 302, 303, 307, 308) are followed, with a relative `Location`
 * resolved against the URL that produced it. Any other non-200 status rejects.
 *
 * @param {string} url - URL to fetch
 * @param {number} [redirectsLeft=5] - how many more redirects may be followed
 * @returns {Promise<string>} the response body
 */
function fetchUrl(url, redirectsLeft = 5) {
  return new Promise((resolve, reject) => {
    https.get(url, {
      headers: {
        'User-Agent': 'Stagehand-Docs-Sync'
      }
    }, (res) => {
      const status = res.statusCode;

      // Handle redirects
      if ([301, 302, 303, 307, 308].includes(status)) {
        // Discard the redirect body so the connection is released.
        res.resume();

        const location = res.headers.location;
        if (!location) {
          reject(new Error(`HTTP ${status} without Location header: ${url}`));
          return;
        }
        if (redirectsLeft <= 0) {
          reject(new Error(`Too many redirects: ${url}`));
          return;
        }

        // Location may be relative; resolve it against the current URL.
        const nextUrl = new URL(location, url).toString();
        fetchUrl(nextUrl, redirectsLeft - 1).then(resolve, reject);
        return;
      }

      if (status !== 200) {
        res.resume();
        reject(new Error(`HTTP ${res.statusCode}: ${url}`));
        return;
      }

      // Decode as a stream so a multi-byte character split across two chunks
      // is not corrupted by per-chunk string conversion.
      res.setEncoding('utf8');

      let data = '';
      res.on('data', chunk => data += chunk);
      res.on('end', () => resolve(data));
      res.on('error', reject);
    }).on('error', reject);
  });
}

/**
 * Process README content for MDX compatibility.
 *
 * Strips HTML comments, badge/picture markup and stray images, converts
 * `<code>` tags to backticks, rewrites relative links to absolute GitHub links
 * for `config.repo`, and drops the README's leading H1 (the generated
 * frontmatter supplies the title).
 *
 * @param {string} content - raw README markdown
 * @param {{ repo: string }} config - SDK config; `repo` is "owner/name"
 * @returns {string} the cleaned, trimmed markdown
 */
function processReadmeContent(content, config) {
  let processed = content;
  
  // Remove HTML comments
  processed = processed.replace(/<!--[\s\S]*?-->/g, '');
  
  // Remove entire HTML blocks with picture/source tags (badge sections)
  processed = processed.replace(/<div[^>]*>[\s\S]*?<\/div>/gi, '');
  processed = processed.replace(/<p[^>]*align[^>]*>[\s\S]*?<\/p>/gi, '');
  processed = processed.replace(/<picture>[\s\S]*?<\/picture>/gi, '');
  
  // Remove standalone HTML tags
  processed = processed.replace(/<a[^>]*>[\s]*<img[^>]*>[\s]*<\/a>/gi, '');
  processed = processed.replace(/<img[^>]*badge[^>]*>/gi, '');
  processed = processed.replace(/<img[^>]*shields\.io[^>]*>/gi, '');
  processed = processed.replace(/<a[^>]*>\s*<picture>[\s\S]*?<\/picture>\s*<\/a>/gi, '');
  
  // Remove badge images in markdown format
  processed = processed.replace(/^\s*(\[!\[.*?\]\(.*?\)\]\(.*?\)\s*)+/gm, '');
  processed = processed.replace(/^\s*!\[.*?\]\(https:\/\/.*?badge.*?\)\s*/gm, '');
  processed = processed.replace(/\[!\[.*?\]\(.*?badge.*?\)\]\(.*?\)/g, '');
  
  // Remove standalone anchor img tags
  processed = processed.replace(/<a[^>]*href[^>]*><img[^>]*><\/a>/gi, '');
  
  // Clean up <code> tags with backticks inside (common in Go docs)
  processed = processed.replace(/<code>\\`([^`]*?)\\`<\/code>/g, '`$1`');
  processed = processed.replace(/<code>`([^`]*?)`<\/code>/g, '`$1`');
  processed = processed.replace(/<code>([^<]*?)<\/code>/g, '`$1`');
  
  // Fix malformed links with parentheses in URL (Go docs issue)
  processed = processed.replace(/\[([^\]]+)\]\(([^)]+)\(([^)]+)\)([^)]*)\)/g, '[$1]($2)');
  
  // Convert relative links to absolute GitHub links
  const repoUrl = `https://github.com/${config.repo}`;
  processed = processed.replace(/\]\((?!http)(?!#)(?!mailto)([^)]+)\)/g, `](${repoUrl}/blob/main/$1)`);
  
  // Fix code block language hints for MDX
  processed = processed.replace(/```kotlin/g, '```java');
  
  // Remove the first H1 if it exists (we'll add our own title).
  // The removals above can leave blank lines in front of the title, so leading
  // whitespace is skipped; otherwise the H1 would survive and duplicate the
  // frontmatter title.
  processed = processed.replace(/^\s*#\s+.*\n+/, '');
  
  // Clean up excessive newlines
  processed = processed.replace(/\n{4,}/g, '\n\n\n');
  
  // Remove any remaining inline HTML img tags
  processed = processed.replace(/<img[^>]*>/gi, '');
  
  // Remove any remaining <a> tags that are empty or just whitespace
  processed = processed.replace(/<a[^>]*>\s*<\/a>/gi, '');
  
  // Clean up lines that are just whitespace
  processed = processed.replace(/^\s+$/gm, '');
  
  return processed.trim();
}

/**
 * Build the header of a generated SDK page: YAML frontmatter with title and
 * description, followed by a <Note> that links to the source repository and a
 * trailing blank line.
 */
function generateFrontmatter(config) {
  const { title, description, repo } = config;
  const lines = [
    '---',
    `title: "${title}"`,
    `description: "${description}"`,
    '---',
    '',
    '<Note>',
    `  This documentation is automatically synced from the [${title} GitHub repository](https://github.com/${repo}).`,
    '</Note>',
    '',
    '',
  ];
  return lines.join('\n');
}

/**
 * Fetch one SDK's README from the `main` branch of its GitHub repo, convert it
 * to MDX and write it to the configured output path.
 *
 * @returns {Promise<boolean>} true on success; false when any step failed (the
 *   error is logged, not thrown)
 */
async function syncSdk(language, config) {
  const { repo, outputPath } = config;
  const rawUrl = `https://raw.githubusercontent.com/${repo}/main/README.md`;
  
  console.log(`Fetching ${language} SDK docs from ${rawUrl}...`);
  
  try {
    const readme = await fetchUrl(rawUrl);
    const body = processReadmeContent(readme, config);
    const mdxContent = generateFrontmatter(config) + body;
    
    // Output paths are relative to the parent of this script's directory.
    const outputFile = `${currentDir}/../${outputPath}`;
    const outputDir = path.dirname(outputFile);
    if (!fs.existsSync(outputDir)) {
      fs.mkdirSync(outputDir, { recursive: true });
    }
    
    fs.writeFileSync(outputFile, mdxContent, 'utf8');
    
    console.log(`✓ ${language} SDK docs written to ${outputPath}`);
    return true;
  } catch (error) {
    console.error(`✗ Failed to sync ${language} SDK: ${error.message}`);
    return false;
  }
}

/**
 * Sync every SDK in SDK_REPOS concurrently, print a summary, and exit with
 * status 1 when at least one SDK failed to sync.
 */
async function main() {
  console.log('Syncing SDK documentation from GitHub...\n');
  
  const pending = [];
  for (const [lang, config] of Object.entries(SDK_REPOS)) {
    pending.push(syncSdk(lang, config));
  }
  const outcomes = await Promise.all(pending);
  
  const totalCount = outcomes.length;
  const successCount = outcomes.filter((succeeded) => Boolean(succeeded)).length;
  
  console.log(`\nDone! ${successCount}/${totalCount} SDKs synced successfully.`);
  
  if (successCount !== totalCount) {
    process.exit(1);
  }
}

// Run the sync; anything that escapes main() is logged and turned into exit status 1.
const reportFatalError = (error) => {
  console.error('Fatal error:', error);
  process.exit(1);
};

main().catch(reportFatalError);


================================================
FILE: packages/docs/snippets/excalidraw.mdx
================================================
export const Excalidraw = ({ url, className = "w-full" }) => {
	// Two embeds of the same drawing, one per colour scheme. Each sits in a wrapper
	// whose `dark:` utility classes are meant to show only the matching variant.
	const lightSrc = url + `?darkMode=false`;
	const darkSrc = url + `?darkMode=true`;
	return (
		<>
			<div className="dark:hidden">
				<iframe src={lightSrc} className={className} allowFullScreen />
			</div>
			<div className="hidden dark:block">
				<iframe src={darkSrc} className={className} allowFullScreen />
			</div>
		</>
	);
};

================================================
FILE: packages/docs/snippets/v3-banner.mdx
================================================
{/* 
  V3Banner - Currently a no-op component
  
  This component is imported across 50+ pages in v3 docs.
  Keeping it as a no-op rather than removing allows us to easily 
  add a new banner message in the future without editing every file.
  
  To add a banner, replace the null return with your JSX content.
*/}
export const V3Banner = () => {
  // Intentionally renders nothing; swap the null for JSX when a banner is needed.
  return null;
};


================================================
FILE: packages/docs/v2/basics/act.mdx
================================================
---
title: Act
description: 'Interact with a web page'
---

## What is `act()`?
``` typescript
page.act("click on add to cart")
```
`act` enables Stagehand to perform **individual** actions on a web page. Use it to build self-healing and deterministic automations that adapt to website changes. 

## Why use `act()`?

<CardGroup cols={2}>
  <Card title="Natural Language Instructions" icon="wand-magic-sparkles" href="#using-act">
    Write automation in plain English. No selectors or complex syntax.
  </Card>
  <Card title="Precise Control" icon="crosshairs" href="#best-practices">
    Build automations step by step. Define exactly what happens at every moment.
  </Card>
  <Card title="Self-Healing" icon="bandage" href="#ensure-reliable-actions">
    Actions automatically adapt when websites change.
  </Card>
  <Card title="Caching" icon="repeat" href="#reduce-model-costs">
    Cache actions to avoid LLM calls and ensure consistent execution across runs.
  </Card>
</CardGroup>

## Using `act()`

Use `act` to perform single actions in your automation. Here's how to click a button:

<CodeGroup>
```typescript TypeScript
await page.goto("https://example-store.com");
await page.act("click the add to cart button");
```

```python Python
await page.goto("https://example-store.com")
await page.act("click the add to cart button")
```
</CodeGroup>

With `act`, breaking complex actions into small, single-step actions works best. If you need to orchestrate multi-step flows, use multiple `act` commands or `agent`.

<Accordion title="Suggested actions">

| Action | Example instruction |
|--------|---------------------|
| Click | `click the button` |
| Fill | `fill the field with <value>` |
| Type | `type <text> into the search box` |
| Press | `press <key> in the search field` |
| Scroll | `scroll to <position>` |
| Select from dropdown | `select <value> from the dropdown` |
</Accordion>

<Tabs>
<Tab title="Do this">
Break your task into single-step actions.

<CodeGroup>
```typescript TypeScript
// Break it into single-step actions
await page.act("open the filters panel");
await page.act("choose 4-star rating");
await page.act("click the apply button");
```

```python Python
# Break it into single-step actions
await page.act("open the filters panel")
await page.act("choose 4-star rating")
await page.act("click the apply button")
```
</CodeGroup>
</Tab>

<Tab title="Don't do this">
For multi-step tasks, use [`agent()`](/v2/basics/agent) instead.

<CodeGroup>
```typescript TypeScript
// Too complex - trying to do multiple things at once
await page.act("open the filters panel, choose 4-star rating, and click apply");
```

```python Python
# Too complex - trying to do multiple things at once
await page.act("open the filters panel, choose 4-star rating, and click apply")
```
</CodeGroup>
</Tab>
</Tabs>

### Advanced Configuration

For advanced scenarios, you can configure additional options:

<CodeGroup>
```typescript TypeScript
// Dynamic food search with advanced options
const foodItem = "organic quinoa";

await page.act({
  action: "Type %foodItem% in the search box and press enter",
  variables: {
    foodItem: foodItem
  },
  modelName: "google/gemini-2.5-pro",
  modelClientOptions: {
    modelApiKey: process.env.GOOGLE_API_KEY,
  },
  iframes: true, // Search within iframes if needed
  domSettleTimeoutMs: 45000, // Wait longer for dynamic content
  timeoutMs: 60000 // Extended timeout for slow-loading forms
});
```

```python Python
# Dynamic food search with advanced options
food_item = "organic quinoa"

await page.act({
  "action": "Type %foodItem% in the search box and press enter",
  "variables": {
    "foodItem": food_item
  },
  "modelName": "google/gemini-2.5-pro",
  "modelClientOptions": {
    "modelApiKey": os.environ.get("GOOGLE_API_KEY")
  },
  "iframes": True, # Search within iframes if needed
  "domSettleTimeoutMs": 45000, # Wait longer for dynamic content
  "timeoutMs": 60000 # Extended timeout for slow-loading forms
})
```
</CodeGroup>
  
<Note>
Shadow DOM support is now available! Set `experimental: true` in your Stagehand configuration to enable it. See the [configuration guide](/v2/configuration/browser) for more details.
</Note>


## Best practices

### Ensure reliable actions

Use `observe()` to discover candidate actions on the current page and plan reliably. It returns a list of suggested actions (with selector, description, method, and arguments). You can pass an observed action directly to `act` to execute it.

<CodeGroup>
```typescript TypeScript
const [action] = await page.observe("click the login button");

if (action) {
  await page.act(action);
}
```

```python Python
results = await page.observe("click the login button")

if results:
    await page.act(results[0])
```
</CodeGroup>

<Card title="Analyze pages with observe()" icon="magnifying-glass" iconType="sharp-solid" href="/v2/basics/observe">
  Plan actions with `observe()` before executing with `act`.
</Card>

### Reduce model costs

Cache observed actions to avoid repeated LLM calls and ensure consistent execution.

<CodeGroup>
```typescript TypeScript
// Cost-optimized actions with caching
const actionCache = new Map();

const getCachedAction = async (instruction: string) => {
  if (actionCache.has(instruction)) {
    return actionCache.get(instruction);
  }
  
  const [action] = await page.observe(instruction);
  actionCache.set(instruction, action);
  return action;
};

// Reuse cached actions
const loginAction = await getCachedAction("click the login button");
await page.act(loginAction);
```

```python Python
# Cost-optimized actions with caching
action_cache = {}

async def get_cached_action(instruction: str):
    if instruction in action_cache:
        return action_cache[instruction]
    
    results = await page.observe(instruction)
    if results:
        action = results[0]
        action_cache[instruction] = action
        return action
    
    return None

# Reuse cached actions
login_action = await get_cached_action("click the login button")
if login_action:
    await page.act(login_action)
```
</CodeGroup>

<Card title="Complete caching guide" icon="database" iconType="sharp-solid" href="/v2/best-practices/caching">
  Learn advanced caching techniques and patterns for optimal performance.
</Card>

### Secure your automations

Variables will not be shared with LLM providers. Use them for passwords, API keys, and other sensitive data.


<Note>
Load sensitive data from environment variables using `.env` files. Never hardcode API keys, passwords, or other secrets directly in your code.
</Note>

<CodeGroup>
```typescript TypeScript
await page.act({
  action: "enter %username% in the email field",
  variables: {
    username: "user@example.com"
  }
});

await page.act({
  action: "enter %password% in the password field",
  variables: {
    password: process.env.USER_PASSWORD
  }
});
```

```python Python
# If using Python, set `use_api: true` in your Stagehand configuration

await page.act(
  "enter %username% in the email field",
  variables={
      "username": "user@example.com"
  }
)

await page.act(
  "enter %password% in the password field",
  variables={
      "password": os.environ.get("USER_PASSWORD")
  }
)
```
</CodeGroup>

<Warning>
When handling sensitive data, set `verbose: 0` in your Stagehand configuration to prevent secrets from appearing in logs. See the [configuration guide](/v2/configuration/browser) for more details.
</Warning>

<Card title="User Data Best Practices" icon="shield-check" iconType="sharp-solid" href="/v2/best-practices/user-data">
  Complete guide to securing your browser automations with best practices and configurations.
</Card>

## Troubleshooting

<AccordionGroup>


<Accordion title="Method not supported">
**Problem**: `act` fails with "method not supported" error

**Solutions**:
- Use clear and detailed instructions for what you want to accomplish
- Review our [evals](https://stagehand.dev/evals) to find the best models for your use case
- Use [`observe()`](/v2/basics/observe) and verify the resulting action is within a list of expected actions

**Solution 1: Validate with observe**

<CodeGroup>
```typescript TypeScript
const prompt = "click the submit button";
const expectedMethod = "click";

try {
  await page.act(prompt);
} catch (error) {
  if (error.message.includes("method not supported")) {
    // Observe the same prompt to get the planned action
    const [action] = await page.observe(prompt);
    
    if (action && action.method === expectedMethod) {
      await page.act(action);
    } else {
      throw new Error(`Unsupported method: expected "${expectedMethod}", got "${action?.method}"`);
    }
  } else {
    throw error;
  }
}
```

```python Python
prompt = "click the submit button"
expected_method = "click"

try:
    await page.act(prompt)
except Exception as error:
    if "method not supported" in str(error):
        # Observe the same prompt to get the planned action
        results = await page.observe(prompt)
        
        if results and results[0].method == expected_method:
            await page.act(results[0])
        else:
            method = results[0].method if results else "unknown"
            raise Exception(f'Unsupported method: expected "{expected_method}", got "{method}"')
    else:
        raise error
```
</CodeGroup>

**Solution 2: Retry with exponential backoff**

<CodeGroup>
```typescript TypeScript
// Retry with exponential backoff for intermittent issues
const prompt = "click the submit button";
const maxRetries = 3;

for (let attempt = 0; attempt <= maxRetries; attempt++) {
  try {
    await page.act(prompt, { timeoutMs: 10000 + (attempt * 5000) });
    break; // Success, exit retry loop
  } catch (error) {
    if (error.message.includes("method not supported") && attempt < maxRetries) {
      // Exponential backoff: wait 2^attempt seconds
      const delay = Math.pow(2, attempt) * 1000;
      console.log(`Retry ${attempt + 1}/${maxRetries} after ${delay}ms`);
      await new Promise(resolve => setTimeout(resolve, delay));
    } else {
      throw error;
    }
  }
}
```

```python Python
# Retry with exponential backoff for intermittent issues
import asyncio

prompt = "click the submit button"
max_retries = 3

for attempt in range(max_retries + 1):
    try:
        timeout = 10000 + (attempt * 5000)
        await page.act(prompt, {"timeoutMs": timeout})
        break  # Success, exit retry loop
    except Exception as error:
        if "method not supported" in str(error) and attempt < max_retries:
            # Exponential backoff: wait 2^attempt seconds
            delay = 2 ** attempt
            print(f"Retry {attempt + 1}/{max_retries} after {delay}s")
            await asyncio.sleep(delay)
        else:
            raise error
```
</CodeGroup>

</Accordion>

<Accordion title="Action failed or timed out">
**Problem**: `act` times out or fails to complete action (often due to element not found)

**Solutions**:
- Ensure page has fully loaded
- Check if content is in iframes: [Learn more about working with iframes](/v2/best-practices/working-with-iframes)
- Increase action timeout
- Use `observe()` first to verify element exists

<CodeGroup>
```typescript TypeScript
// Handle timeout and element not found issues
try {
  await page.act("click the submit button", { timeoutMs: 30000 });
} catch (error) {
  // Check if page is fully loaded
  await page.waitForLoadState('domcontentloaded');
  
  // Use observe to check element state
  const [element] = await page.observe("find the submit button");
  
  if (element) {
    console.log("Element found, trying more specific instruction");
    await page.act("click the submit button at the bottom of the form");
  } else {
    console.log("Element not found, trying alternative selector");
    await page.act("click the button with text 'Submit'");
  }
}
```

```python Python
# Handle timeout and element not found issues
try:
    await page.act("click the submit button", {"timeoutMs": 30000})
except Exception as error:
    # Check if page is fully loaded
    await page.wait_for_load_state('domcontentloaded')
    
    # Use observe to check element state
    results = await page.observe("find the submit button")
    
    if results:
        print("Element found, trying more specific instruction")
        await page.act("click the submit button at the bottom of the form")
    else:
        print("Element not found, trying alternative selector")
        await page.act("click the button with text 'Submit'")
```
</CodeGroup>
</Accordion>

<Accordion title="Incorrect element selected">
**Problem**: `act` performs action on wrong element

**Solutions**:
- Be more specific in instructions: include visual cues, position, or context
- Use `observe()` to preview which element will be selected
- Add contextual information: "the search button in the header"
- Use unique identifiers when available

<CodeGroup>
```typescript TypeScript
// More precise element targeting
// Instead of:
await page.act("click the button");

// Use specific context:
await page.act("click the red 'Delete' button next to the user John Smith");

// Or preview with observe first:
const [action] = await page.observe("click the submit button in the checkout form");
if (action?.description.includes("checkout")) {
  await page.act(action);
}
```

```python Python
# More precise element targeting
# Instead of:
await page.act("click the button")

# Use specific context:
await page.act("click the red 'Delete' button next to the user John Smith")

# Or preview with observe first:
results = await page.observe("click the submit button in the checkout form")
if results and "checkout" in results[0].description:
    await page.act(results[0])
```
</CodeGroup>
</Accordion>


</AccordionGroup>

## Next steps

<CardGroup cols={2}>

  <Card title="Orchestrate complex workflows with Agent" icon="robot" iconType="sharp-solid" href="/v2/basics/agent">
    Use `Agent` to autonomously execute multi-step tasks and complex workflows.
  </Card>

   <Card title="Caching actions" icon="bolt" iconType="sharp-solid" href="/v2/best-practices/caching">
    Speed up repeated automations by caching actions.
  </Card>

  <Card title="Extract data with extract()" icon="table" iconType="sharp-solid" href="/v2/basics/extract">
    Use `extract` with a data schema to pull clean, typed data from any page.
  </Card>

  <Card title="Working with iframes" icon="frame" iconType="sharp-solid" href="/v2/best-practices/working-with-iframes">
    Learn best practices for interacting with elements inside iframes.
  </Card>
</CardGroup>

================================================
FILE: packages/docs/v2/basics/agent.mdx
================================================
---
title: Agent
description: 'Automate complex workflows with AI powered browser agents'
---

## What is `agent()`?

``` typescript
agent.execute("apply for a job at browserbase")
```
`agent` turns high level tasks into **fully autonomous** browser workflows. You can customize the agent by specifying the LLM provider and model, setting custom instructions for behavior, and configuring max steps.

<img src="/images/agent.gif" alt="Agent" />

## Why use `agent()`?

<CardGroup cols={2}>
  <Card title="Multi-Step Workflows" icon="route" href="#agent-execution-configuration">
    Execute complex sequences automatically.
  </Card>
  <Card title="Visual Understanding" icon="eye" href="/v2/best-practices/computer-use">
    Sees and understands web interfaces like humans do using computer vision.
  </Card>
</CardGroup>


## Using `agent()`

There are two ways to create agents in Stagehand:

### Computer Use Agents

Use computer use agents with specialized models from OpenAI or Anthropic: 

<CodeGroup>
```typescript TypeScript
const agent = stagehand.agent({
  provider: "anthropic",
  model: "claude-sonnet-4-20250514",
  instructions: "You are a helpful assistant that can use a web browser.",
  options: {
    apiKey: process.env.ANTHROPIC_API_KEY,
  },
});
await agent.execute("apply for a job at Browserbase")
```

```python Python
agent = stagehand.agent(
    model="claude-sonnet-4-20250514",
    instructions="You are a helpful assistant that can use a web browser.",
    options={
        "api_key": os.getenv("ANTHROPIC_API_KEY"),
    },
)
await agent.execute("apply for a job at Browserbase")
```
</CodeGroup>

<Callout icon="code" color="#6ec202" iconType="regular">View or run the example template [here](https://www.browserbase.com/templates/gemini-cua)</Callout>

### Use Stagehand Agent with Any LLM

Use the agent without specifying a provider to utilize any model or LLM provider:

<Note>Non CUA agents are currently only supported in TypeScript</Note>

```typescript TypeScript
const agent = stagehand.agent();
await agent.execute("apply for a job at Browserbase")
```


## MCP Integrations

Agents can be enhanced with external tools and services through MCP (Model Context Protocol) integrations. This allows your agent to access external APIs and data sources beyond just browser interactions.

<CodeGroup>
```typescript TypeScript (Pass URL)
const agent = stagehand.agent({
  provider: "openai",
  model: "computer-use-preview",
  integrations: [
    `https://mcp.exa.ai/mcp?exaApiKey=${process.env.EXA_API_KEY}`,
  ],
  instructions: `You have access to web search through Exa. Use it to find current information before browsing.`,
  options: {
    apiKey: process.env.OPENAI_API_KEY,
  },
});

await agent.execute("Search for the best headphones of 2025 and go through checkout for the top recommendation");
```

```typescript TypeScript (Create Connection)
import { connectToMCPServer } from "@browserbasehq/stagehand";

const supabaseClient = await connectToMCPServer(
  `https://server.smithery.ai/@supabase-community/supabase-mcp/mcp?api_key=${process.env.SMITHERY_API_KEY}`
);

const agent = stagehand.agent({
  provider: "openai",
  model: "computer-use-preview",
  integrations: [supabaseClient],
  instructions: `You can interact with Supabase databases. Use these tools to store and retrieve data.`,
  options: {
    apiKey: process.env.OPENAI_API_KEY,
  },
});

await agent.execute("Search for restaurants and save the first result to the database");
```
</CodeGroup>

<Tip>
MCP integrations enable agents to be more powerful by combining browser automation with external APIs, databases, and services. The agent can intelligently decide when to use browser actions versus external tools.
</Tip>

<Warning>
Stagehand uses a 1288x711 viewport by default (the optimal size for Computer Use Agents). Other viewport sizes may reduce performance. If you need to modify the viewport, you can edit it in the [Browser Configuration](/v2/configuration/browser).
</Warning>


## Available Models

Use specialized computer use models (e.g., `computer-use-preview` from OpenAI or `claude-sonnet-4-20250514` from Anthropic)

<Card title="Available Models" icon="robot" href="/v2/configuration/models">
  Check out the guide on how to use different models with Stagehand.
</Card>

## Agent Execution Configuration

Control the maximum number of steps the agent can take to complete the task using the `maxSteps` parameter.

<CodeGroup>
```typescript TypeScript
// Set maxSteps to control how many actions the agent can take
await agent.execute({
  instruction: "Sign me up for a library card",
  maxSteps: 15 // Agent will stop after 15 steps if task isn't complete
});
```

```python Python
# Set max_steps to control how many actions the agent can take
result = await agent.execute({
    "instruction": "Sign me up for a library card",
    "max_steps": 15  # Agent will stop after 15 steps if task isn't complete
})
```
</CodeGroup>

For complex tasks, increase the `maxSteps` limit and check task success.

<CodeGroup>
```typescript TypeScript
// Complex multi-step task requiring more actions
const result = await agent.execute({
  instruction: "Find and apply for software engineering jobs, filtering by remote work and saving 3 applications",
  maxSteps: 30, // Higher limit for complex workflows
});

// Check if the task completed successfully
if (result.success === true) {
  console.log("Task completed successfully!");
} else {
  console.log("Task failed or was incomplete");
}
```

```python Python
# Complex multi-step task requiring more actions
result = await agent.execute({
    "instruction": "Find and apply for software engineering jobs, filtering by remote work and saving 3 applications",
    "max_steps": 30  # Higher limit for complex workflows
})

# Check if the task completed successfully
if result.success == True:
    print("Task completed successfully!")
else:
    print("Task failed or was incomplete")
```
</CodeGroup>

## Best Practices

Following these best practices will improve your agent's success rate, reduce execution time, and minimize unexpected errors during task completion.

### Start on the Right Page
Navigate to your target page before executing tasks:

<Tabs>
<Tab title="Do this">
<CodeGroup>
```typescript TypeScript
await page.goto('https://github.com/browserbase/stagehand');
await agent.execute('Get me the latest PR on the stagehand repo');
```

```python Python
await page.goto("https://github.com/browserbase/stagehand")
result = await agent.execute("Get me the latest PR on the stagehand repo")
```
</CodeGroup>
</Tab>

<Tab title="Don't do this">
<CodeGroup>
```typescript TypeScript
await agent.execute('Go to GitHub and find the latest PR on browserbase/stagehand');
```

```python Python
result = await agent.execute("Go to GitHub and find the latest PR on browserbase/stagehand")
```
</CodeGroup>
</Tab>
</Tabs>


### Be Specific
Provide detailed instructions for better results:

<Tabs>
<Tab title="Do this">
<CodeGroup>
```typescript TypeScript
await agent.execute("Find Italian restaurants in Brooklyn that are open after 10pm and have outdoor seating");
```

```python Python
result = await agent.execute("Find Italian restaurants in Brooklyn that are open after 10pm and have outdoor seating")
```
</CodeGroup>
</Tab>

<Tab title="Don't do this">
<CodeGroup>
```typescript TypeScript
await agent.execute("Find a restaurant");
```

```python Python
result = await agent.execute("Find a restaurant")
```
</CodeGroup>
</Tab>
</Tabs>

## Troubleshooting

<AccordionGroup>


<Accordion title="Agent is stopping before completing the task">
**Problem**: Agent stops before finishing the requested task

**Solutions**:
- Check if the agent is hitting the maxSteps limit (default is 20)
- Increase maxSteps for complex tasks: `maxSteps: 30` or higher
- Break very complex tasks into smaller sequential executions

```typescript
// Increase maxSteps for complex tasks
await agent.execute({
  instruction: "Complete the multi-page registration form with all required information",
  maxSteps: 40 // Increased limit for complex task
});

// Or break into smaller tasks with success checking
const firstResult = await agent.execute({
  instruction: "Fill out page 1 of the registration form", 
  maxSteps: 15
});

// Only proceed if the first task was successful
if (firstResult.success === true) {
  await agent.execute({
    instruction: "Navigate to page 2 and complete remaining fields",
    maxSteps: 15
  });
} else {
  console.log("First task failed, stopping execution");
}
```
</Accordion>

<Accordion title="Agent is failing to click the proper elements">
**Problem**: Agent clicks on wrong elements or fails to interact with the correct UI components

**Solutions**:
- Ensure proper viewport size: Stagehand uses `1288x711` by default (optimal for Computer Use models)
- Avoid changing viewport dimensions as other sizes may reduce performance
</Accordion>


</AccordionGroup>


## Next steps

<CardGroup cols={2}>
<Card title="Act" icon="play" href="/v2/basics/act">
  Execute actions efficiently using observe results
</Card>

<Card title="Extract" icon="download" href="/v2/basics/extract">
  Extract structured data from observed elements
</Card>
</CardGroup>

================================================
FILE: packages/docs/v2/basics/extract.mdx
================================================
---
title: Extract
description: Extract structured data from a webpage
---

## What is `extract()`?

```typescript
page.extract("extract the name of the repository");
```

`extract` grabs structured data from a webpage. You can define your schema with [zod](https://github.com/colinhacks/zod) (TypeScript) or [pydantic](https://github.com/pydantic/pydantic) (Python). If you do not want to define a schema, you can also call `extract` with just a [natural language prompt](#prompt-only-extraction), or call `extract` [with no parameters](#extract-with-no-parameters).

## Why use `extract()`?

<CardGroup cols={2}>
  <Card title="Structured" icon="brackets-curly" href="#list-of-objects-extraction">
    Turn messy webpage data into clean objects that follow a schema.
  </Card>
  <Card title="Resilient" icon="dumbbell" href="#extract-with-context">
    Build resilient extractions that don't break when the website changes.
  </Card>
</CardGroup>

<Note>
For TypeScript, the extract schemas are defined using zod schemas.

For Python, the extract schemas are defined using pydantic models.
</Note>

## Using `extract()`

### Single object Extraction

Here is how an `extract` call might look for a single object:

<CodeGroup>
```typescript TypeScript
import { z } from 'zod/v3';

const item = await page.extract({
  instruction: "extract the price of the item",
  schema: z.object({
    price: z.number(),
  }),
});
```

```python Python
from pydantic import BaseModel

class Extraction(BaseModel):
    price: float

item = await page.extract(
    "extract the price of the item", 
    schema=Extraction
)
```
</CodeGroup>

Your output schema will look like:
```Example
{ price: number }
```

### List of objects Extraction

Here is how an `extract` call might look for a list of objects.

<CodeGroup>
```typescript TypeScript
import { z } from 'zod/v3';

const apartments = await page.extract({
  instruction:
    "Extract ALL the apartment listings and their details, including address, price, and square feet.",
  schema: z.object({
    list_of_apartments: z.array(
      z.object({
        address: z.string(),
        price: z.string(),
        square_feet: z.string(),
      }),
    ),
  })
})

console.log("the apartment list is: ", apartments);
```

```python Python
from pydantic import BaseModel

class Apartment(BaseModel):
    address: str
    price: str
    square_feet: str

class Apartments(BaseModel):
    list_of_apartments: list[Apartment]

apartments = await page.extract(
    "Extract ALL the apartment listings and their details as a list, including address, price, and square feet for each apartment",
    schema=Apartments
)

print("the apartment list is: ", apartments)
```
</CodeGroup>

Your output schema will look like:
```Example
{
  list_of_apartments: [
    {
      address: "street address here",
      price: "$1234.00",
      square_feet: "700"
    },
    {
      address: "another address here",
      price: "1010.00",
      square_feet: "500"
    },
    ...
  ]
}
```

### Prompt-only Extraction

You can call `extract` with just a natural language prompt:

<CodeGroup>
```typescript TypeScript
const result = await page.extract("extract the name of the repository");
```

```python Python
result = await page.extract("extract the name of the repository")
```
</CodeGroup>

When you call `extract` with just a prompt, your output schema will look like:
```Example
{ extraction: string }
```

### Extract with no parameters

Here is how you can call `extract` with no parameters.

<CodeGroup>
```typescript TypeScript
const pageText = await page.extract();
```

```python Python
pageText = await page.extract()
```
</CodeGroup>

Output schema:
```Example
{ pageText: string }
```

Calling `extract` with no parameters will return a hierarchical tree representation of the root DOM. This will not be passed through an LLM. It will look something like this:

```
Accessibility Tree:
[0-2] RootWebArea: What is Stagehand? - 🤘 Stagehand
  [0-37] scrollable
    [0-118] body
      [0-241] scrollable
        [0-242] div
          [0-244] link: 🤘 Stagehand home page light logo
            [0-245] span
              [0-246] StaticText: 🤘 Stagehand
              [0-247] StaticText: home page
```

## Best practices


### Extract with Context

You can provide additional context to your schema to help the model extract the data more accurately.

<CodeGroup>
```typescript TypeScript
import { z } from 'zod/v3';

const apartments = await page.extract({
 instruction:
   "Extract ALL the apartment listings and their details, including address, price, and square feet.",
 schema: z.object({
   list_of_apartments: z.array(
     z.object({
       address: z.string().describe("the address of the apartment"),
       price: z.string().describe("the price of the apartment"),
       square_feet: z.string().describe("the square footage of the apartment"),
     }),
   ),
 })
})
```

```python Python
from pydantic import BaseModel, Field

class Apartment(BaseModel):
    address: str = Field(..., description="the address of the apartment")
    price: str = Field(..., description="the price of the apartment")
    square_feet: str = Field(..., description="the square footage of the apartment")

class Apartments(BaseModel):
    list_of_apartments: list[Apartment]

apartments = await page.extract(
    "Extract ALL the apartment listings and their details as a list. For each apartment, include: the address of the apartment, the price of the apartment, and the square footage of the apartment",
    schema=Apartments
)
```
</CodeGroup>

### Link Extraction
<Note>
To extract links or URLs, in the TypeScript version of Stagehand, you'll need to define the relevant field as `z.string().url()`.
In Python, you'll need to define it as `HttpUrl`.
</Note>

Here is how an `extract` call might look for extracting a link or URL. This also works for image links.

<CodeGroup>
```typescript TypeScript
import { z } from 'zod/v3';

const extraction = await page.extract({
  instruction: "extract the link to the 'contact us' page",
  schema: z.object({
    link: z.string().url(), // note the usage of z.string().url() here
  }),
});

console.log("the link to the contact us page is: ", extraction.link);
```

```python Python
from pydantic import BaseModel, HttpUrl

class Extraction(BaseModel):
    link: HttpUrl # note the usage of HttpUrl here

extraction = await page.extract(
    "extract the link to the 'contact us' page", 
    schema=Extraction
)

print("the link to the contact us page is: ", extraction.link)
```
</CodeGroup>

<Tip>
Inside Stagehand, extracting links works by asking the LLM to select an ID. Stagehand looks up that ID in a mapping of IDs -> URLs. When logging the LLM trace, you should expect to see IDs. The actual URLs will be included in the final `ExtractResult`.
</Tip>

## Troubleshooting

<AccordionGroup>
<Accordion title="Empty or partial results">
**Problem**: `extract()` returns empty or incomplete data

**Solutions**:
- **Check your instruction clarity**: Make sure your instruction is specific and describes exactly what data you want to extract
- **Verify the data exists**: Use `page.observe()` first to confirm the data is present on the page
- **Wait for dynamic content**: If the page loads content dynamically, use `page.act("wait for the content to load")` before extracting

**Solution: Wait for content before extracting**
<CodeGroup>
```typescript TypeScript
// Wait for content before extracting
await page.act("wait for the product listings to load");
const products = await page.extract({
  instruction: "extract all product names and prices",
  schema: z.object({
    products: z.array(z.object({
      name: z.string(),
      price: z.string()
    }))
  })
});
```

```python Python
# Wait for content before extracting
await page.act("wait for the product listings to load")
products = await page.extract(
    "extract all product names and prices",
    schema=ProductList
)
```
</CodeGroup>
</Accordion>

<Accordion title="Schema validation errors">
**Problem**: Getting schema validation errors or type mismatches

**Solutions**:
- **Use optional fields**: Make fields optional with `z.optional()` (TypeScript) or `Optional[type]` (Python) if the data might not always be present
- **Use flexible types**: Consider using `z.string()` instead of `z.number()` for prices that might include currency symbols
- **Add descriptions**: Use `.describe()` (TypeScript) or `Field(description="...")` (Python) to help the model understand field requirements

**Solution: More flexible schema**
<CodeGroup>
```typescript TypeScript
const schema = z.object({
  price: z.string().describe("price including currency symbol, e.g., '$19.99'"),
  availability: z.string().optional().describe("stock status if available"),
  rating: z.number().optional()
});
```

```python Python
class FlexibleProduct(BaseModel):
    price: str = Field(description="price including currency symbol, e.g., '$19.99'")
    availability: Optional[str] = Field(default=None, description="stock status if available")
    rating: Optional[float] = None
```
</CodeGroup>
</Accordion>

<Accordion title="Inconsistent results">
**Problem**: Extraction results vary between runs

**Solutions**:
- **Be more specific in instructions**: Instead of "extract prices", use "extract the numerical price value for each item"
- **Use context in schema descriptions**: Add field descriptions to guide the model
- **Combine with observe**: Use `page.observe()` to understand the page structure first

**Solution: Validate with observe first**
<CodeGroup>
```typescript TypeScript
// First observe to understand the page structure
const elements = await page.observe("find all product listings");
console.log("Found elements:", elements.map(e => e.description));

// Then extract with specific targeting
const products = await page.extract({
  instruction: "extract name and price from each product listing shown on the page",
  schema: z.object({
    products: z.array(z.object({
      name: z.string().describe("the product title or name"),
      price: z.string().describe("the price as displayed, including currency")
    }))
  })
});
```

```python Python
# First observe to understand the page structure
elements = await page.observe("find all product listings")
print("Found elements:", [e.description for e in elements])

# Then extract with specific targeting
products = await page.extract(
    "extract name and price from each product listing shown on the page",
    schema=ProductSchema
)
```
</CodeGroup>
</Accordion>

<Accordion title="Performance issues">
**Problem**: Extraction is slow or timing out

**Solutions**:
- **Reduce scope**: Extract smaller chunks of data in multiple calls rather than everything at once
- **Use targeted instructions**: Be specific about which part of the page to focus on
- **Consider pagination**: For large datasets, extract one page at a time
- **Increase timeout**: Use `timeoutMs` parameter for complex extractions

**Solution: Break down large extractions**
<CodeGroup>
```typescript TypeScript
// Instead of extracting everything at once
const allData = [];
const pageNumbers = [1, 2, 3, 4, 5];

for (const pageNum of pageNumbers) {
  await page.act(`navigate to page ${pageNum}`);
  
  const pageData = await page.extract({
    instruction: "extract product data from the current page only",
    schema: ProductPageSchema,
    timeoutMs: 60000 // 60 second timeout
  });
  
  allData.push(...pageData.products);
}
```

```python Python
# Instead of extracting everything at once
all_data = []
page_numbers = [1, 2, 3, 4, 5]

for page_num in page_numbers:
    await page.act(f"navigate to page {page_num}")
    
    page_data = await page.extract(
        "extract product data from the current page only",
        schema=ProductPageSchema,
        timeout_ms=60000  # 60 second timeout
    )
    
    all_data.extend(page_data.products)
```
</CodeGroup>
</Accordion>
</AccordionGroup>

## Next steps

<CardGroup cols={2}>

  <Card title="Act" icon="play" href="/v2/basics/act">
    Execute actions efficiently using observe results
  </Card>

  <Card title="Observe" icon="magnifying-glass" href="/v2/basics/observe">
    Analyze pages with observe()
  </Card>
</CardGroup>

================================================
FILE: packages/docs/v2/basics/observe.mdx
================================================
---
title: Observe
sidebarTitle: Observe
description: 'Find suggested actions for your workflows'
---

## What is `observe()`?
``` typescript
page.observe("Find the login button")
```

`observe` allows you to turn any page into a checklist of reliable, executable actions. It discovers key elements, ranks likely next steps, and returns structured actions (selector, method, args) you can run instantly with `act` or use to precisely target `extract` so workflows are faster, cheaper, and more resilient.

## Why use `observe()`?

<CardGroup cols={2}>
  <Card title="Explore" icon="compass" href="/v2/basics/observe#observe-with-act">
    When you're unsure what's on a page or need to discover available actions
  </Card>
  <Card title="Plan" icon="map" href="/v2/basics/observe#plan-ahead">
    When building complex workflows, plan ahead all the actions you'll need to take
  </Card>
  <Card title="Cache" icon="database" href="/v2/best-practices/caching">
    When you want to remember actions for the future and avoid LLM calls
  </Card>
    <Card title="Validate" icon="check" href="/v2/basics/observe#observe-with-act">
    Before performing critical actions to ensure elements exist
  </Card>
</CardGroup>

## Using `observe()`

Calling `observe` supercharges other Stagehand methods. Use it to plan workflows, speed up `act`, and precisely target `extract`. Using `observe` helps you explore what's possible on a page by giving you a list of suggested actions.

<CodeGroup>
```typescript TypeScript
// Plan & validate
const buttons = await page.observe("Find the log in / sign up buttons");
```
```python Python
# Plan & validate
buttons = await page.observe("Find the log in / sign up buttons")
```
</CodeGroup>

This will return a list of suggestions, each with the following structure:
```json
{
  "selector": "xpath=/html/body/header/div/button[1]",
  "description": "Log in button in the top right corner",
  "method": "click",
  "arguments": []
}
```

### Observe with Act

You can **validate** the action (method, selector, arguments...) and then pass it to `act` to **avoid extra LLM inference**.

<Note>
**Performance Tip**: Acting on multiple `observe` suggestions will minimize the number of LLM calls for multi-step actions and speed up your workflow 2-3x.
</Note>

<CodeGroup>
```typescript TypeScript
await page.act(buttons[0]); // No LLM!
```
```python Python
await page.act(buttons[0]) # No LLM!
```
</CodeGroup>

#### Plan ahead

You can use multiple suggestions from `observe` to preview a batch of actions. For example, when filling a form you could ask `observe` to find all the fields and then pass them in to `act`. **Call the LLM once, act multiple times**.

<CodeGroup>
```typescript TypeScript
const fields = await page.observe("Find all the fields in the form");
for (const field of fields) {
  await page.act(field); // No LLM!
}
```
```python Python
fields = await page.observe("Find all the fields in the form")
for field in fields:
  await page.act(field) # No LLM!
```
</CodeGroup>

### Observe and Extract

Using `observe` to focus `extract` on a specific section of the page (like a table, a form, a list...) minimizes the context needed for an extraction. 
<Tip>
**Savings Tip**: Pass the selector to `extract` to reduce LLM token usage by 10x for verbose websites!
</Tip>

<CodeGroup>
```typescript TypeScript
// Use observe to validate elements before extraction
const [ table ] = await page.observe("Find the data table");

const { data } = await page.extract({
  instruction: "Extract data from the table",
  schema: z.object({
    data: z.string()
  }),
  selector: table.selector // Reduce context scope needed for extraction
});
```
```python Python
# Use observe to validate elements before extraction
[ table ] = await page.observe("Find the data table")

extraction = await page.extract(
  "Extract data from the table",
  schema=Data, # Pydantic schema
  selector=table.selector # Reduce context scope needed for extraction
)
```
</CodeGroup>

## Best Practices

### Choose the right commands

<Tabs>
<Tab title="Do this">

- Use `observe` when a yes/no answer will gate an action (e.g., "Find the Submit button"), then conditionally `act`.
- Use `extract` for information-only questions (e.g., "What’s the page title?", "How many results are listed?").

</Tab>

<Tab title="Don't do this">

- Don’t call `extract` to locate elements you plan to click next.
- Don’t call `observe` to answer info-only questions that won’t lead to an action.

</Tab>
</Tabs>
- **Discover and plan with `observe`**: Use `observe("Find…")` to map actionable elements and preview next steps.
- **Scope `extract` with selectors from `observe`**: First `observe("Find the data table")`, then pass `selector` to `extract` to reduce tokens and boost accuracy.

### Conserve LLM tokens

Optimize performance by directly passing `ObserveResult` to `act` (e.g., `await page.act(results[0])`) to save LLM tokens. Batch operations by using `observe` once to find elements, then act on each. Cache and reuse stable `observe` results for familiar pages, using self-healing if layouts change.

<Card title="Build your own cache" icon="database" href="/v2/best-practices/caching">
  Check out the guide on how to build your own action cache
</Card>

### Improve Accuracy

Be precise with instructions, e.g., "Find the primary CTA in the hero" for better results. For iframes, set `iframes: true` and wait for `networkidle`. Use `observe` selectors in `extract` to limit context.

<Card title="Prompting Best Practices" icon="robot" href="/v2/best-practices/prompting-best-practices">
  Check out the guide on how to improve the accuracy of your results
</Card>

### Action Validation

Before performing critical actions, validate the suggestion's `method`, `selector`, and `arguments` to prevent misclicks. If a direct `act` fails, use `observe` with the same prompt to verify the method, then proceed with the suggested action.

<CodeGroup>
```typescript TypeScript
const prompt = "click the submit button";
const expectedMethod = "click";

try {
  await page.act(prompt);
} catch (error) {
  if (error.message.includes("method not supported")) {
    // Observe the same prompt to get the planned action
    const [action] = await page.observe(prompt);
    
    if (action && action.method === expectedMethod) {
      await page.act(action);
    } else {
      throw new Error(`Unsupported method: expected "${expectedMethod}", got "${action?.method}"`);
    }
  } else {
    throw error;
  }
}
```

```python Python
prompt = "click the submit button"
expected_method = "click"

try:
    await page.act(prompt)
except Exception as error:
    if "method not supported" in str(error):
        # Observe the same prompt to get the planned action
        results = await page.observe(prompt)
        
        if results and results[0].method == expected_method:
            await page.act(results[0])
        else:
            method = results[0].method if results else "unknown"
            raise Exception(f'Unsupported method: expected "{expected_method}", got "{method}"')
    else:
        raise error
```
</CodeGroup>

## Troubleshooting

<AccordionGroup>
<Accordion title="No elements found">
**Problem**: `observe` returns empty array

**Solutions**:
- Make sure the element exists on the page
- Use explicit instructions to find the element
- Ensure page has fully loaded
- Look at the [debugging logs](/v2/configuration/logging); if the element is there, the LLM might be hallucinating or failing to catch it.
</Accordion>

<Accordion title="Inaccurate element descriptions">
**Problem**: Descriptions don't match actual elements

**Solutions**:
- Use more capable models: check [evals](https://stagehand.dev/evals) for the best models for your use case
- Provide more specific instructions
- Log inference to file (see [debugging logs](/v2/configuration/logging#llm-inference-logging)) to get an LLM trace

</Accordion>
<Accordion title="Wrong method identified">
**Problem**: The method identified is not valid

**Solutions**:
- Check the [supported actions](/v2/basics/act)
- Provide more specific instructions
- Validate the method; if it is invalid, override it with one of the supported ones

</Accordion>
</AccordionGroup>


## Next Steps

<CardGroup cols={2}>
<Card title="Act Overview" icon="play" href="/v2/basics/act">
Execute actions efficiently using `observe` results
</Card>

<Card title="Extract Data" icon="download" href="/v2/basics/extract">  
Extract structured data from observed elements
</Card>

<Card title="Observability" icon="chart-line" href="/v2/configuration/observability">
Monitor and debug observation performance  
</Card>

<Card title="Best Practices" icon="star" href="/v2/best-practices/prompting-best-practices">
Advanced patterns and optimization techniques
</Card>
</CardGroup>


================================================
FILE: packages/docs/v2/best-practices/agent-fallbacks.mdx
================================================
---
title: Agent Fallbacks
description: "A failsafe when unexpected page changes add extra steps"
---

## When to use

Use an agent fallback as a failsafe when a one-step action unexpectedly becomes a multi-step flow.

## How it works

1. [`act()`](/v2/basics/act) is attempted for the direct action
2. If it fails, [`agent()`](/v2/basics/agent) figures out the new path
3. Agent completes all needed steps (open menu → click button)

### Example scenario

**Before**: Sign in button was in the header  
**After**: Sign in now requires: Click account menu → Click "Sign in" option

A single `act("click sign in")` can't handle this change. The agent fallback can discover and execute both steps.

<CodeGroup>
```typescript TypeScript
import { Stagehand } from "@browserbasehq/stagehand";

try {
  await page.act("click the 'Sign In' button");
} catch (err) {
  console.log("Agent fallback triggered");

  const agent = stagehand.agent({
    provider: "anthropic",
    model: "claude-sonnet-4-20250514",
    instructions: "You are a helpful assistant that can use a web browser.",
  });

  const result = await agent.execute({
    instruction: "Find and click Sign In button",
    maxSteps: 10,
  });

  console.log(result.success ? "Agent fallback success" : "Agent fallback failed");

  if (!result.success) throw err;
}
```

```python Python
from stagehand import Stagehand

try:
    await page.act("click the 'Sign In' button")
except Exception as err:
    print("Agent fallback triggered")

    agent = stagehand.agent({
        "provider": "anthropic",
        "model": "claude-sonnet-4-20250514",
        "instructions": "Complete the action, handling any new steps required.",
    })

    result = await agent.execute({
        "instruction": "Find and click Sign In button",
        "max_steps": 10,
    })

    print("Agent fallback success" if result.success else "Agent fallback failed")

    if not result.success:
        raise err
```
</CodeGroup>


================================================
FILE: packages/docs/v2/best-practices/build-agent.mdx
================================================
---
title: 'Build a web browsing agent'
description: 'Build an AI agent that can autonomously control a browser with Stagehand'
---
import { Excalidraw } from '/snippets/excalidraw.mdx';

Stagehand gives AI agents powerful tools to control a browser completely autonomously. Watch below as a Stagehand agent autonomously navigates to a URL, takes actions on the page, and extracts structured data to answer a question.
There are quite a few ways to build an agent with Stagehand. Let's look at a few of them.

![Agent](/media/stagehand-agent.gif)

## Stagehand MCP

The above example is a Claude agent that uses Stagehand to control a browser. At the time of writing, [multimodal tool calling](https://sdk.vercel.ai/docs/ai-sdk-core/tools-and-tool-calling#multi-modal-tool-results) is only supported in Claude 3.5/3.7 Sonnet.
This means Claude is intelligent enough to know when to request a browser screenshot, and it can then use that screenshot to make decisions about what actions to take next.

<CardGroup>
<Card title="Browserbase MCP" href="https://github.com/browserbase/mcp-server-browserbase/" icon="hand-horns">
Control a browser with Browserbase MCP powered by Stagehand
</Card>
</CardGroup>

What's really interesting about this is that the agent is able to reason about the browser state and take actions separate from one another! 
Claude is able to reason about the browser state, while Stagehand is able to take actions on the page with GPT-4o-mini or a computer use model.
Stagehand is even smart enough to know when to use GPT-4o-mini and when to use a computer use model, i.e. on iframe detection.

<Excalidraw className="w-full aspect-video" url="https://link.excalidraw.com/readonly/GWQWmWUBqMBEAamlWsIM?darkMode=true" />

We've found great success from having Claude as the "Trajectory" agent calling Stagehand tools when it sees fit! 
While MCP is really nascent, we're excited to see where it goes.

## Stagehand + Computer Use Models

Stagehand lets you leverage powerful computer use APIs from OpenAI and Anthropic with just one line of code. 

<CodeGroup>
```typescript TypeScript
await page.goto("https://github.com/browserbase/stagehand");

// Create a Computer Use agent with just one line of code!
const agent = stagehand.agent({
	provider: "openai",
	model: "computer-use-preview"
});

// Use the agent to execute a task
const result = await agent.execute("Extract the top contributor's username");
console.log(result);
```
```python Python
await page.goto("https://github.com/browserbase/stagehand-python")

# Create a Computer Use agent with just one line of code!
agent = stagehand.agent(
    model="computer-use-preview"
)

# Use the agent to execute a task
result = await agent.execute("Extract the top contributor's username")
print(result)
```
</CodeGroup>

<CardGroup>
<Card title="Stagehand + Computer Use Docs" href="/v2/best-practices/computer-use" icon="scroll">
Check out our docs page for instructions on how to use computer use models with Stagehand.
</Card>
<Card title="CUA Browser Demo" href="https://cua.browserbase.com/" icon="brain-circuit">
Check out a live demo of a Browserbase browser controlled by OpenAI's Computer Using Agent (CUA) model.
</Card>
</CardGroup>

## Sequential Tool Calling (Open Operator)

In January 2025, Browserbase released [Open Operator](https://operator.browserbase.com). 
Open Operator is able to reason about the browser state and take actions accordingly to accomplish larger tasks like "order me a pizza".
It works by calling Stagehand tools in sequence:

1. If there's no URL, go to a default URL.
1. Examine the browser state. Ask an LLM to reason about what to do next.
1. Use `page.act()` to execute the LLM-suggested action.
1. Repeat

<Excalidraw className="w-full" url="https://link.excalidraw.com/readonly/dKh5sB1gEM1EjVqRCGKn" />

Incorporating `stagehand.agent` into your browser automation is as easy as adding a single line of code:

<Note>
Python currently supports `stagehand.agent` with Computer Use Agent (CUA) models. The default implementation is coming soon. 
</Note>

<CodeGroup>
```typescript TypeScript
await stagehand.page.goto("https://github.com/browserbase/stagehand");

// Open Operator will use the default LLM from Stagehand config
const operator = stagehand.agent();
const { message, actions } = await operator.execute(
	"Extract the top contributor's username"
);

console.log(message);
```
</CodeGroup>

### Replay the agent's actions

You can replay the agent's actions exactly the same way you would with a regular Stagehand agent. You can even automatically cache the actions to avoid unnecessary LLM calls on a repeated run.

Let's use the `replay` function below to save the actions to a Stagehand script file, which will reproduce the same actions the agent did, with cached actions built in.

<Accordion title="utils.ts">
```typescript
import { AgentAction, AgentResult } from "@browserbasehq/stagehand";
import { exec } from "child_process";
import fs from "fs/promises";

export async function replay(result: AgentResult) {
  const history = result.actions;
  const replay = history
    .map((action: AgentAction) => {
      switch (action.type) {
        case "act":
          if (!action.playwrightArguments) {
            throw new Error("No playwright arguments provided");
          }
          return `await page.act(${JSON.stringify(
            action.playwrightArguments
          )})`;
        case "extract":
          return `await page.extract("${action.parameters}")`;
        case "goto":
          return `await page.goto("${action.parameters}")`;
        case "wait":
          return `await page.waitForTimeout(${parseInt(
            action.parameters as string
          )})`;
        case "navback":
          return `await page.goBack()`;
        case "refresh":
          return `await page.reload()`;
        case "close":
          return `await stagehand.close()`;
        default:
          return `await stagehand.oops()`;
      }
    })
    .join("\n");

  console.log("Replay:");
  const boilerplate = `
import { Page, BrowserContext, Stagehand } from "@browserbasehq/stagehand";

export async function main(stagehand: Stagehand) {
    const page = stagehand.page
	${replay}
}
  `;
  await fs.writeFile("replay.ts", boilerplate);

  // Format the replay file with prettier
  await new Promise((resolve, reject) => {
    exec(
      "npx prettier --write replay.ts",
      (error: any, stdout: any, stderr: any) => {
        if (error) {
          console.error(`Error formatting replay.ts: ${error}`);
          reject(error);
          return;
        }
        resolve(stdout);
      }
    );
  });
}
```
</Accordion>

Here's the replay output of an instruction like `"Get me the stock price of NVDA"`:

```typescript {14-22} replay.ts
import { Page, BrowserContext, Stagehand } from "@browserbasehq/stagehand";

export async function main({
  page,
  context,
  stagehand,
}: {
  page: Page; // Playwright Page with act, extract, and observe methods
  context: BrowserContext; // Playwright BrowserContext
  stagehand: Stagehand; // Stagehand instance
}) {
  await page.goto("https://www.google.com");

  // Replay will default to Playwright first to avoid unnecessary LLM calls!
  // If the Playwright action fails, Stagehand AI will take over and self-heal
  await page.act({
    description: "The search combobox where users can type their queries.",
    method: "fill",
    arguments: ["NVDA stock price"],
    selector:
      "xpath=/html/body[1]/div[1]/div[3]/form[1]/div[1]/div[1]/div[1]/div[1]/div[2]/textarea[1]",
  });
  await page.extract(
    "the displayed NVDA stock price in the search suggestions",
  );
  await stagehand.close();
}
```

================================================
FILE: packages/docs/v2/best-practices/caching.mdx
================================================
---
title: Caching Actions
description: You can cache actions in Stagehand to avoid redundant LLM calls.
---

Caching actions in Stagehand is useful for actions that are expensive to run, or when the underlying DOM structure is not expected to change.

## Using `observe` to preview an action
`observe` lets you preview an action before taking it. If you are satisfied with the action preview, you can run it in `page.act` with no further LLM calls.

<CodeGroup>
```typescript TypeScript
const [actionPreview] = await page.observe("Click the quickstart link");

/** actionPreview is a JSON-ified version of a Playwright action:
{
	description: "The quickstart link",
	method: "click",
	selector: "/html/body/div[1]/div[1]/a",
	arguments: [],
}
**/

// NO LLM INFERENCE when calling act on the preview
await page.act(actionPreview)
```

```python Python
actions = await page.observe("Click the quickstart link")
action_preview = actions[0]

# action_preview is a dictionary version of a Playwright action:
# {
#	"description": "The quickstart link",
#	"method": "click",
#	"selector": "/html/body/div[1]/div[1]/a",
#	"arguments": [],
# }

# NO LLM INFERENCE when calling act on the preview
await page.act(action_preview)
```
</CodeGroup>

## Simple caching

Let's use a simple file-based cache for this example. We'll write getter and setter functions that read from and write to a JSON file:

<CodeGroup>
```typescript TypeScript
// Get the cached value (undefined if it doesn't exist)
async function getCache(key: string): Promise<ObserveResult | undefined> {
  try {
    const cache = await readFile("cache.json");
    const parsed = JSON.parse(cache);
    return parsed[key];
  } catch {
    return undefined;
  }
}

// Set the cache value
async function setCache(key: string, value: ObserveResult): Promise<void> {
  const cache = await readFile("cache.json");
  const parsed = JSON.parse(cache);
  parsed[key] = value;
  await writeFile("cache.json", JSON.stringify(parsed));
}
```

```python Python
# Get the cached value (None if it doesn't exist)
async def get_cache(key: str) -> Optional[Dict[str, Any]]:
    try:
        async with aiofiles.open("cache.json", 'r') as f:
            cache_content = await f.read()
            parsed = json.loads(cache_content)
            return parsed.get(key)
    except (FileNotFoundError, json.JSONDecodeError):
        return None

# Set the cache value
async def set_cache(key: str, value: Dict[str, Any]) -> None:
    try:
        async with aiofiles.open("cache.json", 'r') as f:
            cache_content = await f.read()
            parsed = json.loads(cache_content)
    except (FileNotFoundError, json.JSONDecodeError):
        parsed = {}
    
    parsed[key] = value
    
    async with aiofiles.open("cache.json", 'w') as f:
        await f.write(json.dumps(parsed))
```
</CodeGroup>

### Act with cache
Let's write a function that will check the cache, get the action, and run it. If the action fails, we'll attempt to "self-heal", i.e. retry it with `page.act` directly.

<CodeGroup>
```typescript TypeScript
// Check the cache, get the action, and run it
// If selfHeal is true, we'll attempt to self-heal if the action fails
async function actWithCache(page: Page, key: string, prompt: string, selfHeal = false) {
	try {
		const cacheExists = await getCache(key);

		let action: ObserveResult;
		if (cacheExists) {
		// Get the cached action
		action = await getCache(prompt);
		} else {
		// Get the observe result (the action)
		[action] = await page.observe(prompt);

		// Cache the action
		await setCache(prompt, action);
		}

		// Run the action (no LLM inference)
		await page.act(action);
	} catch (e) {
		console.error(e);
		// in selfHeal mode, we'll retry the action
		if (selfHeal) {
			console.log("Attempting to self-heal...");
			await page.act(prompt);
		}
		else {
			throw e;
		}
	}
}
```

```python Python
# Check the cache, get the action, and run it
# If self_heal is true, we'll attempt to self-heal if the action fails
async def act_with_cache(page, key: str, prompt: str, self_heal: bool = False):
    try:
        cache_exists = await get_cache(key)

        if cache_exists:
            # Get the cached action
            action = await get_cache(prompt)
        else:
            # Get the observe result (the action)
            actions = await page.observe(prompt)
            action = actions[0]

            # Cache the action
            await set_cache(prompt, action)

        # Run the action (no LLM inference)
        await page.act(action)
    except Exception as e:
        print(f"Error: {e}")
        # in self_heal mode, we'll retry the action
        if self_heal:
            print("Attempting to self-heal...")
            await page.act(prompt)
        else:
            raise e
```
</CodeGroup>

You can now use `actWithCache` to run an action with caching:

<CodeGroup>
```typescript TypeScript
const prompt = "Click the quickstart link";
const key = prompt; // Simple cache key
// Attempt cached action or self-heal
await actWithCache(page, key, prompt);
```

```python Python
prompt = "Click the quickstart link"
key = prompt  # Simple cache key
# Attempt cached action or self-heal
await act_with_cache(page, key, prompt)
```
</CodeGroup>

## Advanced caching

The above example is simple, but you may want to cache actions based on the page contents. Also, if you have duplicate prompts, you should use a more unique key.

We want to leave caching logic up to you, but give you all the tools you need to implement your own caching strategy.

You can directly access the DOM and accessibility tree from Playwright's page object. Here's an example of how to access the page content:

<CodeGroup>
```typescript TypeScript
// Get the page content
const pageContent = await page.content();
```

```python Python
# Get the page content
page_content = await page.content()
```
</CodeGroup>

You may also want to use the accessibility tree, the DOM, or any other information to create a more unique key. You can do this as you please, with very similar logic to the above example.

================================================
FILE: packages/docs/v2/best-practices/computer-use.mdx
================================================
---
title: Computer Use Agents
description: Incorporate Computer Use APIs from Anthropic and OpenAI with one line of code in Stagehand.
---

## What is a Computer Use Agent?

<iframe
  width="100%"
  height="400"
  src="https://www.youtube.com/embed/ODaHJzOyVCQ"
  title="YouTube video player"
  frameborder="0"
  allow="accelerometer; autoplay; clipboard-write; encrypted-media; gyroscope; picture-in-picture"
  allowfullscreen
></iframe>
You might've heard of [Claude Computer Use](https://www.anthropic.com/news/3-5-models-and-computer-use) or [OpenAI's Computer Using Agent](https://openai.com/index/computer-using-agent/).

These are powerful tools that can convert natural language into actions on the computer. However, you'd otherwise need to write your own code to convert these actions into Playwright commands.

Stagehand not only handles the execution of Computer Use outputs, but also lets you hot-swap between OpenAI and Anthropic models with one line of code.

## How to use a Computer Use Agent in Stagehand

Stagehand lets you use Computer Use Agents with one line of code:

<Note>
**IMPORTANT! Configure your browser dimensions**

Computer Use Agents will often return XY-coordinates to click on the screen, so you'll need to configure your browser dimensions.

If not specified, the default browser dimensions are 1024x768. You can also configure the browser dimensions in the `browserbaseSessionCreateParams` or `localBrowserLaunchOptions` options.
</Note>


### Configuring browser dimensions

Browser configuration differs by environment:

<Tabs>
<Tab title="BROWSERBASE">
<CodeGroup>  
```typescript TypeScript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "BROWSERBASE",
  apiKey: process.env.BROWSERBASE_API_KEY /* API key for authentication */,
  projectId: process.env.BROWSERBASE_PROJECT_ID /* Project identifier */,

  browserbaseSessionCreateParams: {
    projectId: process.env.BROWSERBASE_PROJECT_ID!,
    browserSettings: {
      blockAds: true,
      // Keep the viewport in sync with the coordinates the agent clicks on
      viewport: {
        width: 1024,
        height: 768,
      },
    },
  },
});

await stagehand.init();
```
```python Python
import os
from stagehand import Stagehand, StagehandConfig

stagehand = Stagehand(StagehandConfig(
    env="BROWSERBASE",
    api_key=os.getenv("BROWSERBASE_API_KEY"),  # API key for authentication
    project_id=os.getenv("BROWSERBASE_PROJECT_ID"),  # Project identifier
    
    browserbase_session_create_params={
        "projectId": os.getenv("BROWSERBASE_PROJECT_ID"),
        "browserSettings": {
            "blockAds": True,
            "viewport": {
                "width": 1024,
                "height": 768,
            },
        },
    },
))

await stagehand.init()
```
</CodeGroup>
</Tab>
<Tab title="LOCAL">
<CodeGroup>
```typescript TypeScript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "LOCAL",
  localBrowserLaunchOptions: {
    headless: false,
    viewport: {
      width: 1024,
      height: 768,
    },
  }
});

await stagehand.init();
```
```python Python
from stagehand import Stagehand, StagehandConfig

stagehand = Stagehand(StagehandConfig(
    env="LOCAL",
    local_browser_launch_options={
        "headless": False,
        "viewport": {
            "width": 1024,
            "height": 768,
        },
    }
))

await stagehand.init()
```
</CodeGroup>
</Tab>
</Tabs>

### Direct your Computer Use Agent

Call `execute` on the agent to assign a task to the agent.

<CodeGroup>
```typescript TypeScript
// Navigate to a website
await stagehand.page.goto("https://www.google.com");

const agent = stagehand.agent({
	// You can use either OpenAI or Anthropic
	provider: "anthropic",
	// The model to use (computer-use-preview for OpenAI)
	model: "claude-sonnet-4-20250514",

	// Customize the system prompt
	instructions: `You are a helpful assistant that can use a web browser.
	Do not ask follow up questions, the user will trust your judgement.`,

	// Customize the API key
	options: {
		apiKey: process.env.ANTHROPIC_API_KEY,
	},
});

// Execute the agent
await agent.execute("Apply for a library card at the San Francisco Public Library");
```

```python Python
import os

# Navigate to a website
await stagehand.page.goto("https://www.google.com")

agent = stagehand.agent(
    # The model to use
    model="computer-use-preview",

    # Customize the system prompt
    instructions="You are a helpful assistant that can use a web browser. Do not ask follow up questions, the user will trust your judgement.",

    # Customize the API key (computer-use-preview is an OpenAI model)
    options={
        "apiKey": os.getenv("OPENAI_API_KEY"),
    },
)

# Execute the agent
await agent.execute("Apply for a library card at the San Francisco Public Library")
```
</CodeGroup>

You can also define the maximum number of steps the agent can take with:

<CodeGroup>
```typescript TypeScript
await agent.execute({
	// The task to perform; note the option name is singular
	instruction: "Apply for a library card at the San Francisco Public Library",
	// Upper bound on the number of steps the agent may take
	maxSteps: 10,
});
```

```python Python
await agent.execute(
	"Apply for a library card at the San Francisco Public Library",
	max_steps=10,
)
```
</CodeGroup> 

<Callout icon="code" color="#6ec202" iconType="regular">View or run the example templates [here](https://www.browserbase.com/templates?category=Computer+Use+Agents)</Callout>


================================================
FILE: packages/docs/v2/best-practices/contributing.mdx
================================================
---
title: 'Contribute to Stagehand'
description: 'Best practices for making a meaningful contribution to Stagehand'
---

# Codeowners and Subject-Matter Experts

Any contribution must be explicitly approved by a codeowner. Officially, Stagehand codeowners are as follows:

- [**Paul Klein**](https://github.com/pkiv)
- [**Miguel Gonzalez**](https://github.com/miguelg719)
- [**Sean McGuire**](https://github.com/seanmcguire12)
- [**Anirudh Kamath**](https://github.com/kamath)
- [**Sameel Arif**](https://github.com/sameelarif)
- [**Filip Michalsky**](https://github.com/filip-michalsky)

Special thanks to [Jeremy Press](https://github.com/jeremypress), [Navid Pour](https://github.com/navidkpr), and [all the contributors](https://github.com/browserbase/stagehand/graphs/contributors) for your help in making Stagehand the best browser automation framework.

***Please do not hesitate to reach out to anyone listed here in the [public Discord server](https://stagehand.dev/discord)***

## General Workflow

Get listed as [one of our beloved contributors](https://github.com/browserbase/stagehand/graphs/contributors)!

1. **Discuss your proposed contribution before starting.** Skipping this step risks having to discard work you put considerable time and effort into. You can DM Miguel on [Discord](https://stagehand.dev/discord) for a 1:1 call.
2. **Open a Pull Request.** Create a fork of this repository, and follow [GitHub’s instructions to create a Pull Request](https://docs.github.com/en/pull-requests/collaborating-with-pull-requests/proposing-changes-to-your-work-with-pull-requests/creating-a-pull-request-from-a-fork). This allows our team to review your contribution and leave comments. 
3. **Wait for Review**. We'll do our best to get to your contribution as soon as possible. If it's been 2-3 days and you have yet to receive any comments, DM Miguel on [Discord](https://stagehand.dev/discord).
4. **Merge into `evals` branch.** We don’t let external contributors [run our CI via GitHub Actions](https://github.com/browserbase/stagehand/blob/main/.github/workflows/ci.yml) to prevent spam and misuse. If your contribution passes an initial screen, we’ll run our evals on it.
    1. By default, all PRs run the following tests that you can also run from the repo source:
        1. Lint (`npm run lint`) - Runs `prettier` and `eslint`. If this fails, you can most likely run `npm run format` to fix some simple linting errors.
        2. Build (`npm run build`) - Lints and builds TS → JS in `dist/`
        3. End-to-End (`npm run e2e`) - These are deterministic end-to-end Playwright tests to ensure the integrity of basic Playwright functionality of [`stagehand.page`](http://stagehand.page) and `stagehand.context` as well as compatibility with the Browserbase API
        4. Combination (`npm run evals category combination`) - This runs AI-based end-to-end tests using combinations of `act`, `extract`, and `observe` 
    2. If you’re changing anything about `act`, `extract`, or `observe` itself, we might also run specific act/extract/observe evals to ensure existing functionality doesn’t significantly drop.
    
    ![CI](/images/CI.png)
    
5. **Cleanup and merge to main**. Once it’s in `evals`, unfortunately the original contributor can’t make any further changes. The internal Stagehand team will be responsible for cleaning up the code and bringing it into main. 

## Contribution Guidelines

1. **Use draft PRs.** If your PR is a work in progress, please convert it to a draft (see below) while you’re working on it, and mark it for review/add reviewers when you’re ready. This helps us prevent clutter in the review queue.
    
    ![Draft PR](/images/pr_draft.png)
    
2. **Provide a reproducible test plan.** Include an eval (preferred) or example. We can’t merge your PR if we can’t run anything that specifically highlights your contribution. 
    1. Write a script in [`evals/tasks`](https://github.com/browserbase/stagehand/tree/v2/evals/tasks) as `someTask.ts`
    2. Add your script to [`evals.config.json`](https://github.com/browserbase/stagehand/blob/v2/evals/evals.config.json) with default category `combination` (*or act/extract/observe if you’re* *only* *testing* *act/extract/observe*).
3. **Add a changeset.** Run `npx changeset` in TS or `uvx changeset` in Python to add a changeset that will directly reflect in the `CHANGELOG` in the upcoming release.
    1. `patch` - no net new functionality to an end-user
    2. `minor` - some net new functionality to an end-user (new function parameter, new exposed type, etc.)
    3. `major` - you shouldn’t be committing a major change


================================================
FILE: packages/docs/v2/best-practices/cost-optimization.mdx
================================================
---
title: Cost Optimization  
sidebarTitle: Cost Optimization
description: Minimize costs while maintaining automation performance
---

Cost optimization in Stagehand involves balancing LLM inference costs and browser infrastructure costs. This guide provides practical strategies to reduce your automation expenses.

## Quick Wins

Start with these simple optimizations that can reduce costs:

### 1. Use the Right Model for the Job

We don't recommend using larger, more premium models for simple tasks. See our [evaluation results](https://stagehand.dev/evals) for model performance and cost comparisons across different task types.

<CardGroup cols={2}>
<Card title="Model Selection Guide" icon="brain" href="/v2/configuration/models">
  Choose the right LLM for your budget and accuracy requirements
</Card>
<Card title="Evaluation Results" icon="chart-line" href="https://www.stagehand.dev/evals">
  See how different models perform on different tasks
</Card>
</CardGroup>

### 2. Implement Smart Caching

Cache successful actions to avoid repeated LLM calls. Learn the basics in our [Caching Guide](/v2/best-practices/caching):

<CodeGroup>
```typescript TypeScript
// Reuse the cached action when one exists (no LLM cost)
let action = await getCache("sign_in_button");

if (!action) {
  // Cache miss: pay for a single observe() call, then cache the result
  [action] = await page.observe("Click the sign in button");
  await setCache("sign_in_button", action);
}

// Run the action (no LLM inference)
await page.act(action);
```
```python Python
# Cache successful actions
actions = await page.observe("Click the sign in button")
action = actions[0]
await set_cache("sign_in_button", action)

# Reuse cached action (no LLM cost)
cached_action = await get_cache("sign_in_button")
if cached_action:
    await page.act(cached_action)
else:
    await page.act(action)
```
</CodeGroup>

<CardGroup cols={1}>
<Card title="Caching Guide" icon="database" href="/v2/best-practices/caching">
  Reduce costs with smart action caching and observe patterns
</Card>
</CardGroup>

### 3. Optimize Browser Sessions

Reuse sessions when possible and set appropriate timeouts. See [Browser Configuration](/v2/configuration/browser) for details:

<CodeGroup>
```typescript TypeScript
const stagehand = new Stagehand({
  env: "BROWSERBASE",
  browserbaseSessionCreateParams: {
    timeout: 1800, // 30 minutes instead of default 1 hour
    keepAlive: true, // Keep session alive between tasks
  }
});
```
```python Python
stagehand = Stagehand(
    env="BROWSERBASE",
    browserbase_session_create_params={
        "timeout": 1800,  # 30 minutes instead of default 1 hour
        "keep_alive": True,  # Keep session alive between tasks
    }
)
```
</CodeGroup>

<CardGroup cols={1}>
<Card title="Browserbase Cost Optimization" icon="window-maximize" href="https://docs.browserbase.com/guides/cost-optimization">
  Optimize Browserbase infrastructure costs and session management
</Card>
</CardGroup>

## Advanced Strategies

### Intelligent Model Switching

Start with a cheaper model and automatically fall back to a premium model only when the cheaper one fails:

<CodeGroup>
```typescript TypeScript
// Try models from least to most expensive, escalating only when one fails
// See stagehand.dev/evals for performance comparisons
async function smartAct(page: Page, prompt: string) {
  const models = ["cheaper-model", "premium-model"];
  let lastError: unknown;

  for (const model of models) {
    const stagehand = new Stagehand({ modelName: model });
    try {
      await stagehand.init();
      const [action] = await stagehand.page.observe(prompt);
      await stagehand.page.act(action);
      return;
    } catch (error) {
      // Remember the failure and move on to the next (more capable) model
      lastError = error;
      console.log(`${model} failed, trying the next model...`);
    } finally {
      // Always release the browser session so abandoned attempts don't keep billing
      await stagehand.close();
    }
  }

  // Every model failed: surface the last error instead of returning silently
  throw lastError;
}
```
```python Python
# Try models from least to most expensive, escalating only when one fails
# See stagehand.dev/evals for performance comparisons
async def smart_act(page, prompt: str):
    models = ["cheaper-model", "premium-model"]
    last_error = None

    for model in models:
        stagehand = Stagehand(model_name=model)
        try:
            await stagehand.init()
            actions = await stagehand.page.observe(prompt)
            action = actions[0]
            await stagehand.page.act(action)
            return
        except Exception as e:
            # Remember the failure and move on to the next (more capable) model
            last_error = e
            print(f"{model} failed, trying the next model...")
        finally:
            # Always release the browser session so abandoned attempts don't keep billing
            await stagehand.close()

    # Every model failed: surface the last error instead of returning silently
    raise last_error
```
</CodeGroup>

### Session Pooling

Reuse browser sessions across multiple tasks:

<CodeGroup>
```typescript TypeScript
class SessionManager {
  // One initialized Stagehand instance per task type
  private sessions = new Map<string, Stagehand>();

  /** Returns the session for `taskType`, creating and initializing it on first use. */
  async getSession(taskType: string): Promise<Stagehand> {
    if (!this.sessions.has(taskType)) {
      // First request for this task type: start a session and remember it
      const created = new Stagehand({ env: "BROWSERBASE" });
      await created.init();
      this.sessions.set(taskType, created);
      return created;
    }

    return this.sessions.get(taskType)!;
  }
}
```
```python Python
class SessionManager:
    """Keeps one initialized Stagehand session per task type."""

    def __init__(self):
        # Maps task type -> initialized Stagehand instance
        self.sessions = {}

    async def get_session(self, task_type: str):
        """Return the session for task_type, creating and initializing it on first use."""
        if task_type not in self.sessions:
            # First request for this task type: start a session and remember it
            created = Stagehand(env="BROWSERBASE")
            await created.init()
            self.sessions[task_type] = created
            return created

        return self.sessions[task_type]
```
</CodeGroup>

## Cost Monitoring

Track your spending to identify optimization opportunities. See our [Observability Guide](/v2/configuration/observability) for detailed metrics:

<CodeGroup>
```typescript TypeScript
// Monitor token usage
const metrics = stagehand.metrics;
console.log(`Total tokens: ${metrics.totalPromptTokens + metrics.totalCompletionTokens}`);
console.log(`Estimated cost: $${(metrics.totalPromptTokens + metrics.totalCompletionTokens) * 0.00001}`);
```
```python Python
# Monitor token usage
metrics = stagehand.metrics
total_tokens = metrics['total_prompt_tokens'] + metrics['total_completion_tokens']
print(f"Total tokens: {total_tokens}")
print(f"Estimated cost: ${total_tokens * 0.00001:.4f}")
```
</CodeGroup>

<CardGroup cols={1}>
<Card title="Observability & Metrics" icon="chart-line" href="/v2/configuration/observability">
  Monitor usage patterns and track costs in real-time
</Card>
</CardGroup>

## Budget Controls

Set spending limits to prevent unexpected costs:

<CodeGroup>
```typescript TypeScript
class BudgetGuard {
  // Running total of the costs approved so far
  private dailySpend = 0;

  /** @param maxDailyBudget Spending ceiling in dollars (defaults to 25). */
  constructor(private maxDailyBudget: number = 25) {}

  /**
   * Records `estimatedCost` against the budget.
   * Throws, without recording the cost, if it would push spend past the ceiling.
   */
  checkBudget(estimatedCost: number): void {
    const projectedSpend = this.dailySpend + estimatedCost;
    if (projectedSpend > this.maxDailyBudget) {
      throw new Error(`Daily budget exceeded: $${this.maxDailyBudget}`);
    }
    this.dailySpend = projectedSpend;
  }
}
```
```python Python
class BudgetGuard:
    """Tracks cumulative spend and rejects costs that would exceed the budget."""

    def __init__(self, max_daily_budget: float = 25.0):
        self.max_daily_budget = max_daily_budget
        # Running total of the costs approved so far
        self.daily_spend = 0

    def check_budget(self, estimated_cost: float) -> None:
        """Record estimated_cost; raise without recording it if it would exceed the budget."""
        projected_spend = self.daily_spend + estimated_cost
        if projected_spend > self.max_daily_budget:
            raise Exception(f"Daily budget exceeded: ${self.max_daily_budget}")
        self.daily_spend = projected_spend
```
</CodeGroup>


## Related Resources

<CardGroup cols={2}>
<Card title="Model Selection Guide" icon="brain" href="/v2/configuration/models">
  Choose the right LLM for your budget and accuracy requirements
</Card>

<Card title="Caching Strategies" icon="database" href="/v2/best-practices/caching">
  Reduce costs with smart action caching and observe patterns
</Card>

<Card title="Observability & Metrics" icon="chart-line" href="/v2/configuration/observability">
  Monitor usage patterns and track costs in real-time
</Card>

<Card title="Browser Configuration" icon="window-maximize" href="/v2/configuration/browser">
  Optimize Browserbase infrastructure costs and session management
</Card>
</CardGroup>

================================================
FILE: packages/docs/v2/best-practices/deployments.mdx
================================================
---
title: 'Deploying Stagehand'
description: 'Deploy your AI agents and automations to the cloud'
---

<Tip>
**🌟 Preview: Browser Functions** - Deploy your web automation code directly on Browserbase with browser functions. Scale your `act()` automations in the cloud with zero infrastructure setup. Reach out to hello@browserbase.com to get beta access.
</Tip>

## Deploy on Vercel

Securely run Stagehand on Browserbase inside a Vercel Function. This guide shows a minimal, production-safe HTTP endpoint you can call directly or on a schedule.

### 1. Install Vercel CLI

To download and install Vercel CLI, run one of the following commands:

<CodeGroup>
```bash pnpm
pnpm i -g vercel
```
```bash yarn
yarn global add vercel
```
```bash npm
npm i -g vercel
```
```bash bun
bun add -g vercel
```
</CodeGroup>

### 2. Project layout

```text
your-project/
  api/
    run.ts
  package.json
  tsconfig.json
  vercel.json
```

Create the structure with:

```bash
mkdir -p api
touch api/run.ts package.json vercel.json tsconfig.json
```

### 3. `api/run.ts` (Node.js runtime)

```typescript
// api/run.ts
import type { VercelRequest, VercelResponse } from "@vercel/node";
import { Stagehand } from "@browserbasehq/stagehand";
import { z } from "zod/v3";

/**
 * Vercel Function entry point: runs a short Stagehand automation on Browserbase
 * and responds with the extracted text as JSON.
 *
 * Responds with 200 `{ ok: true, data }` on success and 500 `{ ok: false, error }`
 * when any step throws.
 */
export default async function handler(req: VercelRequest, res: VercelResponse): Promise<void> {
  // Declared outside `try` so `finally` can release the session on every path
  let stagehand: Stagehand | undefined;

  try {
    stagehand = new Stagehand({
      env: "BROWSERBASE",
      apiKey: process.env.BROWSERBASE_API_KEY!,
      projectId: process.env.BROWSERBASE_PROJECT_ID!,
      disablePino: true,
      modelName: "google/gemini-2.5-flash",
      modelClientOptions: {
        apiKey: process.env.GOOGLE_API_KEY!,
      },
      // optional session params
      browserbaseSessionCreateParams: {
        projectId: process.env.BROWSERBASE_PROJECT_ID!,
        region: "us-west-2",
        browserSettings: {
          blockAds: true,
        },
      },
    });

    await stagehand.init();
    const page = stagehand.page;

    await page.goto("https://www.stagehand.dev/");
    await page.act("click the evals button");

    const { extraction } = await page.extract("extract the fastest model");

    res.status(200).json({ ok: true, data: extraction ?? "" });
  } catch (err: unknown) {
    const msg = err instanceof Error ? err.message : String(err);
    res.status(500).json({ ok: false, error: msg });
  } finally {
    // Always release the Browserbase session, even when a step above throws;
    // a failed close is logged because the response has already been sent
    await stagehand?.close().catch((closeErr: unknown) => {
      console.error("Failed to close Stagehand session:", closeErr);
    });
  }
}
```

### 4. `package.json`

```json
{
    "name": "bb-stagehand-on-vercel",
    "private": true,
    "type": "module",
    "engines": { "node": ">=18" },
    "dependencies": {
      "@browserbasehq/stagehand": "^2.4.3",
      "zod": "^3.25.0"
    },
    "devDependencies": {
      "typescript": "^5.6.0",
      "@types/node": "^20.12.12",
      "@vercel/node": "^3.2.20"
    }
}
```

### 5. `tsconfig.json`

```json
{
  "compilerOptions": {
    "target": "ES2022",
    "module": "ES2022",
    "moduleResolution": "node",
    "outDir": ".vercel/output/functions",
    "strict": true,
    "esModuleInterop": true,
    "skipLibCheck": true,
    "types": ["node"]
  },
  "include": ["api/**/*.ts"]
}
```

### 6. `vercel.json`

```json
{
  "$schema": "https://openapi.vercel.sh/vercel.json",
  "functions": {
    "api/run.ts": {
      "maxDuration": 60
    }
  }
}
```

See Vercel's [configuring functions](https://vercel.com/docs/functions/configuring-functions) docs for more details.

### 7. Link your project

Link your local folder to a Vercel project before configuring environment variables:

```bash
# authenticate if needed
vercel login

# link the current directory to a Vercel project (interactive)
vercel link
```

### 8. Environment variables

Do not commit `.env` in production. Add variables via Vercel CLI:

```bash
vercel env add BROWSERBASE_API_KEY
vercel env add BROWSERBASE_PROJECT_ID
# (and your model key if needed)
vercel env add GOOGLE_API_KEY
```

See also: [Browser Environment](/configuration/environment) for details on required variables.

### 9. Test locally

Replicate the Vercel environment locally to exercise your Function before deploying. Run from the project root.

```bash
# ensure dependencies are installed
npm install

# start the local Vercel dev server
vercel dev --listen 5005
```

### 10. Deploy

```bash
vercel
vercel --prod
```

### Execute the function

#### Configure Protection Bypass for Automation

Before invoking the production URL, create a Protection Bypass for Automation:

1. Generate a 32-character secret (you can use `openssl rand -hex 16`)
2. Go to your project in Vercel
3. Navigate to Settings → Deployment Protection
4. Add the secret to "Protection Bypass for Automation"

Then invoke the function with the bypass header:

```bash
curl -X POST \
  -H "x-vercel-protection-bypass: <your-32-character-secret>" \
  https://<your-deployment>/api/run
```

### Optional: Cron on Vercel

Hit the same endpoint on a schedule by extending `vercel.json`:

```json
{
  "$schema": "https://openapi.vercel.sh/vercel.json",
  "functions": {
    "api/run.ts": {
      "maxDuration": 60
    }
  },
  "crons": [
    { "path": "/api/run", "schedule": "0 * * * *" }
  ]
}
```

### Features
- **No local browsers needed** with `env: "BROWSERBASE"`. [Browserbase](https://www.browserbase.com/) provides the browsers.
- **Fast functionality**: Offload browser work to Browserbase and return JSON promptly.
- **Long-running tasks**: Raise `maxDuration` and/or consider Edge runtime limits depending on plan.


================================================
FILE: packages/docs/v2/best-practices/mcp-integrations.mdx
================================================
---
title: "MCP Integrations"
description: "Using Model Context Protocol (MCP) integrations to enhance agent capabilities"
---

## What are MCP Integrations?

MCP (Model Context Protocol) integrations allow you to connect your Stagehand agents to external tools, APIs, and services. This enables agents to perform actions beyond browser automation, such as web search, database operations, and API calls.

<Info>
MCP integrations make your agents more powerful by combining browser automation with external capabilities. The agent can intelligently decide when to use browser actions versus external tools.
</Info>

## Connection Options

There are two options for connecting to MCP servers:

1. **Pass a URL directly** - The simplest approach for quick setup
2. **Create a connection first** - Gives you more control over the connection

<Note>
MCP client support is currently only available in TypeScript.
</Note>

## Passing a URL

The simplest way to add MCP integrations is by providing server URLs directly in the agent configuration:

```typescript
const agent = stagehand.agent({
  provider: "openai",
  model: "computer-use-preview",
  integrations: [
    `https://mcp.exa.ai/mcp?exaApiKey=${process.env.EXA_API_KEY}`,
  ],
  instructions: `You have access to web search through Exa. Use it to find current information before browsing.`,
  options: {
    apiKey: process.env.OPENAI_API_KEY,
  },
});

await agent.execute("Search for the best headphones of 2025 and go through checkout for the top recommendation");
```

## Creating a Connection First

Alternatively, you can establish MCP connections first and then pass the client objects:

```typescript
import { connectToMCPServer } from "@browserbasehq/stagehand";

// Connect to MCP server
const supabaseClient = await connectToMCPServer(
  `https://server.smithery.ai/@supabase-community/supabase-mcp/mcp?api_key=${process.env.SMITHERY_API_KEY}`
);

// You can also pass the config to start a local MCP server
const notionClient = await connectToMCPServer({
  command: "npx",
  args: ["-y", "@notionhq/notion-mcp-server"],
  env: {
    NOTION_TOKEN: process.env.NOTION_TOKEN,
  },
});

// Use the connected client
const agent = stagehand.agent({
  provider: "openai", 
  model: "computer-use-preview",
  integrations: [supabaseClient, notionClient],
  instructions: `You can interact with Supabase databases and Notion. Use these tools to store and retrieve data.`,
  options: {
    apiKey: process.env.OPENAI_API_KEY,
  },
});

await agent.execute("Search for restaurants in New Brunswick, NJ and save the first result to the database");
```


## Multiple Integrations

You can combine multiple MCP integrations in a single agent:

```typescript
const databaseClient = await connectToMCPServer(/* database config */);

const agent = stagehand.agent({
  integrations: [
    `https://search-service.example.com/mcp?apiKey=${process.env.SEARCH_API_KEY}`,
    databaseClient
  ],
  instructions: `You have access to external tools for search and data storage. Use these tools strategically to complete tasks efficiently.`
});
```

## Best Practices

### Choose the Right Connection Approach
<Tabs>
<Tab title="Passing a URL">
**When to use:**
- Simple setup requirements
- Standard API configurations
- Getting started quickly

**Benefits:**
- Minimal code required
- Automatic connection handling
- Easy to configure
</Tab>

<Tab title="Creating a Connection First">
**When to use:**
- Custom connection options
- Connection reuse across agents
- Advanced error handling

**Benefits:**
- Full control over connections
- Better error handling
- Connection pooling capabilities
</Tab>
</Tabs>

### Environment Variables

Always use environment variables for API keys and sensitive information:

```bash
# .env file
SEARCH_API_KEY=your_search_service_key
MCP_SERVICE_API_KEY=your_mcp_service_key
OPENAI_API_KEY=your_openai_key
DATABASE_URL=your_database_url
DATABASE_API_KEY=your_database_key
```

### Instructions Best Practices

Provide clear instructions about available tools:

<Tabs>
<Tab title="Good Instructions">
```typescript
instructions: `You have access to:
1. Web search tools - Use to find current information
2. Database tools - Use to store/retrieve data
3. Browser automation - Use for web interactions

Always search for current information before making decisions.
Store important data for later reference.`
```
</Tab>

<Tab title="Poor Instructions">
```typescript
instructions: "You can search and save data."
```
</Tab>
</Tabs>

### Error Handling

Implement proper error handling for MCP connections:

```typescript
try {
  const client = await connectToMCPServer(serverUrl);
  
  const agent = stagehand.agent({
    integrations: [client],
    // ... other config
  });
  
  const result = await agent.execute(instruction);
} catch (error) {
  console.error("MCP integration failed:", error);
  // Handle fallback behavior
}
```

## Troubleshooting

<AccordionGroup>
<Accordion title="Connection timeouts">
**Problem:** MCP server connections timing out

**Solutions:**
- Verify server URLs are correct and accessible
- Check network connectivity
- Ensure API keys are valid and have proper permissions
- Try connecting to servers individually to isolate issues
</Accordion>

<Accordion title="Tool not being used">
**Problem:** Agent not using available MCP tools

**Solutions:**
- Make instructions more specific about when to use tools
- Ensure API keys are properly configured
- Check that the MCP server supports the expected tools
- Verify tool descriptions are clear and actionable
</Accordion>

<Accordion title="Authentication errors">
**Problem:** API key or authentication failures

**Solutions:**
- Verify all required environment variables are set
- Check API key validity and permissions  
- Ensure URLs include necessary authentication parameters
- Test MCP connections independently before using in agents
</Accordion>
</AccordionGroup>

## Examples

### Web Search + Browser Automation
```typescript
const agent = stagehand.agent({
  integrations: [`https://mcp.exa.ai/mcp?exaApiKey=${process.env.EXA_API_KEY}`],
  instructions: `First search for current information, then use the browser to complete tasks based on what you find.`
});

await agent.execute("Find the best laptop deals for 2025 and navigate to purchase the top recommendation");
```

### Data Extraction + Storage
```typescript
const supabaseClient = await connectToMCPServer(/* config */);

const agent = stagehand.agent({
  integrations: [supabaseClient],
  instructions: `Extract data from websites and store it using available database tools.`
});

await agent.execute("Extract all restaurant information from this directory and save it to the database");
```

### Multi-tool Workflow
```typescript
const agent = stagehand.agent({
  integrations: [
    `https://mcp.exa.ai/mcp?exaApiKey=${process.env.EXA_API_KEY}`,
    supabaseClient
  ],
  instructions: `Use all available tools strategically: search for current info, browse websites, and store important data.`
});

await agent.execute("Research competitor pricing, compare with our site, and store the analysis");
```

## Further Reading

<CardGroup cols={3}>
<Card title="Agent Basics" icon="robot" href="/v2/basics/agent">
  Learn the fundamentals of Stagehand agents
</Card>

<Card title="MCP Server Setup" icon="server" href="/v2/integrations/mcp/setup">  
  Set up your own MCP server
</Card>

<Card title="Custom Tools" icon="wrench" href="/v2/integrations/mcp/tools">
  Create custom MCP tools
</Card>
</CardGroup>


================================================
FILE: packages/docs/v2/best-practices/playwright-interop.mdx
================================================
---
title: 'Playwright Interoperability'
description: 'How Stagehand interacts with Playwright'
---

Stagehand is built on top of [Playwright](https://playwright.dev/), so you can use Playwright methods directly through the Stagehand instance.

## `page` and `context`

`stagehand.page` and `stagehand.context` are instances of Playwright's `Page` and `BrowserContext` respectively. Use these objects to interact with the Playwright instance that Stagehand is using.

<CodeGroup>
```typescript TypeScript
const page = stagehand.page;
// Base Playwright methods work
await page.goto("https://github.com/browserbase/stagehand");

// Stagehand overrides Playwright objects
await page.act("click on the contributors")
```

```python Python
page = stagehand.page
# Base Playwright methods work
await page.goto("https://github.com/browserbase/stagehand")

# Stagehand overrides Playwright objects
await page.act("click on the contributors")
```
</CodeGroup>

## Stagehand v. Playwright
Below is an example of how to extract a list of companies from the AI Grant website using both Stagehand and Playwright.

<img src="/images/stagehand-playwright.png" alt="Stagehand v. Playwright" />

The above example with Stagehand can be easily reused to extract data from other websites, whereas the Playwright example would need to be rewritten for each new website.

================================================
FILE: packages/docs/v2/best-practices/prompting-best-practices.mdx
================================================
---
title: Prompting Best Practices
description: "Write effective prompts for reliable Stagehand automation"
---

Good prompts make Stagehand reliable. Bad prompts cause failures. Here's how to write prompts that work consistently.

## Act Method

Use `act()` for single actions on web pages. Each action should be focused and clear.

<CodeGroup>
```typescript TypeScript
// Good - Single, specific actions
await page.act("click the 'Add to Cart' button");
await page.act("type 'user@example.com' into the email field");

// Bad - Multiple actions combined
await page.act("fill out the form and submit it");
await page.act("login with credentials and navigate to dashboard");
```

```python Python
# Good - Single, specific actions
await page.act("click the 'Add to Cart' button")
await page.act("type 'user@example.com' into the email field")

# Bad - Multiple actions combined
await page.act("fill out the form and submit it")
await page.act("login with credentials and navigate to dashboard")
```
</CodeGroup>

### Use Element Types, Not Colors

Describe elements by their type and function rather than visual attributes like color.

<CodeGroup>
```typescript TypeScript
// Good - Element types and descriptive text
await page.act("click the 'Sign In' button");
await page.act("type into the email input field");

// Bad - Color-based descriptions
await page.act("click the blue button");
await page.act("type into the white input");
```

```python Python
# Good - Element types and descriptive text
await page.act("click the 'Sign In' button")
await page.act("type into the email input field")

# Bad - Color-based descriptions
await page.act("click the blue button")
await page.act("type into the white input")
```
</CodeGroup>

### Use Descriptive Language

<CodeGroup>
```typescript TypeScript
// Good - Clear element identification
await page.act("click the 'Next' button at the bottom of the form");
await page.act("type into the search bar at the top of the page");

// Bad - Vague descriptions
await page.act("click next");
await page.act("type into search");
```

```python Python
# Good - Clear element identification
await page.act("click the 'Next' button at the bottom of the form")
await page.act("type into the search bar at the top of the page")

# Bad - Vague descriptions
await page.act("click next")
await page.act("type into search")
```
</CodeGroup>

### Choose the Right Action Verbs

- **Click** for buttons, links, checkboxes
- **Type** for text inputs
- **Select** for dropdowns
- **Check/uncheck** for checkboxes
- **Upload** for file inputs

<CodeGroup>
```typescript TypeScript
// Good
await page.act("click the submit button");
await page.act("select 'Option 1' from dropdown");

// Bad
await page.act("click submit");
await page.act("choose option 1");
```

```python Python
# Good
await page.act("click the submit button")
await page.act("select 'Option 1' from dropdown")

# Bad
await page.act("click submit")
await page.act("choose option 1")
```
</CodeGroup>

### Protect Sensitive Data

Variables keep sensitive information out of prompts and logs.

<CodeGroup>
```typescript TypeScript
// Good - Secure approach
await page.act({
  action: "enter %username% in the email field",
  variables: {
    username: "user@example.com"
  }
});

await page.act({
  action: "enter %password% in the password field", 
  variables: {
    password: process.env.USER_PASSWORD
  }
});

// Bad - Insecure approach
await page.act("type 'mySecretPassword123' into the password field");
```

```python Python
import os

# Good - Secure approach
await page.act(
  "enter %username% in the email field",
  variables={
    "username": "user@example.com"
  }
)

await page.act(
  "enter %password% in the password field",
  variables={
    "password": os.environ.get("USER_PASSWORD")
  }
)

# Bad - Insecure approach
await page.act("type 'mySecretPassword123' into the password field")
```
</CodeGroup>

<Warning>
Set `verbose: 0` in your Stagehand config to prevent secrets from appearing in logs.
</Warning>

## Extract Method

Use `extract()` to pull structured data from pages. Define clear schemas and provide context.

### Schema Best Practices

Use descriptive field names, correct types, and detailed descriptions. Field descriptions provide context that helps the agent understand exactly what to extract.

<CodeGroup>
```typescript TypeScript
// Good - Descriptive names, correct types, and helpful descriptions
const productData = await page.extract({
  instruction: "Extract product information",
  schema: z.object({
    productTitle: z.string().describe("The main product name displayed on the page"),
    priceInDollars: z.number().describe("Current selling price as a number, without currency symbol"),
    isInStock: z.boolean().describe("Whether the product is available for purchase")
  })
});

// Bad - Generic names, wrong types, no descriptions
const data = await page.extract({
  instruction: "Get product details", 
  schema: z.object({
    name: z.string(), // Too generic, no context
    price: z.string(), // Should be number
    stock: z.string() // Should be boolean, no context
  })
});
```

```python Python
from pydantic import BaseModel, Field

# Good - Descriptive names, correct types, and helpful descriptions
class ProductData(BaseModel):
    productTitle: str = Field(description="The main product name displayed on the page")
    priceInDollars: float = Field(description="Current selling price as a number, without currency symbol")
    isInStock: bool = Field(description="Whether the product is available for purchase")

productData = await page.extract(
  "Extract product information",
  schema=ProductData
)

# Bad - Generic names, wrong types, no descriptions
class Data(BaseModel):
    name: str      # Too generic, no context
    price: str     # Should be float, no context
    stock: str     # Should be bool, no context

data = await page.extract(
  "Get product details",
  schema=Data
)
```
</CodeGroup>

### Handle Arrays Correctly

Always wrap arrays in an object schema for reliable extraction.

<CodeGroup>
```typescript TypeScript
// Good - Array wrapped in object
const listings = await page.extract({
  instruction: "Extract all apartment listings",
  schema: z.object({
    apartments: z.array(z.object({
      address: z.string(),
      rent: z.number()
    }))
  })
});

// Bad - Bare array
const listings = await page.extract({
  instruction: "Extract apartment listings",
  schema: z.array(z.string()) // Don't do this
});
```

```python Python
from pydantic import BaseModel
from typing import List

# Good - Array wrapped in object
class Apartment(BaseModel):
    address: str
    rent: float

class Listings(BaseModel):
    apartments: List[Apartment]

listings = await page.extract(
  "Extract all apartment listings",
  schema=Listings
)

# Bad - Bare array (not supported)
# Don't do this - arrays must be wrapped in objects
```
</CodeGroup>

### Use Proper URL Types

Specify URL types to tell Stagehand to extract URLs. Without proper URL types, Stagehand won't extract URLs.

<CodeGroup>
```typescript TypeScript
// Good - Tells Stagehand to extract URLs
const links = await page.extract({
  instruction: "Extract navigation links",
  schema: z.object({
    links: z.array(z.object({
      text: z.string(),
      url: z.string().url() // Required for URL extraction
    }))
  })
});
```

```python Python
from pydantic import BaseModel, HttpUrl
from typing import List

# Good - Tells Stagehand to extract URLs
class Link(BaseModel):
    text: str
    url: HttpUrl  # Required for URL extraction

class Links(BaseModel):
    links: List[Link]

links = await page.extract(
  "Extract navigation links",
  schema=Links
)
```
</CodeGroup>

## Observe Method

Use `observe()` to discover actionable elements before acting on them.

### Check Elements First

Verify elements exist before taking action to avoid errors.

<CodeGroup>
```typescript TypeScript
// Check for elements first
const loginButtons = await page.observe("Find the login button");

if (loginButtons.length > 0) {
  await page.act(loginButtons[0]);
} else {
  console.log("No login button found");
}
```

```python Python
# Check for elements first
login_buttons = await page.observe("Find the login button")

if len(login_buttons) > 0:
    await page.act(login_buttons[0])
else:
    print("No login button found")
```
</CodeGroup>

### Be Specific About Element Types

<CodeGroup>
```typescript TypeScript
// Good - Specific element types
const submitButtons = await page.observe("Find submit button in the form");
const dropdowns = await page.observe("Find the state dropdown menu");

// Bad - Too vague
const elements = await page.observe("Find submit stuff");
const things = await page.observe("Find state selection");
```

```python Python
# Good - Specific element types
submit_buttons = await page.observe("Find submit button in the form")
dropdowns = await page.observe("Find the state dropdown menu")

# Bad - Too vague
elements = await page.observe("Find submit")
things = await page.observe("Find state selection")
```
</CodeGroup>

## Agent Method

Use `agent()` for complex, multi-step workflows. Provide detailed instructions and set appropriate limits.

### Navigate First

Don't include navigation in agent tasks. Handle it separately.

<CodeGroup>
```typescript TypeScript
// Good - Navigate first
await page.goto('https://amazon.com');
await agent.execute('Search for wireless headphones under $100 and add the best rated one to cart');

// Bad - Navigation in task
await agent.execute('Go to Amazon, search for headphones, and add one to cart');
```

```python Python
# Good - Navigate first
await page.goto('https://amazon.com')
await agent.execute('Search for wireless headphones under $100 and add the best rated one to cart')

# Bad - Navigation in task
await agent.execute('Go to Amazon, search for headphones, and add one to cart')
```
</CodeGroup>

### Be Highly Specific

Detailed instructions lead to better results.

<CodeGroup>
```typescript TypeScript
// Good - Detailed instructions
await agent.execute({
  instruction: "Find Italian restaurants in Brooklyn that are open after 10pm, have outdoor seating, and are rated 4+ stars. Save the top 3 results.",
  maxSteps: 25
});

// Bad - Vague instructions
await agent.execute("Find some good restaurants");
```

```python Python
# Good - Detailed instructions
await agent.execute(
  instruction="Find Italian restaurants in Brooklyn that are open after 10pm, have outdoor seating, and are rated 4+ stars. Save the top 3 results.",
  max_steps=25
)

# Bad - Vague instructions
await agent.execute("Find some good restaurants")
```
</CodeGroup>

### Set Appropriate Step Limits

Match step limits to task complexity.

<CodeGroup>
```typescript TypeScript
// Simple task - fewer steps
await agent.execute({
  instruction: "Subscribe to the newsletter with email 'user@example.com'",
  maxSteps: 10
});

// Complex task - more steps  
await agent.execute({
  instruction: "Research and compare 5 project management tools with pricing and features",
  maxSteps: 50
});
```

```python Python
# Simple task - fewer steps
await agent.execute(
  instruction="Subscribe to the newsletter with email 'user@example.com'",
  max_steps=10
)

# Complex task - more steps
await agent.execute(
  instruction="Research and compare 5 project management tools with pricing and features",
  max_steps=50
)
```
</CodeGroup>

### Include Success Criteria

Tell the agent how to know when it's done.

<CodeGroup>
```typescript TypeScript
// Good - Clear success criteria
await agent.execute({
  instruction: "Add 3 smartphone cases to cart and confirm the cart shows exactly 3 items with total price",
  maxSteps: 20
});

// Bad - No validation
await agent.execute("Add some items to cart");
```

```python Python
# Good - Clear success criteria
await agent.execute(
  instruction="Add 3 smartphone cases to cart and confirm the cart shows exactly 3 items with total price",
  max_steps=20
)

# Bad - No validation
await agent.execute("Add some items to cart")
```
</CodeGroup>

## Common Mistakes to Avoid

- **Combining multiple actions** - Keep each `act()` call to one action
- **Using vague descriptions** - Be specific about which elements to interact with  
- **Exposing sensitive data** - Always use variables for credentials
- **Skipping validation** - Check results before proceeding

## Testing Your Prompts

1. **Start simple** - Test basic functionality first
2. **Add complexity gradually** - Build up to complex workflows
3. **Monitor results** - Use logging to understand what's happening
4. **Iterate based on failures** - Refine prompts when they don't work

Remember: Good prompting is iterative. When in doubt, be more specific rather than less.

================================================
FILE: packages/docs/v2/best-practices/speed-optimization.mdx
================================================
---
title: Speed Optimization
sidebarTitle: Speed Optimization
description: Optimize Stagehand performance for faster automation and reduced latency
---

Stagehand performance depends on several factors: DOM processing speed, LLM inference time, browser operations, and network latency. This guide provides proven strategies to maximize automation speed.

## Quick Performance Wins

### 1. Plan Ahead with Observe


Use a single `observe()` call to plan multiple actions, then execute them efficiently:

<CodeGroup>
```typescript TypeScript
// Instead of sequential operations with multiple LLM calls
await page.act("Fill name field");        // LLM call #1
await page.act("Fill email field");       // LLM call #2
await page.act("Select country dropdown"); // LLM call #3

// Use single observe to plan all form fields - one LLM call
const formFields = await page.observe("Find all form fields to fill");

// Execute all actions without LLM inference
for (const field of formFields) {
  await page.act(field); // No LLM calls!
}
```
```python Python
import asyncio

# Instead of sequential operations with multiple LLM calls
await page.act("Fill name field")        # LLM call #1
await page.act("Fill email field")       # LLM call #2  
await page.act("Select country dropdown") # LLM call #3

# Use single observe to plan all form fields - one LLM call
form_fields = await page.observe("Find all form fields to fill")

# Execute all actions without LLM inference
for field in form_fields:
    await page.act(field) # No LLM calls!

```
</CodeGroup>

<Note>
**Performance Tip**: Acting on `observe` results avoids LLM inference entirely. This approach is 2-3x faster than direct `act()` calls and is the recommended pattern for multi-step workflows.
</Note>

<Card title="Caching Guide" icon="database" href="/v2/best-practices/caching">
  Learn advanced caching patterns and cache invalidation strategies
</Card>

### 2. Optimize DOM Processing

Reduce DOM complexity before Stagehand processes the page:

<CodeGroup>
```typescript TypeScript
// Remove heavy elements that slow down processing
await page.evaluate(() => {
  // Remove video elements
  document.querySelectorAll('video, iframe').forEach(el => el.remove());
  
  // Hide complex animations
  document.querySelectorAll('[style*="animation"]').forEach(el => {
    (el as HTMLElement).style.animation = 'none';
  });
});

// Then perform Stagehand operations
await page.act("Click the submit button");
```
```python Python
# Remove heavy elements that slow down processing
await page.evaluate("""
() => {
  // Remove video elements
  document.querySelectorAll('video, iframe').forEach(el => el.remove());
  
  // Hide complex animations
  document.querySelectorAll('[style*="animation"]').forEach(el => {
    el.style.animation = 'none';
  });
}
""")

# Then perform Stagehand operations
await page.act("Click the submit button")
```
</CodeGroup>

### 3. Set Appropriate Timeouts

Use shorter timeouts for simple operations and longer ones for complex page loads:

<CodeGroup>
```typescript TypeScript
// Simple actions - reduce action timeout
await page.act({ 
  instruction: "Click the login button",
  actTimeout: 5000  // Default is 30000ms, reduce for simple clicks
});

// Complex page loads - optimize navigation
await page.goto("https://heavy-spa.com", {
  waitUntil: "domcontentloaded", // Don't wait for all resources
  timeout: 15000 // Shorter than default 30s
});
```
```python Python
# Simple actions - reduce action timeout
await page.act("Click button", act_timeout=5000)


# Complex page loads - optimize navigation
await page.goto("https://heavy-spa.com", 
    wait_until="domcontentloaded",
    timeout=15000
)
```
</CodeGroup>

## Advanced Performance Strategies


### Smart Model Selection

Use faster models for simple tasks, premium models only when needed:

<CodeGroup>
```typescript TypeScript
class SpeedOptimizedStagehand {
  private fastModel: Stagehand;
  private premiumModel: Stagehand;

  async smartAct(page: Page, prompt: string, complexity: 'simple' | 'complex') {
    const model = complexity === 'simple' ? this.fastModel : this.premiumModel;
    return await model.page.act(prompt);
  }
}

// Use fast model for simple clicks/forms
await stagehand.smartAct(page, "Click submit", 'simple');

// Use premium model for complex reasoning
await stagehand.smartAct(page, "Find the cheapest flight option", 'complex');
```
```python Python
class SpeedOptimizedStagehand:
    def __init__(self):
        self.fast_model = Stagehand(model_name="fast-model")
        self.premium_model = Stagehand(model_name="premium-model")
    
    async def smart_act(self, page, prompt: str, complexity: str):
        model = self.fast_model if complexity == 'simple' else self.premium_model
        return await model.page.act(prompt)

# Use fast model for simple clicks/forms
await stagehand.smart_act(page, "Click submit", 'simple')

# Use premium model for complex reasoning  
await stagehand.smart_act(page, "Find the cheapest flight option", 'complex')
```
</CodeGroup>

<Card title="Model Configuration" icon="brain" href="/v2/configuration/models">
  Compare model performance and costs
</Card>

### Page Load Optimization

Skip unnecessary resources during page loads:

<CodeGroup>
```typescript TypeScript
// Block heavy resources globally
await context.route('**/*', (route) => {
  const resourceType = route.request().resourceType();
  if (['image', 'font', 'media'].includes(resourceType)) {
    route.abort();
  } else {
    route.continue();
  }
});

// Use faster navigation
await page.goto(url, { 
  waitUntil: 'domcontentloaded',  // Don't wait for images/fonts
  timeout: 10000 
});
```
```python Python
# Block heavy resources globally
async def handle_route(route):
    resource_type = route.request.resource_type
    if resource_type in ['image', 'font', 'media']:
        await route.abort()
    else:
        await route.continue_()

await context.route('**/*', handle_route)

# Use faster navigation
await page.goto(url, 
    wait_until='domcontentloaded',  # Don't wait for images/fonts
    timeout=10000
)
```
</CodeGroup>
<Card title="Cost Optimization" icon="dollar-sign" href="/v2/best-practices/cost-optimization">
  Balance speed with cost considerations
</Card>

## Performance Monitoring and Benchmarking

Track performance metrics and measure optimization impact:

### Performance Tracking

<CodeGroup>
```typescript TypeScript
class PerformanceTracker {
  private speedMetrics: Map<string, number[]> = new Map();

  async timedAct(page: Page, prompt: string): Promise<ActResult> {
    const start = Date.now();
    const result = await page.act(prompt);
    const duration = Date.now() - start;
    
    if (!this.speedMetrics.has(prompt)) {
      this.speedMetrics.set(prompt, []);
    }
    this.speedMetrics.get(prompt)!.push(duration);
    
    console.log(`Action "${prompt}" took ${duration}ms`);
    return result;
  }

  getAverageTime(prompt: string): number {
    const times = this.speedMetrics.get(prompt) || [];
    return times.reduce((a, b) => a + b, 0) / times.length;
  }
}
```
```python Python
import time
from collections import defaultdict

class PerformanceTracker:
    def __init__(self):
        self.speed_metrics = defaultdict(list)
    
    async def timed_act(self, page, prompt: str):
        start = time.time()
        result = await page.act(prompt)
        duration = (time.time() - start) * 1000  # Convert to ms
        
        self.speed_metrics[prompt].append(duration)
        print(f'Action "{prompt}" took {duration:.0f}ms')
        return result
    
    def get_average_time(self, prompt: str) -> float:
        times = self.speed_metrics[prompt]
        return sum(times) / len(times) if times else 0
```
</CodeGroup>

Example Output:
```
Action "Fill form" took 1000ms
Action "Click submit" took 2000ms
Action "Confirm submission" took 5000ms
```

### Before vs After Benchmarking

<CodeGroup>
```typescript TypeScript
// Before optimization
console.time("workflow");
await page.act("Fill form");
await page.act("Click submit");
await page.act("Confirm submission");
console.timeEnd("workflow"); // 8000ms

// After optimization with observe planning
console.time("workflow-optimized");
const workflowActions = await page.observe("Find form, submit, and confirm elements");

// Execute actions sequentially to avoid conflicts
for (const action of workflowActions) {
  await page.act(action);
}
console.timeEnd("workflow-optimized"); // 500ms
```
```python Python
import time

# Before optimization  
start = time.time()
await page.act("Fill form")
await page.act("Click submit") 
await page.act("Confirm submission")
print(f"Workflow took {(time.time() - start) * 1000:.0f}ms")  # 8000ms

# After optimization with observe planning
start = time.time()
workflow_actions = await page.observe("Find form, submit, and confirm elements")

# Execute actions sequentially to avoid conflicts
for action in workflow_actions:
    await page.act(action)
print(f"Optimized workflow took {(time.time() - start) * 1000:.0f}ms")  # 500ms
```
</CodeGroup>

Example Output:
```
Workflow took 8000ms
Optimized workflow took 500ms
```

<CardGroup cols={1}>
<Card title="Observability & Metrics" icon="chart-line" href="/v2/configuration/observability">
  Set up comprehensive performance monitoring
</Card>
</CardGroup>


## Related Resources

<CardGroup cols={2}>
<Card title="Caching Strategies" icon="database" href="/v2/best-practices/caching">
  Advanced caching patterns for maximum performance
</Card>

<Card title="Cost Optimization" icon="dollar-sign" href="/v2/best-practices/cost-optimization">
  Balance speed improvements with cost considerations
</Card>

<Card title="Browser Configuration" icon="window-maximize" href="/v2/configuration/browser">
  Optimize Browserbase settings for speed
</Card>

<Card title="Model Selection" icon="brain" href="/v2/configuration/models">
  Choose the right model for speed vs accuracy
</Card>
</CardGroup>

================================================
FILE: packages/docs/v2/best-practices/usecase-observe.mdx
================================================
---
sidebarTitle: Use Cases
---

## Real-World Use Cases

### E-commerce Product Discovery

```typescript
// Discover product interaction elements
const productActions = await page.observe({
  instruction: "Find add to cart buttons, size selectors, and product images"
});

// Categorize actions by type
const cartButtons = productActions.filter(a => 
  a.description.toLowerCase().includes('cart')
);
const sizeOptions = productActions.filter(a => 
  a.description.toLowerCase().includes('size')
);

// Execute purchase workflow
if (sizeOptions.length > 0) {
  await page.act(sizeOptions[0]); // Select size first
}
if (cartButtons.length > 0) {
  await page.act(cartButtons[0]); // Then add to cart
}
```

### Form Handling & Validation

```typescript
// Analyze form structure before filling
const formElements = await page.observe({
  instruction: "Find form fields, validation messages, and submit buttons"
});

// Check for required fields
const requiredFields = formElements.filter(e => 
  e.description.includes('required') || e.description.includes('*')
);

console.log(`Found ${requiredFields.length} required fields to complete`);

// Fill form systematically
for (const field of requiredFields) {
  await page.act(field);
  // Add appropriate input based on field type
}
```

### Dynamic Content & SPA Navigation

```typescript
// Wait for and discover dynamically loaded content
await page.waitForLoadState('networkidle');

const dynamicElements = await page.observe({
  instruction: "Find newly loaded content, infinite scroll triggers, or loading indicators",
  domSettleTimeoutMs: 15000 // Wait longer for dynamic content
});

// Handle infinite scroll
const scrollTriggers = dynamicElements.filter(e => 
  e.description.toLowerCase().includes('load more') ||
  e.description.toLowerCase().includes('scroll')
);

if (scrollTriggers.length > 0) {
  await page.act(scrollTriggers[0]);
  // Recursively observe new content
  const newContent = await page.observe("Find additional items");
}
```

### Multi-Step Workflow Planning

```typescript
// Plan entire checkout flow upfront
async function planCheckoutWorkflow() {
  // Step 1: Cart page analysis
  await page.goto('/cart');
  const cartActions = await page.observe("Find checkout and cart modification options");
  
  // Step 2: Checkout page analysis  
  const checkoutButton = cartActions.find(a => a.description.includes('checkout'));
  if (checkoutButton) await page.act(checkoutButton);
  
  const checkoutActions = await page.observe("Find payment forms and shipping options");
  
  // Step 3: Plan execution order
  const shippingFields = checkoutActions.filter(a => a.description.includes('shipping'));
  const paymentFields = checkoutActions.filter(a => a.description.includes('payment'));
  const submitButton = checkoutActions.find(a => a.description.includes('complete order'));
  
  return { shippingFields, paymentFields, submitButton };
}

// Execute planned workflow
const workflow = await planCheckoutWorkflow();
// Fill shipping → payment → submit
```


================================================
FILE: packages/docs/v2/best-practices/user-data.mdx
================================================
---
title: User Data Directory
sidebarTitle: User Data
description: Persist browser data between sessions
---

### User Data Directory

Persist browser data between sessions using a custom user data directory:

<CodeGroup>
```typescript TypeScript
import { Stagehand } from "@browserbasehq/stagehand";

// For Browserbase sessions
const stagehand = new Stagehand({
  env: "BROWSERBASE",
  browserbaseSessionCreateParams: {
    userDataDir: "/path/to/user/data/directory",
  },
});

// For Local sessions
const localStagehand = new Stagehand({
  env: "LOCAL",
  localBrowserLaunchOptions: {
    userDataDir: "./browser-data",
  },
});

await stagehand.init();
console.log("Session ID:", stagehand.sessionId);
```
```python Python
from stagehand import Stagehand

# For Browserbase sessions
stagehand = Stagehand(
    env="BROWSERBASE",
    browserbase_session_create_params={
        "user_data_dir": "/path/to/user/data/directory",
    },
)

# For Local sessions
local_stagehand = Stagehand(
    env="LOCAL",
    local_browser_launch_options={
        "user_data_dir": "./browser-data",
    },
)

await stagehand.init()
print(f"Session ID: {stagehand.session_id}")
```
</CodeGroup>

================================================
FILE: packages/docs/v2/best-practices/using-multiple-tabs.mdx
================================================
---
title: 'Using Multiple Tabs'
description: 'Act on multiple tabs with Stagehand'
---

Many modern web applications open new tabs when users click certain buttons or links. Without proper multitab support, automation scripts break when expected content appears in a new tab rather than the current one. Stagehand's multitab capabilities ensure your automations work seamlessly across multitab workflows.

## The Stagehand Page

Stagehand automatically adapts to multitab workflows. The `stagehand.page` object always points to the most recently opened or active tab, ensuring your automations continue working even when new tabs are created.

This means you can continue using familiar patterns:

<CodeGroup>
```typescript TypeScript
const page = stagehand.page;
await page.goto("https://example.com");
await page.act("click the button that opens a new tab");
// page now automatically points to the new tab
await page.extract("get data from new tab");
```

```python Python
page = stagehand.page
await page.goto("https://example.com")
await page.act("click the button that opens a new tab")
# page now automatically points to the new tab
await page.extract("get data from new tab")
```
</CodeGroup>

<Warning>
**Important**: [Stagehand Agent](/v2/basics/agent) will always operate on the `stagehand.page`. If you need an agent to work across specific tabs, you'll need to manage page switching manually.
</Warning>

## Manual Page Management

For more control over multitab workflows, you can manage multiple tabs explicitly:

<CodeGroup>
```typescript TypeScript
// Create a second page
await stagehand.context.newPage();
const pages = stagehand.context.pages();

const githubPage = pages[0];
const pythonPage = pages[1];

// Navigate each page to different repositories
await githubPage.goto("https://github.com/browserbase/stagehand");
await pythonPage.goto("https://github.com/browserbase/stagehand-python");

// Extract data from both pages simultaneously
const [stagehandStars, stagehandPythonStars] = await Promise.all([
  githubPage.extract("extract the repository stars"),
  pythonPage.extract("extract the repository stars")
]);

console.log(`Stagehand stars: ${stagehandStars}`);
console.log(`Stagehand-Python stars: ${stagehandPythonStars}`);
```

```python Python
# Create a second page
await stagehand.context.new_page()
pages = stagehand.context.pages()

github_page = pages[0]
python_page = pages[1]

# Navigate each page to different repositories  
await github_page.goto("https://github.com/browserbase/stagehand")
await python_page.goto("https://github.com/browserbase/stagehand-python")

# Extract data from both pages
stagehand_stars = await github_page.extract("extract the repository stars")
stagehand_python_stars = await python_page.extract("extract the repository stars")

print(f"Stagehand stars: {stagehand_stars}")
print(f"Stagehand-Python stars: {stagehand_python_stars}")
```
</CodeGroup>

## Handling Tab Events

You can also listen for tab events to control what happens when new tabs are opened:

<CodeGroup>
```typescript TypeScript
const page = stagehand.page;
await page.goto("https://browserbase.github.io/stagehand-eval-sites/sites/five-tab/");

// close the new tab after it's opened
page.on("popup", async () => {
  const newPage = stagehand.context.pages()[1];
  await newPage.close();
});

await page.act("click the button to open the other page");

const page_number = await page.extract("extract the page number");
console.log(`You're on page ${page_number.extraction}`);
```

```python Python
page = stagehand.page
await page.goto("https://browserbase.github.io/stagehand-eval-sites/sites/five-tab/")

# Close the new tab after it's opened
async def handle_popup(popup):
    new_page = stagehand.context.pages()[1]
    await new_page.close()

page.on("popup", handle_popup)

await page.act("click the button to open the other page")

page_number = await page.extract("extract the page number")
print(f"You're on page {page_number}")
```
</CodeGroup>

## Next Steps

<CardGroup cols={2}>
  <Card title="Orchestrate complex workflows with Agent" icon="robot" iconType="sharp-solid" href="/v2/basics/agent">
    Use `Agent` to autonomously execute multi-step tasks and complex workflows.
  </Card>

  <Card title="Working with iframes" icon="frame" iconType="sharp-solid" href="/v2/best-practices/working-with-iframes">
    Learn best practices for interacting with elements inside iframes.
  </Card>

  <Card title="Browser Configuration" icon="browser" iconType="sharp-solid" href="/v2/configuration/browser">
    Manage browser contexts and sessions for complex automation scenarios.
  </Card>

  <Card title="Logging & Debugging" icon="bug" iconType="sharp-solid" href="/v2/configuration/logging">
    Handle errors gracefully and debug automation issues effectively.
  </Card>
</CardGroup>

================================================
FILE: packages/docs/v2/best-practices/working-with-iframes.mdx
================================================
---
title: Working with iframes
---

### What is an iframe?

Iframes embed other pages within your current page. Sites use them for consent banners, payment widgets, chat bubbles, and third-party content.
Elements inside iframes exist in a separate context from the main page.

### Enable iframe support

Set `iframes: true` in your `act()`, `observe()`, and `extract()` commands.

<CodeGroup>
```typescript TypeScript
// Act within iframes
await page.act({ action: "click the accept cookies button", iframes: true });

// Observe within iframes
const results = await page.observe({
  instruction: "Find the primary action button",
  iframes: true,
});

// Extract from iframes
const data = await page.extract({
  instruction: "Extract the product price from the payment widget",
  schema: z.object({
    price: z.string(),
  }),
  iframes: true,
});
```

```python Python
# Act within iframes
await page.act(
    "click the accept cookies button",
    iframes=True
)

# Observe within iframes
results = await page.observe({
    "instruction": "Find the primary action button",
    "iframes": True,
})

# Extract from iframes
data = await page.extract({
    "instruction": "Extract the product price from the payment widget",
    "schema": {
        "type": "object",
        "properties": {
            "price": {"type": "string"}
        }
    },
    "iframes": True,
})
```
</CodeGroup>

### Tips

- Iframes can increase processing time. For best performance, use the iframe option only when necessary.
- When you are unsure whether an element will be in an iframe, you can verify the presence of iframes in Stagehand logs.
- If an element intermittently fails to be found, it may be inside a lazy‑loaded iframe. Add small waits between steps or re‑run your action.

<Note>
You can enable experimental features (like Shadow DOM support) via your Stagehand configuration. See the [configuration guide](/v2/configuration/browser).
</Note>

## Next steps

<CardGroup cols={2}>
  <Card title="Analyze pages with observe()" icon="magnifying-glass" iconType="sharp-solid" href="/v2/basics/observe">
    Use `observe()` to plan precise, single-step actions before executing them.
  </Card>

  <Card title="Extract data with extract()" icon="table" iconType="sharp-solid" href="/v2/basics/extract">
    Use `extract()` with a data schema to pull clean, typed data from any page.
  </Card>

  <Card title="Caching actions" icon="bolt" iconType="sharp-solid" href="/v2/best-practices/caching">
    Speed up repeated automations by caching actions.
  </Card>

  <Card title="Act fundamentals" icon="arrow-pointer" iconType="sharp-solid" href="/v2/basics/act">
    Learn how to perform single-step actions reliably with `act()`.
  </Card>
</CardGroup>

================================================
FILE: packages/docs/v2/configuration/browser.mdx
================================================
---
title: Browser
sidebarTitle: Browser
description: Configure Stagehand on Browserbase or locally
---

Stagehand supports two primary environments:

- **Browserbase** - Cloud-managed browser infrastructure optimized for production web automation at scale
- **Local** - Run browsers directly on your machine for development and debugging

## Browserbase Environment

Browserbase provides managed cloud browser infrastructure optimized for web automation at scale. It offers advanced features like stealth mode, proxy support, and persistent contexts.

<Card icon="cloud" title="Browserbase" href="https://docs.browserbase.com" description="Explore the features and benefits of using Browserbase for scalable web automation.">
  Discover the power of cloud-managed browser infrastructure with Browserbase.
</Card>

### Environment Variables

Before getting started, set up the required environment variables:

<CodeGroup>
```bash .env
BROWSERBASE_API_KEY=your_api_key_here
BROWSERBASE_PROJECT_ID=your_project_id_here
```
</CodeGroup>

<Tip>
Get your API key and Project ID from the [Browserbase Dashboard](https://browserbase.com/overview)
</Tip>

### Using Stagehand with Browserbase

#### Basic Setup

The simplest way to get started is with default settings:

<CodeGroup>
```typescript TypeScript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "BROWSERBASE",
});

await stagehand.init();
```
```python Python
import os
from stagehand import Stagehand

stagehand = Stagehand(
    env="BROWSERBASE",
)

await stagehand.init()
```
</CodeGroup>

#### Advanced Configuration

Configure browser settings, proxy support, and other session parameters:
<CodeGroup>
```typescript TypeScript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "BROWSERBASE",
  // Optional: API Key and Project ID will be pulled directly from your environment
  apiKey: process.env.BROWSERBASE_API_KEY,
  projectId: process.env.BROWSERBASE_PROJECT_ID,
  browserbaseSessionCreateParams: {
    proxies: true,
    region: "us-west-2",
    browserSettings: {
      viewport: { width: 1920, height: 1080 },
      blockAds: true,
    },
  },
});

await stagehand.init();
console.log("Session ID:", stagehand.sessionId);
```
```python Python
import os
from stagehand import Stagehand

stagehand = Stagehand(
    env="BROWSERBASE",
    # Optional: API Key and Project ID will be pulled directly from your environment
    api_key=os.getenv("BROWSERBASE_API_KEY"),
    project_id=os.getenv("BROWSERBASE_PROJECT_ID"),
    browserbase_session_create_params={
        "proxies": True,
        "region": "us-west-2",
        "browser_settings": {
            "viewport": {"width": 1920, "height": 1080},
            "block_ads": True,
        },
    },
)
```
</CodeGroup>

<Accordion title="Advanced Browserbase Configuration Example">
    <CodeGroup>
    ```typescript TypeScript
    const stagehand = new Stagehand({
      env: "BROWSERBASE",
      apiKey: process.env.BROWSERBASE_API_KEY,
      projectId: process.env.BROWSERBASE_PROJECT_ID,
      browserbaseSessionCreateParams: {
        projectId: process.env.BROWSERBASE_PROJECT_ID!,
        proxies: true,
        region: "us-west-2",
        timeout: 3600, // 1 hour session timeout
        keepAlive: true, // Available on Startup plan
        browserSettings: {
          advancedStealth: false, // this is a Scale Plan feature - reach out to support@browserbase.com to enable
          blockAds: true,
          solveCaptchas: true,
          recordSession: false,
          viewport: {
            width: 1920,
            height: 1080,
          },
          fingerprint: {
            browsers: ["chrome", "edge"],
            devices: ["desktop"],
            operatingSystems: ["windows", "macos"],
            locales: ["en-US", "en-GB"],
            httpVersion: 2,
          },
        },
        userMetadata: {
          userId: "automation-user-123",
          environment: "production",
        },
      },
    });
    ```
    ```python Python
    stagehand = Stagehand(
        env="BROWSERBASE",
        api_key=os.getenv("BROWSERBASE_API_KEY"),
        project_id=os.getenv("BROWSERBASE_PROJECT_ID"),
        browserbase_session_create_params={
            "project_id": os.getenv("BROWSERBASE_PROJECT_ID"),
            "proxies": True,
            "region": "us-west-2",
            "timeout": 3600,  # 1 hour session timeout
            "keep_alive": True,  # Available on Startup plan
            "browser_settings": {
                "advanced_stealth": False,  # this is a Scale Plan feature - reach out to support@browserbase.com to enable
                "block_ads": True,
                "solve_captchas": True,
                "record_session": False,
                "viewport": {
                    "width": 1920,
                    "height": 1080,
                },
                "fingerprint": {
                    "browsers": ["chrome", "edge"],
                    "devices": ["desktop"],
                    "operating_systems": ["windows", "macos"],
                    "locales": ["en-US", "en-GB"],
                    "http_version": 2,
                },
            },
            "user_metadata": {
                "user_id": "automation-user-123",
                "environment": "production",
            },
        },
    )
    ```
</CodeGroup>
</Accordion>

#### Initialization Result
`stagehand.init()` returns configuration information about the initialized session:

<CodeGroup>
```typescript TypeScript
const result = await stagehand.init();
console.log(result);
```
```python Python
result = await stagehand.init()
print(result)
```
</CodeGroup>

The returned object contains:
```Example
{
  debugUrl: 'https://www.browserbase.com/devtools/inspector.html?wss=connect.browserbase.com/debug/f8a21b4a-6fa1-4ab9-9007-fbfe61dc14f0/devtools/page/5474B0E0510C5B6E629BEB06E799CD70?debug=true',
  sessionUrl: 'https://www.browserbase.com/sessions/f8a21b4a-6fa1-4ab9-9007-fbfe61dc14f0',
  sessionId: 'f8a21b4a-6fa1-4ab9-9007-fbfe61dc14f0'
}
```

<AccordionGroup>
<Accordion title="debugUrl">
**Open the Browserbase [session live view](https://docs.browserbase.com/features/session-live-view)** to include a human-in-the-loop.
</Accordion>

<Accordion title="sessionUrl">
**Open the [session replay](https://docs.browserbase.com/features/session-replay)** to see the full session recording. 
</Accordion>

<Accordion title="sessionId">
**Unique identifier** for the [Browserbase session](https://docs.browserbase.com/introduction/what-is-browserbase). This is used to identify the session in the Browserbase dashboard and to connect to the session.
</Accordion>
</AccordionGroup>

### Alternative: Browserbase SDK

If you prefer to manage sessions directly, you can use the Browserbase SDK:

<CodeGroup>
```typescript TypeScript
import { Browserbase } from "@browserbasehq/sdk";

const bb = new Browserbase({ 
  apiKey: process.env.BROWSERBASE_API_KEY! 
});

const session = await bb.sessions.create({
  projectId: process.env.BROWSERBASE_PROJECT_ID!,
  // Add configuration options here
});
```
```python Python
from browserbase import Browserbase

bb = Browserbase(api_key=os.environ["BROWSERBASE_API_KEY"])

session = bb.sessions.create(
    project_id=os.environ["BROWSERBASE_PROJECT_ID"],
    # Add configuration options here
)
```
</CodeGroup>

#### Connecting to an Existing Session

Connect to a previously created Browserbase session using its session ID:

<CodeGroup>
```typescript TypeScript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "BROWSERBASE",
  browserbaseSessionID: "existing-session-uuid-here",
});

await stagehand.init();
console.log("Resumed Session ID:", stagehand.sessionId);
```
```python Python
import os
from stagehand import Stagehand

stagehand = Stagehand(
    env="BROWSERBASE",
    browserbase_session_id="existing-session-uuid-here",
)

await stagehand.init()
print(f"Resumed Session ID: {stagehand.session_id}")
```
</CodeGroup>

## Local Environment

The local environment runs browsers directly on your machine, providing full control over browser instances and configurations. Ideal for development, debugging, and scenarios requiring custom browser setups.

### Environment Comparison

| Feature | Browserbase | Local |
| --- | --- | --- |
| **Scalability** | High (cloud-managed) | Limited (local resources) |
| **Stealth Features** | Advanced fingerprinting | Basic stealth |
| **Proxy Support** | Built-in residential proxies | Manual configuration |
| **Session Persistence** | Cloud context storage | File-based user data |
| **Geographic Distribution** | Multi-region deployment | Single machine |
| **Debugging** | Session recordings & logs | Direct DevTools access |
| **Setup Complexity** | Environment variables only | Browser installation required |
| **Cost** | Usage-based pricing | Infrastructure & maintenance |
| **Best For** | Production, scale, compliance | Development, debugging |

### Basic Local Setup

<CodeGroup>
```typescript TypeScript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "LOCAL"
});
  
await stagehand.init();
console.log("Session ID:", stagehand.sessionId);
```
```python Python
from stagehand import Stagehand

stagehand = Stagehand(
    env="LOCAL"
)

await stagehand.init()
print(f"Session ID: {stagehand.session_id}")
```
</CodeGroup>

### Advanced Local Configuration

Customize browser launch options for local development:

<CodeGroup>
```typescript TypeScript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "LOCAL",
  localBrowserLaunchOptions: {
    headless: false, // Show browser window
    devtools: true, // Open developer tools
    viewport: { width: 1280, height: 720 },
    executablePath: '/opt/google/chrome/chrome', // Custom Chrome path
    args: [
      '--no-sandbox',
      '--disable-setuid-sandbox',
      '--disable-web-security',
      '--allow-running-insecure-content',
    ],
    env: {
      NODE_ENV: "development",
      DEBUG: "true",
    },
  },
});

await stagehand.init();
```
```python Python
from stagehand import Stagehand

stagehand = Stagehand(
    env="LOCAL",
    headless=False,  # Show browser window
    local_browser_launch_options={
        "devtools": True,  # Open developer tools
        "viewport": {"width": 1280, "height": 720},
        "executable_path": "/opt/google/chrome/chrome",  # Custom Chrome path
        "args": [
            "--no-sandbox",
            "--disable-setuid-sandbox",
            "--disable-web-security",
            "--allow-running-insecure-content",
        ],
        "env": {
            "NODE_ENV": "development",
            "DEBUG": "true",
        },
    },
)

await stagehand.init()
```
</CodeGroup>

### Connecting to your local browser

Connect to your existing local Chrome/Chromium browser instead of launching a new one. This lets you automate your normal browser with all your existing tabs, extensions and settings.

<CodeGroup>
```typescript TypeScript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
	env: "LOCAL",
	localBrowserLaunchOptions: {
		cdpUrl: 'http://localhost:9222'
	}
});

await stagehand.init();
```
```python Python
from stagehand import Stagehand

stagehand = Stagehand(
    env="LOCAL",
    local_browser_launch_options={
      "cdp_url": "http://localhost:9222"
    }
)

await stagehand.init()
```
</CodeGroup>

## Troubleshooting

### Common Issues

<AccordionGroup>
<Accordion title="Browserbase Authentication Errors">
- Verify your `BROWSERBASE_API_KEY` and `BROWSERBASE_PROJECT_ID` are set correctly
- Check that your API key has the necessary permissions
- Ensure your Browserbase account has sufficient credits
</Accordion>

<Accordion title="Local Browser Launch Failures">
- Install Chrome or Chromium on your system
- Set the correct `executablePath` for your Chrome installation
- Check that required dependencies are installed (Linux: `libnss3-dev libatk-bridge2.0-dev libgtk-3-dev libxss1 libasound2`)
</Accordion>

<Accordion title="Session Timeout Issues">
- Increase session timeout in `browserbaseSessionCreateParams.timeout`
- Use `keepAlive: true` for long-running sessions
- Monitor session usage to avoid unexpected terminations
</Accordion>
</AccordionGroup>

================================================
FILE: packages/docs/v2/configuration/evals.mdx
================================================
---
title: Evaluations & Metrics
sidebarTitle: Evaluations
description: Monitor performance, optimize costs, and evaluate LLM effectiveness
---

Evaluations help you understand how well your automation performs, which models work best for your use cases, and how to optimize for cost and reliability. This guide covers both monitoring your own workflows and running comprehensive evaluations.

## Why Evaluations Matter

- **Performance Optimization**: Identify which models and settings work best for your specific automation tasks
- **Cost Control**: Track token usage and inference time to optimize spending
- **Reliability**: Measure success rates and identify failure patterns
- **Model Selection**: Compare different LLMs on real-world tasks to make informed decisions

<Card
  title="Live Model Comparisons"
  icon="scale-balanced"
  href="https://www.stagehand.dev/evals"
>
  View real-time performance comparisons across different LLMs on the [Stagehand Evals Dashboard](https://www.stagehand.dev/evals)
</Card>

## Comprehensive Evaluations

Evaluations help you systematically test and improve your automation workflows. Stagehand provides both built-in evaluations and tools to create your own.

There are two types of evals:
1. **Deterministic Evals** - These include unit tests, integration tests, and E2E tests that can be run without any LLM inference.
2. **LLM-based Evals** - These are evals that test the underlying functionality of Stagehand's AI primitives.


### Evals CLI
![Evals CLI](/media/evals-cli.png)

<Tip>
To run evals, you'll need to clone the [Stagehand repo](https://github.com/browserbase/stagehand) and set up the CLI.

We recommend using [Braintrust](https://www.braintrust.dev/docs/) to help visualize eval results and metrics.
</Tip>

The Stagehand CLI provides a powerful interface for running evaluations. You can run specific evals, categories, or external benchmarks with customizable settings.

Evals are grouped into:
1. **Act Evals** - These are evals that test the functionality of the `act` method.
2. **Extract Evals** - These are evals that test the functionality of the `extract` method.
3. **Observe Evals** - These are evals that test the functionality of the `observe` method.
4. **Combination Evals** - These are evals that test the functionality of the `act`, `extract`, and `observe` methods together.
5. **Experimental Evals** - These are experimental custom evals that test the functionality of the Stagehand primitives.
6. **Agent Evals** - These are evals that test the functionality of `agent`.
7. **(NEW) External Benchmarks** - Run external benchmarks like WebBench, GAIA, WebVoyager, OnlineMind2Web, and OSWorld.

#### Installation

<Steps> 
<Step title="Install Dependencies">
```bash
# From the stagehand root directory
pnpm install
```
</Step>

<Step title="Build the CLI">
```bash
pnpm run build:cli
```
</Step>

<Step title="Verify Installation">
```bash
evals help
```
</Step>
</Steps>

#### CLI Commands and Options

##### Basic Commands

```bash
# Run all evals
evals run all

# Run specific category
evals run act
evals run extract
evals run observe
evals run agent

# Run specific eval
evals run extract/extract_text

# List available evals
evals list
evals list --detailed

# Configure defaults
evals config
evals config set env browserbase
evals config set trials 5
```

##### Command Options

- **`-e, --env`**: Environment (`local` or `browserbase`)
- **`-t, --trials`**: Number of trials per eval (default: 3)
- **`-c, --concurrency`**: Max parallel sessions (default: 10)
- **`-m, --model`**: Model override
- **`-p, --provider`**: Provider override
- **`--api`**: Use Stagehand API instead of SDK

##### Running External Benchmarks

The CLI supports several industry-standard benchmarks:

```bash
# WebBench with filters
evals run benchmark:webbench -l 10 -f difficulty=easy -f category=READ

# GAIA benchmark
evals run b:gaia -s 100 -l 25 -f level=1

# WebVoyager
evals run b:webvoyager -l 50

# OnlineMind2Web
evals run b:onlineMind2Web

# OSWorld
evals run b:osworld -f source=Mind2Web
```

#### Configuration Files

You can view the specific evals in [`evals/tasks`](https://github.com/browserbase/stagehand/tree/v2/evals/tasks). Each eval is grouped into eval categories based on [`evals/evals.config.json`](https://github.com/browserbase/stagehand/blob/main/evals/evals.config.json).


#### Viewing eval results
![Eval results](/images/evals.png)

Eval results are viewable on Braintrust. You can view the results of a specific eval by going to the Braintrust URL specified in the terminal when you run `npm run evals`.

By default, each eval will run five times per model. The "Exact Match" column shows the percentage of times the eval was correct. The "Error Rate" column shows the percentage of times the eval errored out.

You can use the Braintrust UI to filter by model/eval and aggregate results across all evals.

### Deterministic Evals

To run deterministic evals, you can run `npm run e2e` from within the Stagehand repo. This will test the functionality of Playwright within Stagehand to make sure it's working as expected.

These tests are in [`evals/deterministic`](https://github.com/browserbase/stagehand/tree/v2/evals/deterministic) and test on both Browserbase browsers and local headless Chromium browsers.

## Creating Custom Evaluations

### Step-by-Step Guide

<Steps>
<Step title="Create Evaluation File">
Create a new file in `evals/tasks/your-eval.ts`:

```typescript
import { EvalTask } from '../types';

export const customEvalTask: EvalTask = {
  name: 'custom_task_name',
  description: 'Test specific automation workflow',
  
  // Test setup
  setup: async ({ page }) => {
    await page.goto('https://example.com');
  },
  
  // The actual test
  task: async ({ stagehand, page }) => {
    // Your automation logic
    await page.act({ action: 'click the login button' });
    const result = await page.extract({ 
      instruction: 'Get the user name',
      schema: { username: 'string' }
    });
    return result;
  },
  
  // Validation
  validate: (result, expected) => {
    return result.username === expected.username;
  },
  
  // Test cases
  testCases: [
    {
      input: { /* test input */ },
      expected: { username: 'john_doe' }
    }
  ],
  
  // Evaluation criteria
  scoring: {
    exactMatch: true,
    timeout: 30000,
    retries: 2
  }
};
```
</Step>

<Step title="Add to Configuration">
Update `evals/evals.config.json`:

```json
{
  "categories": {
    "custom": ["custom_task_name"],
    "existing_category": ["custom_task_name"]
  }
}
```
</Step>

<Step title="Run Your Evaluation">
```bash
# Test your custom evaluation
evals run custom_task_name

# Run the entire custom category
evals run custom

# Run with specific settings
evals run custom_task_name -e browserbase -t 5 -m gpt-4o
```
</Step>
</Steps>


## Best Practices for Custom Evals

<AccordionGroup>
<Accordion title="Test Design Principles">
- **Atomic**: Each test should validate one specific capability
- **Deterministic**: Tests should produce consistent results
- **Realistic**: Use real-world scenarios and websites
- **Measurable**: Define clear success/failure criteria
</Accordion>

<Accordion title="Performance Optimization">
- **Parallel Execution**: Design tests to run independently
- **Resource Management**: Clean up after each test
- **Timeout Handling**: Set appropriate timeouts for operations
- **Error Recovery**: Handle failures gracefully
</Accordion>

<Accordion title="Data Quality">
- **Ground Truth**: Establish reliable expected outcomes
- **Edge Cases**: Test boundary conditions and error scenarios
- **Statistical Significance**: Run multiple iterations for reliability
- **Version Control**: Track changes to test cases over time
</Accordion>
</AccordionGroup>

### Troubleshooting Evaluations
<AccordionGroup>
<Accordion title="Evaluation Timeouts">
**Symptoms**: Tests fail with timeout errors

**Solutions**:
- Increase timeout in `taskConfig.ts`
- Use faster models (Gemini 2.5 Flash, GPT-4o Mini)
- Optimize test scenarios to be less complex
- Check network connectivity to LLM providers
</Accordion>

<Accordion title="Inconsistent Results">
**Symptoms**: Same test passes/fails randomly

**Solutions**:
- Set temperature to 0 for deterministic outputs
- Increase repetitions for statistical significance
- Use more capable models for complex tasks
- Check for dynamic website content affecting tests
</Accordion>

<Accordion title="High Evaluation Costs">
**Symptoms**: Token usage exceeding budget

**Solutions**:
- Use cost-effective models (Gemini 2.0 Flash, GPT-4o Mini)
- Reduce repetitions for initial testing
- Focus on specific evaluation categories
- Use local browser environment to reduce Browserbase costs
</Accordion>

<Accordion title="Braintrust Integration Issues">
**Symptoms**: Results not uploading to dashboard

**Solutions**:
- Check Braintrust API key configuration
- Verify internet connectivity
- Update Braintrust SDK to latest version
- Check project permissions in Braintrust dashboard
</Accordion>
</AccordionGroup>

================================================
FILE: packages/docs/v2/configuration/logging.mdx
================================================
---
title: Logging & Debugging
sidebarTitle: Logging
description: Set up logging, debugging, and error tracking for Stagehand workflows
---

Stagehand provides comprehensive logging capabilities to help you debug automation workflows, track execution, and diagnose issues. Configure logging levels, structured output, and debugging tools for both development and production environments.

## Logging Configuration

<CodeGroup>
```typescript TypeScript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "BROWSERBASE", // or "LOCAL"
  verbose: 1, // 0 = errors only, 1 = info, 2 = debug
});
```

```python Python
from stagehand import Stagehand

stagehand = Stagehand(
    env="BROWSERBASE",  # or "LOCAL"
    verbose=1,  # 0 = errors only, 1 = info, 2 = debug
)
```
</CodeGroup>

### Verbose Levels

- **Level 0**: Errors only - minimal output for production
- **Level 1**: Info - includes successful operations and important events
- **Level 2**: Debug - comprehensive logging including internal operations

## Structured Logging

### Log Line Format

Each log entry contains structured information:

<CodeGroup>
```typescript TypeScript
interface LogLine {
  category: 'browser' | 'action' | 'llm' | 'error' | 'stagehand' | 'cache';
  message: string;
  level: 0 | 1 | 2; // error | info | debug
  timestamp: string;
  auxiliary?: {
    executionTime?: { value: string; unit: string };
    sessionId?: string;
    url?: string;
    [key: string]: any;
  };
}
```

```python Python
# Log line structure in Python
{
  "category": "browser" | "action" | "llm" | "error" | "stagehand" | "cache",
  "message": str,
  "level": 0 | 1 | 2,  # error | info | debug
  "timestamp": str,
  "auxiliary": {
    "execution_time": {"value": str, "unit": str},
    "session_id": str,
    "url": str,
    # ... other context data
  }
}
```
</CodeGroup>

### Custom Logger

<CodeGroup>
```typescript TypeScript
class AdvancedLogger {
  private logFile?: string;
  
  constructor(logFile?: string) {
    this.logFile = logFile;
  }
  
  log = (logLine: any) => {
    const timestamp = new Date().toISOString();
    const colors = {
      browser: '\x1b[34m', // blue
      action: '\x1b[32m',  // green
      llm: '\x1b[35m',     // magenta
      error: '\x1b[31m',   // red
      stagehand: '\x1b[36m', // cyan
      cache: '\x1b[33m',   // yellow
    };
    
    const color = colors[logLine.category] || '\x1b[0m';
    const reset = '\x1b[0m';
    
    // Console output with colors
    console.log(`${color}[${logLine.category}]${reset} ${logLine.message}`);
    
    // Log execution time if available
    if (logLine.auxiliary?.executionTime) {
      console.log(` ${logLine.auxiliary.executionTime.value}${logLine.auxiliary.executionTime.unit}`);
    }
    
    // Log additional context
    if (logLine.auxiliary && Object.keys(logLine.auxiliary).length > 0) {
      console.log('  Context:', JSON.stringify(logLine.auxiliary, null, 2));
    }
    
    // File logging (optional)
    if (this.logFile) {
      const logEntry = {
        timestamp,
        ...logLine
      };
      require('fs').appendFileSync(this.logFile, JSON.stringify(logEntry) + '\n');
    }
  }
}

// Usage
const logger = new AdvancedLogger('./automation.log');
const stagehand = new Stagehand({
  env: "BROWSERBASE",
  verbose: 2,
  logger: logger.log
});
```

```python Python
import json
import os
from datetime import datetime
from typing import Dict, Any, Optional

class AdvancedLogger:
    def __init__(self, log_file: Optional[str] = None):
        self.log_file = log_file
    
    def log(self, log_line: Dict[str, Any]):
        timestamp = datetime.now().isoformat()
        colors = {
            'browser': '\033[34m',   # blue
            'action': '\033[32m',    # green
            'llm': '\033[35m',       # magenta
            'error': '\033[31m',     # red
            'stagehand': '\033[36m', # cyan
            'cache': '\033[33m',     # yellow
        }
        
        color = colors.get(log_line.get('category', ''), '\033[0m')
        reset = '\033[0m'
        
        # Console output with colors
        print(f"{color}[{log_line.get('category')}]{reset} {log_line.get('message')}")
        
        # Log execution time if available
        if log_line.get('auxiliary', {}).get('execution_time'):
            exec_time = log_line['auxiliary']['execution_time']
            print(f"{exec_time['value']}{exec_time['unit']}")
        
        # Log additional context
        auxiliary = log_line.get('auxiliary', {})
        if auxiliary and len(auxiliary) > 0:
            print('  Context:', json.dumps(auxiliary, indent=2))
        
        # File logging (optional)
        if self.log_file:
            log_entry = {
                'timestamp': timestamp,
                **log_line
            }
            with open(self.log_file, 'a') as f:
                f.write(json.dumps(log_entry) + '\n')

# Usage
logger = AdvancedLogger('./automation.log')
stagehand = Stagehand(
    env="BROWSERBASE",
    verbose=2,
    logger=logger.log
)
```
</CodeGroup>

## Detailed Logging Features

### LLM Inference Logging

Enable detailed logging of all LLM interactions:

<CodeGroup>
```typescript TypeScript
const stagehand = new Stagehand({
  env: "BROWSERBASE",
  logInferenceToFile: true,  // Creates inference_summary/ directory
  verbose: 2
});
```

```python Python
stagehand = Stagehand(
    env="BROWSERBASE",
    log_inference_to_file=True,  # Creates inference_summary/ directory
    verbose=2
)
```
</CodeGroup>

The `inference_summary/` directory structure:
```
inference_summary/                   
├── act_summary/            
│   ├── 20240329_080446068.json    
│   ├── 20240329_080447019.json   
│   └── act_summary.json          
├── extract_summary/               
│   ├── 20240329_081205123.json    
│   └── extract_summary.json       
└── observe_summary/                
    ├── 20240329_081634891.json    
    └── observe_summary.json       
```

## Log Analysis & Debugging

### Common Log Patterns
<Tabs>
  <Tab title="Successful Action">
    ```json
    {
      "category": "action", 
      "message": "act completed successfully",
      "level": 1,
      "auxiliary": {
        "executionTime": {"value": "1250", "unit": "ms"},
        "url": "https://example.com",
        "sessionId": "session-123"
      }
    }
    ```
  </Tab>
  <Tab title="LLM Inference">
    ```json
    {
      "category": "llm",
      "message": "inference completed", 
      "level": 1,
      "auxiliary": {
        "model": "gpt-4o",
        "tokens": {"prompt": 3451, "completion": 45},
        "executionTime": {"value": "951", "unit": "ms"}
      }
    }
    ```
  </Tab>
  <Tab title="Error Example">
    ```json
    {
      "category": "action",
      "message": "action failed: element not found",
      "level": 0, 
      "auxiliary": {
        "selector": "button[data-testid='submit']",
        "url": "https://example.com/form",
        "sessionId": "session-123"
      }
    }
    ```
  </Tab>
</Tabs>

## Best Practices

<AccordionGroup>
<Accordion title="Development Environment">
- Use `verbose: 2` with visual debugging
- Enable browser DevTools for element inspection
- Use `logInferenceToFile: true` to capture LLM decisions
- Implement structured logging early
</Accordion>

<Accordion title="Production Environment">
- Use `verbose: 1` to balance visibility with performance
- Implement error tracking and alerting
- Use structured JSON logging
- Monitor session success rates and execution times
</Accordion>

<Accordion title="Security & Compliance">
- Never log credentials or sensitive data
- Implement log retention policies
- Secure log files and dashboards
</Accordion>
</AccordionGroup>

================================================
FILE: packages/docs/v2/configuration/models.mdx
================================================
---
title: Models
sidebarTitle: Models
description: Enhance Stagehand with LLMs for optimal performance, cost, and reliability
---

Stagehand uses Large Language Models (LLMs) to understand web pages, plan actions, and interact with complex interfaces. The choice of LLM significantly impacts your automation's accuracy, speed, and cost.

<Card title="Model Evaluation" href="https://www.stagehand.dev/evals" icon="paper-plane">
Find more details about how to choose the right model on our Model Evaluation page.
</Card>

## Why LLM Choice Matters

- **Accuracy**: Better models provide more reliable element detection and action planning
- **Speed**: Faster models reduce automation latency
- **Cost**: Different providers offer varying pricing structures
- **Reliability**: Structured output support ensures consistent automation behavior

<Tip>
Find more details about how to choose the right model on our [Model Evaluation](https://www.stagehand.dev/evals) page.
</Tip>

<Warning>
Small models on **Ollama** struggle with consistent structured outputs. While technically supported, we don't recommend them for production Stagehand workflows.
</Warning>

## Environment Variables Setup

Set up your API keys before configuring Stagehand:

<CodeGroup>
```bash .env
# Choose one or more providers
OPENAI_API_KEY=your_openai_key_here
ANTHROPIC_API_KEY=your_anthropic_key_here
GOOGLE_API_KEY=your_google_key_here
GROQ_API_KEY=your_groq_key_here
```
</CodeGroup>

## Supported Providers

Stagehand supports major LLM providers with structured output capabilities:

### Production-Ready Providers

| Provider | Best Models | Strengths | Use Case |
|----------|-------------|-----------|----------|
| **OpenAI** | `gpt-4.1`, `gpt-4.1-mini` | High accuracy, reliable | Production, complex sites |
| **Anthropic** | `claude-sonnet-4-6` | Excellent reasoning | Complex automation tasks |
| **Google** | `gemini-2.5-flash`, `gemini-2.5-pro` | Fast, cost-effective | High-volume automation |

### Additional Providers

<Expandable title="More Providers">
- **Groq** - `llama-3.3-70b-versatile` (Good for speed critical applications)
- **xAI** - `grok-beta` (Good for complex reasoning)
- **Azure** - Enterprise OpenAI deployment
- **Cerebras** - High-speed inference
- **TogetherAI** - Open-source models
- **Mistral** - `mixtral-8x7b-32768` (European option)
- **DeepSeek** - Cost-effective alternative
- **Perplexity** - Real-time web data
- **Ollama** - Local deployment (limited accuracy)
- **Run any model included in AI SDK** - Find supported models in the [Vercel AI SDK](https://sdk.vercel.ai/providers/ai-sdk-providers) (Follow the guide 
     [here](#vercel-ai-sdk) to get started.)
</Expandable>

## Basic Configuration

### Model Name Format

Stagehand uses the format `provider/model-name` for model specification.

**Examples:**
- OpenAI: `openai/gpt-4.1`
- Anthropic: `anthropic/claude-sonnet-4-6`
- Google: `google/gemini-2.5-flash` (Recommended)

### Quick Start Examples

<Tabs>
<Tab title="Google (Recommended)">
<CodeGroup>
```typescript TypeScript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  modelName: "google/gemini-2.5-flash",
  modelClientOptions: {
    apiKey: process.env.GOOGLE_API_KEY,
  },
});
```
```python Python
import os
from stagehand import Stagehand

stagehand = Stagehand(
    model_name="google/gemini-2.5-flash",
    model_api_key=os.getenv("GOOGLE_API_KEY")
)
```
</CodeGroup>
</Tab>
<Tab title="OpenAI">
<CodeGroup>
```typescript TypeScript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  modelName: "openai/gpt-4.1",
  modelClientOptions: {
    apiKey: process.env.OPENAI_API_KEY,
  },
});
```
```python Python
import os
from stagehand import Stagehand

stagehand = Stagehand(
    model_name="openai/gpt-4.1",
    model_api_key=os.getenv("OPENAI_API_KEY")
)
```
</CodeGroup>
</Tab>

<Tab title="Anthropic">
<CodeGroup>
```typescript TypeScript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  modelName: "anthropic/claude-sonnet-4-6",
  modelClientOptions: {
    apiKey: process.env.ANTHROPIC_API_KEY,
  },
});
```
```python Python
import os
from stagehand import Stagehand

stagehand = Stagehand(
    model_name="anthropic/claude-sonnet-4-6",
    model_api_key=os.getenv("ANTHROPIC_API_KEY")
)
```
</CodeGroup>
</Tab>
</Tabs>

## Custom LLM Integration

<Note>
Custom LLMs are currently only supported in TypeScript.
</Note>

Integrate any LLM with Stagehand using custom clients. The only requirement is **structured output support** for consistent automation behavior.

### Vercel AI SDK
The [Vercel AI SDK](https://sdk.vercel.ai/providers/ai-sdk-providers) is a popular library for interacting with LLMs. You can use any of the providers supported by the Vercel AI SDK to create a client for your model, **as long as they support structured outputs**.

Vercel AI SDK supports providers for OpenAI, Anthropic, and Google, along with support for **Amazon Bedrock** and **Azure OpenAI**.

To get started, you'll need to install the `ai` package and the provider you want to use. For example, to use Amazon Bedrock, you'll need to install the `@ai-sdk/amazon-bedrock` package.

You'll also need to use the [Vercel AI SDK external client](https://github.com/browserbase/stagehand/blob/v2/examples/external_clients/aisdk.ts) as a template to create a client for your model.

<Tabs>
	<Tab title="npm">
	```bash
	npm install ai @ai-sdk/amazon-bedrock
	```
	</Tab>

	<Tab title="pnpm">
	```bash
	pnpm install ai @ai-sdk/amazon-bedrock
	```
	</Tab>

	<Tab title="yarn">
	```bash
	yarn add ai @ai-sdk/amazon-bedrock
	```
	</Tab>
</Tabs>

With the packages installed, use the [Vercel AI SDK external client](https://github.com/browserbase/stagehand/blob/84f810b4631291307a32a47addad7e26e9c1deb3/examples/external_clients/aisdk.ts) as a template to create a client for your model:

```ts
// Install/import the provider you want to use.
// For example, to use OpenAI, import `openai` from @ai-sdk/openai
import { bedrock } from "@ai-sdk/amazon-bedrock";
import { AISdkClient } from "./external_clients/aisdk";

const stagehand = new Stagehand({
  llmClient: new AISdkClient({
	model: bedrock("anthropic.claude-sonnet-4-6-v1:0"),
  }),
});
```

## Troubleshooting

### Common Issues

<AccordionGroup>
<Accordion title="Model doesn't support structured outputs">
**Error**: `Model does not support structured outputs`

**Solution**:
Use models that support function calling/structured outputs. The minimum requirements are:

- Model must support JSON/structured outputs
- Model must have strong reasoning capabilities
- Model must be able to handle complex instructions

For each provider, use their latest models that meet these requirements. Some examples:

- **OpenAI**: GPT-4 series or newer
- **Anthropic**: Claude 3 series or newer 
- **Google**: Gemini 2 series or newer
- **Other providers**: Latest models with structured output support

**Note**: Avoid base language models without structured output capabilities or fine-tuning for instruction following. When in doubt, check our [Model Evaluation](https://www.stagehand.dev/evals) page for up-to-date recommendations.
</Accordion>

<Accordion title="Authentication errors">
**Error**: `Invalid API key` or `Unauthorized`

**Solution**:
- Verify your environment variables are set correctly
- Check API key permissions and quotas
- Ensure you're using the correct API key for the provider
- For Anthropic, make sure you have access to the Claude API
</Accordion>

<Accordion title="Inconsistent automation results">
**Symptoms**: Actions work sometimes but fail other times

**Causes & Solutions**:
- **Weak models**: Use more capable models - check our [Model Evaluation](https://www.stagehand.dev/evals) page for current recommendations
- **High temperature**: Set temperature to 0 for deterministic outputs
- **Complex pages**: Switch to models with higher accuracy scores on our [Model Evaluation](https://www.stagehand.dev/evals) page
- **Rate limits**: Implement retry logic with exponential backoff
- **Context limits**: Reduce page complexity or use models with larger context windows
- **Prompt clarity**: Ensure your automation instructions are clear and specific
</Accordion>

<Accordion title="Slow performance">
**Issue**: Automation takes too long to respond

**Solutions**:
- **Use fast models**: Choose models optimized for speed
  - Any model with < 1s response time
  - Models with "fast" or "flash" variants
- **Optimize settings**: 
  - Use `verbose: 0` to minimize logging overhead
  - Set temperature to 0 for fastest processing
  - Keep max tokens as low as possible
- **Consider local deployment**: Local models can provide lowest latency
- **Batch operations**: Group multiple actions when possible
</Accordion>

<Accordion title="High costs">
**Issue**: LLM usage costs are too high

**Cost Optimization Strategies**:
1. **Switch to cost-effective models**: 
   - Check our [Model Evaluation](https://www.stagehand.dev/evals) page for current cost-performance benchmarks
   - Choose models with lower cost per token that still meet accuracy requirements
   - Consider models optimized for speed to reduce total runtime costs
2. **Optimize token usage**: 
   - Set `verbose: 0` to reduce logging overhead
   - Use concise prompts and limit response length
3. **Smart model selection**: Start with cheaper models, fallback to premium ones only when needed
4. **Cache responses**: Implement LLM response caching for repeated automation patterns
5. **Monitor usage**: Set up billing alerts and track costs per automation run
6. **Batch processing**: Process multiple similar tasks together
</Accordion>
</AccordionGroup>

### Next Steps
<CardGroup cols={2}>
<Card title="Choose Models" href="https://www.stagehand.dev/evals" icon="robot">
  See our Model Evaluation page
</Card>

<Card title="Test Models" href="/v2/configuration/evals" icon="flask-vial">
  Evaluate performance on your specific use cases in our Model Evaluation guide
</Card>

<Card title="Track Costs" href="/v2/configuration/observability" icon="chart-line">
  Monitor token usage and set alerts using our Observability tools
</Card>

<Card title="Cache Results" href="/v2/best-practices/caching" icon="database">
  Store successful patterns using our Caching Guide
</Card>
</CardGroup>

================================================
FILE: packages/docs/v2/configuration/observability.mdx
================================================
---
title: Observability
sidebarTitle: Observability
description: Track Stagehand automation with session visibility and analytics
---

Stagehand provides powerful observability features to help you monitor, track performance, and analyze your browser automation workflows. Focus on session monitoring, resource usage, and operational insights for both Browserbase and local environments.

## Browserbase Session Monitoring

When running on Browserbase, you gain access to comprehensive cloud-based monitoring and session management through the Browserbase API and dashboard.

<div style={{ textAlign: "center" }}>
  <img src="/media/observability.gif" alt="Browserbase Session Observability" width="400" />
</div>

### Live Session Visibility

Browserbase provides real-time visibility into your automation sessions:

**Session Dashboard Features**
- Real-time browser screen recording and replay
- Network request monitoring with detailed timing
- JavaScript console logs and error tracking
- CPU and memory usage metrics
- Session status and duration tracking

**Session Management & API Access**
<CodeGroup>
```typescript TypeScript
import { Stagehand } from "@browserbasehq/stagehand";
import { Browserbase } from "@browserbasehq/sdk";

const browserbase = new Browserbase({
  apiKey: process.env.BROWSERBASE_API_KEY,
});

const stagehand = new Stagehand({
  env: "BROWSERBASE"
});

await stagehand.init();

const sessionInfo = await browserbase.sessions.retrieve(stagehand.sessionId);

console.log("Session status:", sessionInfo.status);
console.log("Session region:", sessionInfo.region);
console.log("CPU usage:", sessionInfo.avgCpuUsage);
console.log("Memory usage:", sessionInfo.memoryUsage);
console.log("Proxy bytes:", sessionInfo.proxyBytes);
```

```python Python
import os
from stagehand import Stagehand
from browserbase import Browserbase

browserbase = Browserbase(
  api_key=os.getenv("BROWSERBASE_API_KEY"),
)

stagehand = Stagehand(
    env="BROWSERBASE",
)

await stagehand.init()

session_info = browserbase.sessions.retrieve(stagehand.session_id)

print(f"Session status: {session_info['status']}")
print(f"Session region: {session_info['region']}")
print(f"CPU usage: {session_info['avgCpuUsage']}")
print(f"Memory usage: {session_info['memoryUsage']}")
print(f"Proxy bytes: {session_info['proxyBytes']}")
```
</CodeGroup>

### Session Analytics & Insights

<CardGroup>
  <Card title="Real-Time Monitoring" icon="chart-line">
    Monitor live session status, resource usage, and geographic distribution. Scale and manage concurrent sessions with real-time insights.
  </Card>

  <Card title="Session Recordings" icon="video">
    Review complete session recordings with frame-by-frame playback. Analyze network requests and debug browser interactions visually.
  </Card>

  <Card title="API Management" icon="code">
    Programmatically access session data, automate lifecycle management, and integrate with monitoring systems through our API.
  </Card>

  <Card title="Usage Monitoring" icon="chart-bar">
    Track resource consumption, session duration, and API usage. Get detailed breakdowns of costs and utilization across your automation.
  </Card>
</CardGroup>

### Session Monitoring & Filtering

Query and monitor sessions by status and metadata:

<CodeGroup>
```typescript TypeScript
import { Browserbase } from "@browserbasehq/sdk";

const browserbase = new Browserbase({
  apiKey: process.env.BROWSERBASE_API_KEY,
});

// List sessions with filtering
async function getFilteredSessions() {
  const sessions = await browserbase.sessions.list({
    status: 'RUNNING'
  });
  
  return sessions.map(session => ({
    id: session.id,
    status: session.status, // RUNNING, COMPLETED, ERROR, TIMED_OUT
    startedAt: session.startedAt,
    endedAt: session.endedAt,
    region: session.region,
    avgCpuUsage: session.avgCpuUsage,
    memoryUsage: session.memoryUsage,
    proxyBytes: session.proxyBytes,
    userMetadata: session.userMetadata
  }));
}

// Query sessions by metadata
async function querySessionsByMetadata(query: string) {
  const sessions = await browserbase.sessions.list({
    q: query
  });
  
  return sessions;
}
```

```python Python
import os
from browserbase import Browserbase

browserbase = Browserbase(
    api_key=os.getenv("BROWSERBASE_API_KEY"),
)

def get_filtered_sessions():
    sessions = browserbase.sessions.list(status="RUNNING")
    
    return [{
        'id': session['id'],
        'status': session['status'],  # RUNNING, COMPLETED, ERROR, TIMED_OUT
        'started_at': session['startedAt'],
        'ended_at': session['endedAt'],
        'region': session['region'],
        'avg_cpu_usage': session['avgCpuUsage'],
        'memory_usage': session['memoryUsage'],
        'proxy_bytes': session['proxyBytes'],
        'user_metadata': session['userMetadata']
    } for session in sessions]

def query_sessions_by_metadata(query):
    sessions = browserbase.sessions.list(q=query)
    
    return sessions
```
</CodeGroup>

## Local Environment Monitoring

For local development, Stagehand provides performance monitoring and resource tracking capabilities directly on your machine.

### Performance Tracking

<CodeGroup>
```typescript TypeScript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "LOCAL",
  verbose: 1, // Monitor performance without debug noise
});

// Track local automation metrics
const startTime = Date.now();
const initialMetrics = stagehand.metrics;

// ... perform automation tasks

const finalMetrics = stagehand.metrics;
const executionTime = Date.now() - startTime;

console.log('Local Performance Summary:', {
  executionTime: `${executionTime}ms`,
  totalTokens: finalMetrics.totalPromptTokens + finalMetrics.totalCompletionTokens,
  averageResponseTime: finalMetrics.totalInferenceTimeMs / 3, // Assuming 3 operations
  tokensPerSecond: (finalMetrics.totalPromptTokens + finalMetrics.totalCompletionTokens) / (executionTime / 1000)
});
```

```python Python
from stagehand import Stagehand
import time

stagehand = Stagehand(
    env="LOCAL",
    verbose=1,  # Monitor performance without debug noise
)

# Track local automation metrics
start_time = time.time()
initial_metrics = stagehand.metrics

# ... perform automation tasks

final_metrics = stagehand.metrics
execution_time = (time.time() - start_time) * 1000  # Convert to ms

print('Local Performance Summary:', {
    'execution_time': f"{execution_time:.0f}ms",
    'total_tokens': final_metrics['total_prompt_tokens'] + final_metrics['total_completion_tokens'],
    'average_response_time': final_metrics['total_inference_time_ms'] / 3,  # Assuming 3 operations
    'tokens_per_second': (final_metrics['total_prompt_tokens'] + final_metrics['total_completion_tokens']) / (execution_time / 1000)
})
```
</CodeGroup>

## Resource Usage Monitoring

When running locally, monitor system resource usage and browser performance:

<CodeGroup>
```typescript TypeScript
import { Stagehand } from "@browserbasehq/stagehand";
import * as os from 'os';
import { performance } from 'perf_hooks';

/**
 * Collects periodic samples of this process's heap usage and the system
 * 1-minute load average so a local automation run can be summarized afterwards.
 */
class LocalResourceMonitor {
  private cpuUsage: number[] = [];
  private memoryUsage: number[] = [];

  /**
   * Starts sampling once per second.
   *
   * @returns The interval handle; pass it to `clearInterval` to stop sampling.
   */
  startMonitoring() {
    const interval = setInterval(() => {
      // Track system resources
      const memUsage = process.memoryUsage();
      this.memoryUsage.push(memUsage.heapUsed / 1024 / 1024); // MB

      // Track CPU (simplified): the 1-minute load average, not a percentage
      const loadAvg = os.loadavg()[0];
      this.cpuUsage.push(loadAvg);
    }, 1000);

    return interval;
  }

  /**
   * Summarizes the samples collected so far.
   *
   * @returns Average and peak heap usage in MB, average load, and sample count.
   *   All figures are `0` when no sample has been recorded yet, instead of the
   *   `NaN` / `-Infinity` an empty average or `Math.max()` would produce.
   */
  getResourceSummary() {
    const mean = (samples: number[]): number =>
      samples.length === 0
        ? 0
        : samples.reduce((a, b) => a + b, 0) / samples.length;

    // reduce instead of Math.max(...samples): safe for empty and very long arrays.
    const peak = (samples: number[]): number =>
      samples.reduce((max, value) => Math.max(max, value), 0);

    return {
      avgMemoryUsage: mean(this.memoryUsage),
      peakMemoryUsage: peak(this.memoryUsage),
      avgCpuLoad: mean(this.cpuUsage),
      totalDataPoints: this.cpuUsage.length
    };
  }
}

const monitor = new LocalResourceMonitor();
const interval = monitor.startMonitoring();

const stagehand = new Stagehand({ env: "LOCAL" });

// ... run automation

clearInterval(interval);
console.log('Resource Usage:', monitor.getResourceSummary());
```

```python Python
import psutil
import time
from typing import List
from stagehand import Stagehand

class LocalResourceMonitor:
    """Samples CPU and memory utilization on a background thread.

    Call ``start_monitoring()`` before the automation run, ``stop_monitoring()``
    after it, then ``get_resource_summary()`` to aggregate the samples.
    """

    def __init__(self):
        self.cpu_usage: List[float] = []
        self.memory_usage: List[float] = []
        self.monitoring = False

    def start_monitoring(self):
        """Start the daemon sampling thread and return it."""
        self.monitoring = True
        import threading

        def monitor_resources():
            while self.monitoring:
                # Track CPU and memory usage.
                # cpu_percent(interval=1) blocks for one second while measuring,
                # so it already paces the loop at one sample per second; an extra
                # sleep here would halve the sampling rate.
                cpu_percent = psutil.cpu_percent(interval=1)
                memory_info = psutil.virtual_memory()

                self.cpu_usage.append(cpu_percent)
                self.memory_usage.append(memory_info.percent)

        thread = threading.Thread(target=monitor_resources)
        thread.daemon = True  # do not keep the interpreter alive for sampling
        thread.start()
        return thread

    def stop_monitoring(self):
        """Ask the sampling thread to exit after its current measurement."""
        self.monitoring = False

    def get_resource_summary(self):
        """Return average/peak CPU and memory figures plus the sample count.

        Returns ``{'error': 'No monitoring data collected'}`` when no sample
        has been recorded yet.
        """
        if not self.cpu_usage or not self.memory_usage:
            return {'error': 'No monitoring data collected'}

        return {
            'avg_cpu_usage': sum(self.cpu_usage) / len(self.cpu_usage),
            'peak_cpu_usage': max(self.cpu_usage),
            'avg_memory_usage': sum(self.memory_usage) / len(self.memory_usage),
            'peak_memory_usage': max(self.memory_usage),
            'total_data_points': len(self.cpu_usage)
        }

monitor = LocalResourceMonitor()
monitor.start_monitoring()

stagehand = Stagehand(env="LOCAL")

# ... run automation

monitor.stop_monitoring()
print('Resource Usage:', monitor.get_resource_summary())
```
</CodeGroup>


  <Card title="LLM Usage" icon="chart-line" href="/v2/configuration/evals">
    Monitor token usage, costs, and speed. Set up automated alerting for critical failures. Implement cost tracking across different environments. Use session analytics to optimize automation workflows.
  </Card>


## Real-Time Metrics & Monitoring

### Basic Usage Tracking

Monitor your automation's resource usage in real-time with `stagehand.metrics`:

<CodeGroup>
```typescript TypeScript
// Get current metrics
console.log(stagehand.metrics);

// Monitor during automation
const startTime = Date.now();
const initialMetrics = stagehand.metrics;

// ... perform automation tasks

const finalMetrics = stagehand.metrics;
const executionTime = Date.now() - startTime;

console.log('Automation Summary:', {
  totalTokens: finalMetrics.totalPromptTokens + finalMetrics.totalCompletionTokens,
  totalCost: calculateCost(finalMetrics),
  executionTime,
  efficiency: (finalMetrics.totalPromptTokens + finalMetrics.totalCompletionTokens) / executionTime
});
```

```python Python
# Get current metrics
print(stagehand.metrics)

# Monitor during automation
import time
start_time = time.time()
initial_metrics = stagehand.metrics

# ... perform automation tasks

final_metrics = stagehand.metrics
execution_time = (time.time() - start_time) * 1000  # Convert to ms

print('Automation Summary:', {
    'total_tokens': final_metrics['total_prompt_tokens'] + final_metrics['total_completion_tokens'],
    'total_cost': calculate_cost(final_metrics),
    'execution_time': execution_time,
    'efficiency': (final_metrics['total_prompt_tokens'] + final_metrics['total_completion_tokens']) / execution_time
})
```
</CodeGroup>

### Understanding Metrics Data

The metrics object provides detailed breakdown by Stagehand operation:

<CodeGroup>
```typescript TypeScript
{
  actPromptTokens: 4011,
  actCompletionTokens: 51,
  actInferenceTimeMs: 1688,

  extractPromptTokens: 4200,
  extractCompletionTokens: 243,
  extractInferenceTimeMs: 4297,

  observePromptTokens: 347,
  observeCompletionTokens: 43,
  observeInferenceTimeMs: 903,

  totalPromptTokens: 8558,
  totalCompletionTokens: 337,
  totalInferenceTimeMs: 6888
}
```

```python Python
{
  "act_prompt_tokens": 4011,
  "act_completion_tokens": 51,
  "act_inference_time_ms": 1688,

  "extract_prompt_tokens": 4200,
  "extract_completion_tokens": 243,
  "extract_inference_time_ms": 4297,

  "observe_prompt_tokens": 347,
  "observe_completion_tokens": 43,
  "observe_inference_time_ms": 903,

  "total_prompt_tokens": 8558,
  "total_completion_tokens": 337,
  "total_inference_time_ms": 6888
}
```
</CodeGroup>

### Log Inference to File

You can also log inference to a file by setting `logInferenceToFile` to `true`. This will create a directory called `inference_summary` in your project's root directory.
<CodeGroup>
```typescript TypeScript
const stagehand = new Stagehand({
  logInferenceToFile: true,    
});
```

```python Python
stagehand = Stagehand(
    log_inference_to_file=True,             
)
```
</CodeGroup>
The `inference_summary` directory provides granular analysis data:
```
inference_summary/
├── act_summary/
│   ├── {timestamp}.json
│   ├── {timestamp}.json
│   ├── ...
│   └── act_summary.json
├── extract_summary/
│   ├── {timestamp}.json
│   ├── {timestamp}.json
│   ├── ...
│   └── extract_summary.json
└── observe_summary/
    ├── {timestamp}.json
    ├── {timestamp}.json
    ├── ...
    └── observe_summary.json
```

### Log File Structure

Each operation creates detailed logs for analysis:
```typescript
{
  "act_summary": [
    {
      "act_inference_type": "act",
      "timestamp": "20250329_080446068",
      "LLM_input_file": "20250329_080446068_act_call.txt",
      "LLM_output_file": "20250329_080447019_act_response.txt",
      "prompt_tokens": 3451,
      "completion_tokens": 45,
      "inference_time_ms": 951
    },
    ...
  ],
}
```


## Best Practices

<AccordionGroup>
<Accordion title="Production Monitoring">
- Track session success rates and failure patterns
- Monitor resource usage and scaling requirements
- Set up automated alerting for critical failures
- Implement cost tracking across different environments
- Use session analytics to optimize automation workflows
</Accordion>

<Accordion title="Performance Optimization">
- Compare Browserbase vs local execution times
- Monitor token usage and inference costs across models
- Track geographic performance differences
- Identify bottlenecks in automation workflows
- Optimize for cost-effectiveness and speed
</Accordion>

<Accordion title="Operational Insights">
- Track session distribution across regions
- Monitor concurrent session limits and scaling
- Analyze failure patterns and common error scenarios
- Use session recordings for root cause analysis
- Implement custom metadata for workflow categorization
</Accordion>

<Accordion title="Integration & Alerting">
- Integrate session APIs with monitoring dashboards
- Set up automated notifications for session failures  
- Track SLA compliance and performance benchmarks
- Monitor resource costs and usage patterns
- Use analytics data for capacity planning and optimization
</Accordion>
</AccordionGroup>

For detailed logging and debugging capabilities, see [Logging](/v2/configuration/logging).

================================================
FILE: packages/docs/v2/first-steps/ai-rules.mdx
================================================
---
title: AI Rules
description: Using AI to write Stagehand code faster, and better.
---

You're likely using AI to write code, and there's a **right and wrong way to do it.** This page is a collection of rules, configs, and copy‑paste snippets that help your AI agents/assistants write performant Stagehand code as fast as possible.

## Quickstart

<CardGroup cols={2}>
  <Card title="Add MCP servers" icon="screwdriver-wrench">
    Configure Browserbase (Stagehand), Context7, DeepWiki, and Stagehand Docs in your MCP client. 
  </Card>
  <Card title="Pin editor rules" icon="memo">
    Drop in `.cursorrules` and `claude.md` so AI agents/assistants always emit Stagehand patterns.
  </Card>
</CardGroup>

## Using MCP Servers

MCP (Model Context Protocol) servers act as intermediaries that connect AI systems to external data sources and tools. These servers enable your coding assistant to access real-time information, execute tasks, and retrieve structured data to enhance code generation accuracy.

The following **MCP servers** provide specialized access to Stagehand documentation and related resources:

<Accordion title="Context7 by Upstash" icon="database">
Provides semantic search across documentation and codebase context. Context7 enables AI assistants to find relevant code patterns, examples, and implementation details from your project history. It maintains contextual understanding of your development workflow and can surface related solutions from previous work.

**Installation:**
```json
{
  "mcpServers": {
    "context7": {
      "command": "npx",
      "args": ["-y", "@upstash/context7-mcp"]
    }
  }
}
```
</Accordion>

<Accordion title="DeepWiki by Cognition" icon="book-open">
Offers deep indexing of GitHub repositories and documentation. DeepWiki allows AI agents to understand project architecture, API references, and best practices from the entire Stagehand ecosystem. It provides comprehensive knowledge about repository structure, code relationships, and development patterns.

**Installation:**
```json
{
  "mcpServers": {
    "deepwiki": {
      "url": "https://mcp.deepwiki.com/mcp"
    }
  }
}
```
</Accordion>

<Accordion title="Stagehand Docs by Mintlify" icon="mintbit">
Direct access to official Stagehand documentation. This MCP server provides AI assistants with up-to-date API references, configuration options, and usage examples for accurate code generation. Mintlify auto-generates this server from the official docs, ensuring your AI assistant always has the latest information.

**Usage:**
```json
{
  "mcpServers": {
    "stagehand-docs": {
      "url": "https://docs.stagehand.dev/mcp"
    }
  }
}
```
</Accordion>

**How MCP Servers Enhance Your Development:**
- **Real-time Documentation Access**: AI assistants can query the latest Stagehand docs, examples, and best practices
- **Context-Aware Code Generation**: Servers provide relevant code patterns and configurations based on your specific use case
- **Reduced Integration Overhead**: Standardized protocol eliminates the need for custom integrations with each documentation source
- **Enhanced Accuracy**: AI agents receive structured, up-to-date information rather than relying on potentially outdated training data


<Tip>
**Prompting tip:** 
Explicitly ask your coding agent/assistant to use these MCP servers to fetch relevant information from the docs so they have better context and know how to write proper Stagehand code. 

e.g., **"Use the stagehand-docs MCP to fetch the act/observe guidelines, then generate code that follows them. Prefer cached observe results."**
</Tip>


## Editor rule files (copy‑paste)

Drop these in `.cursorrules`, `.windsurfrules`, `claude.md`, or any agent rule framework:

<Accordion title="TypeScript">

``````md
# Stagehand Project

This is a project that uses [Stagehand](https://github.com/browserbase/stagehand), which amplifies Playwright with AI-powered `act`, `extract`, and `observe` methods added to the Page class.

`Stagehand` is a class that provides configuration and browser automation capabilities with:
- `stagehand.page`: A StagehandPage object (extends Playwright Page)
- `stagehand.context`: A StagehandContext object (extends Playwright BrowserContext)
- `stagehand.agent()`: Create AI-powered agents for autonomous multi-step workflows
- `stagehand.init()`: Initialize the browser session
- `stagehand.close()`: Clean up resources

`Page` extends Playwright's Page class with AI-powered methods:
- `act()`: Perform actions on web elements using natural language
- `extract()`: Extract structured data from pages using schemas
- `observe()`: Plan actions and get selectors before executing

`Agent` provides autonomous Computer Use Agent capabilities:
- `execute()`: Perform complex multi-step tasks using natural language instructions

`Context` extends Playwright's BrowserContext class for browser session management.

Use the following rules to write code for this project.

- To plan an instruction like "click the sign in button", use Stagehand `observe` to get the action to execute.

```typescript
const results = await page.observe("Click the sign in button");
```

You can also pass in the following params:

```typescript
await page.observe({
  instruction: "the instruction to execute",
  returnAction: true 
});
```

- The result of `observe` is an array of `ObserveResult` objects that can directly be used as params for `act` like this:
  ```typescript
  const results = await page.observe({
    instruction: "the instruction to execute",
    returnAction: true, // return the action to execute
  });

  await page.act(results[0]);
  ```
  
- When writing code that needs to extract data from the page, use Stagehand `extract`. Explicitly pass the following params by default:

```typescript
const { someValue } = await page.extract({
  instruction: "the instruction to execute",
  schema: z.object({
    someValue: z.string(),
  }), // The schema to extract
});
```

## Initialize

```typescript
import { Stagehand, Page, BrowserContext } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "BROWSERBASE"
});

await stagehand.init();

const page = stagehand.page; // Playwright Page with act, extract, and observe methods

const context = stagehand.context; // Playwright BrowserContext
```
### Configuration Options
```typescript
const StagehandConfig = {
  env: "BROWSERBASE" | "LOCAL", // Environment to run in
  apiKey: process.env.BROWSERBASE_API_KEY, // Browserbase API key
  projectId: process.env.BROWSERBASE_PROJECT_ID, // Browserbase project ID
  debugDom: true, // Enable DOM debugging features
  headless: false, // Run browser in headless mode
  domSettleTimeoutMs: 30_000, // Timeout for DOM to settle
  enableCaching: true, // Enable action caching
  modelName: "gpt-4o", // AI model to use
  modelClientOptions: {
    apiKey: process.env.OPENAI_API_KEY, // OpenAI API key
  },
};
```
## Act

You can act directly with string instructions:

```typescript
await page.act("Click the sign in button");
```

Use variables for dynamic form filling:

```typescript
await page.act({
  action: `Enter the following information:
    Name: %name%
    Email: %email%
    Phone: %phone%`,
  variables: {
    name: "John Doe",
    email: "john@example.com", 
    phone: "+1-555-0123"
  }
});
```

**Best Practices:**
- Cache the results of `observe` to avoid unexpected DOM changes
- Keep actions atomic and specific (e.g., "Click the sign in button" not "Sign in to the website")
- Use variable substitution for dynamic data entry

Act `action` should be as atomic and specific as possible, e.g. "Click the sign in button" or "Type 'hello' into the search input".
AVOID actions that are more than one step, e.g. "Order me pizza" or "Send an email to Paul asking him to call me".

## Extract

### Simple String Extraction

```typescript
const signInButtonText = await page.extract("extract the sign in button text");
```

### Structured Extraction with Schema (Recommended)

Always use Zod schemas for structured data extraction:

```typescript
import { z } from "zod/v3";

const data = await page.extract({
  instruction: "extract the sign in button text",
  schema: z.object({
    text: z.string(),
  }),
});
```

### Array Extraction

To extract multiple items, wrap the array in a single object:

```typescript
const data = await page.extract({
  instruction: "extract the text inside all buttons",
  schema: z.object({
    buttons: z.array(z.string()),
  })
});
```

### Complex Object Extraction

For more complex data structures:

```typescript
const productData = await page.extract({
  instruction: "extract product information from this page",
  schema: z.object({
    title: z.string(),
    price: z.number(),
    description: z.string(),
    features: z.array(z.string()),
    availability: z.boolean(),
  }),
});
```

### Schema Validation

```typescript
import { validateZodSchema } from "./utils.js";
import { z } from "zod/v3";

const schema = z.object({ name: z.string() });
const isValid = validateZodSchema(schema, { name: "John" }); // true
```

## Agent System

Stagehand provides an Agent System for autonomous web browsing using Computer Use Agents (CUA). Agents execute multi-step workflows using natural language instructions.

### Creating Agents

```typescript
// Basic agent (default)
const agent = stagehand.agent();

// OpenAI agent
const agent = stagehand.agent({
  provider: "openai",
  model: "computer-use-preview",
  instructions: "You are a helpful assistant that can use a web browser.",
  options: { 
    apiKey: process.env.OPENAI_API_KEY 
  }
});

// Anthropic agent
const agent = stagehand.agent({
  provider: "anthropic", 
  model: "claude-sonnet-4-20250514",
  instructions: "You are a helpful assistant that can use a web browser.",
  options: { 
    apiKey: process.env.ANTHROPIC_API_KEY 
  }
});
```
### Agent Execution
```typescript
// Simple task
const result = await agent.execute("Extract the title from this webpage");

// Complex multi-step task
const result = await agent.execute({
  instruction: "Apply for the first engineer position with mock data",
  maxSteps: 20,
  autoScreenshot: true
});
```

### Best Practices
- Be specific with instructions: `"Fill out the contact form with name 'John Doe' and submit it"`
- Break down complex tasks into smaller steps
- Use error handling with try/catch blocks
- Combine agents for navigation with traditional methods for precise data extraction

```typescript
// Good: Specific instructions
await agent.execute("Navigate to products page and filter by 'Electronics'");

// Avoid: Vague instructions  
await agent.execute("Do some stuff on this page");
```

## Project Structure Best Practices

- Store configurations in `stagehand.config.ts`
- Use environment variables for API keys (see `.env.example`)
- Implement main automation logic in functions that accept `{ page, context, stagehand }`
- Use TypeScript with proper imports from `@browserbasehq/stagehand`
``````

</Accordion>

<Accordion title="Python">

``````md
# Stagehand Python Project

This is a project that uses [Stagehand Python](https://github.com/browserbase/stagehand-python), which provides AI-powered browser automation with `act`, `extract`, and `observe` methods.

`Stagehand` is a class that provides configuration and browser automation capabilities with:
- `stagehand.page`: A StagehandPage object (extends Playwright Page)
- `stagehand.context`: A StagehandContext object (extends Playwright BrowserContext)
- `stagehand.agent()`: Create AI-powered agents for autonomous multi-step workflows
- `stagehand.init()`: Initialize the browser session
- `stagehand.close()`: Clean up resources

`Page` extends Playwright's Page class with AI-powered methods:
- `act()`: Perform actions on web elements using natural language
- `extract()`: Extract structured data from pages using schemas
- `observe()`: Plan actions and get selectors before executing

`Agent` provides autonomous Computer Use Agent capabilities:
- `execute()`: Perform complex multi-step tasks using natural language instructions

Use the following rules to write code for this project.

- To plan an instruction like "click the sign in button", use Stagehand `observe` to get the action to execute.

```python
results = await page.observe("Click the sign in button")
```

You can also pass in the following params:

```python
await page.observe(
    instruction="the instruction to execute",
    draw_overlay=True  # Show visual overlay on observed elements
)
```

- The result of `observe` is a list of `ObserveResult` objects that can directly be used as params for `act` like this:
  ```python
  results = await page.observe("Click the sign in button")
  await page.act(results[0])
  ```
- When writing code that needs to extract data from the page, use Stagehand `extract`. Use Pydantic models for schemas:

```python
from pydantic import BaseModel

class ExtractedData(BaseModel):
    some_value: str

result = await page.extract(
    instruction="the instruction to execute",
    schema=ExtractedData
)
```

## Initialize

```python
from stagehand import Stagehand, StagehandConfig
import asyncio
import os
from dotenv import load_dotenv

load_dotenv()

async def main():
    config = StagehandConfig(
        env="BROWSERBASE",  # or "LOCAL"
        api_key=os.getenv("BROWSERBASE_API_KEY"),
        project_id=os.getenv("BROWSERBASE_PROJECT_ID"),
        model_name="google/gemini-2.5-flash-preview-05-20",
        model_api_key=os.getenv("MODEL_API_KEY"),
    )
    
    # Recommended: Use as async context manager
    async with Stagehand(config) as stagehand:
        page = stagehand.page
        # Your automation code here
        
    # Alternative: Manual initialization
    stagehand = Stagehand(config)
    await stagehand.init()
    page = stagehand.page
    # Your automation code here
    await stagehand.close()

if __name__ == "__main__":
    asyncio.run(main())
```

### Configuration Options

Key configuration options in `StagehandConfig`:

```python
config = StagehandConfig(
    env="BROWSERBASE",  # or "LOCAL"
    api_key=os.getenv("BROWSERBASE_API_KEY"),
    project_id=os.getenv("BROWSERBASE_PROJECT_ID"),
    model_name="google/gemini-2.5-flash-preview-05-20",
    model_api_key=os.getenv("MODEL_API_KEY"),
    verbose=1,  # 0=minimal, 1=medium, 2=detailed
    dom_settle_timeout_ms=30000,
    self_heal=True,  # Enable self-healing functionality
)
```

## Act

You can act directly with string instructions:

```python
await page.act("Click the sign in button")
```

Pass form values directly in the instruction:

```python
await page.act(
    "Enter the following information: Name: John Doe, Email: john@example.com"
)
```

**Best Practices:**
- Cache the results of `observe` to avoid unexpected DOM changes
- Keep actions atomic and specific (e.g., "Click the sign in button" not "Sign in to the website")
- Use specific, descriptive instructions

Act `action` should be as atomic and specific as possible, e.g. "Click the sign in button" or "Type 'hello' into the search input".
AVOID actions that are more than one step, e.g. "Order me pizza" or "Send an email to Paul asking him to call me".

## Extract

### Simple String Extraction
```python
sign_in_button_text = await page.extract("extract the sign in button text")
```

### Structured Extraction with Schema (Recommended)
Always use Pydantic models for structured data extraction:

```python
from pydantic import BaseModel, Field
from typing import List

class ButtonData(BaseModel):
    text: str = Field(..., description="Button text content")

data = await page.extract(
    instruction="extract the sign in button text",
    schema=ButtonData
)
```

### Array Extraction
For arrays, use List types:

```python
from pydantic import BaseModel, Field
from typing import List

class ButtonsData(BaseModel):
    buttons: List[str] = Field(..., description="List of button texts")

data = await page.extract(
    instruction="extract the text inside all buttons",
    schema=ButtonsData
)
```

### Complex Object Extraction
For more complex data structures:

```python
from pydantic import BaseModel, Field
from typing import List

class Company(BaseModel):
    name: str = Field(..., description="Company name")
    description: str = Field(..., description="Brief company description")

class Companies(BaseModel):
    companies: List[Company] = Field(..., description="List of companies")

companies_data = await page.extract(
    "Extract names and descriptions of 5 companies",
    schema=Companies
)
```

## Agent System

Stagehand provides an Agent System for autonomous web browsing using Computer Use Agents (CUA).

### Creating Agents

```python
# Basic agent (uses default model)
agent = stagehand.agent()

# OpenAI agent
agent = stagehand.agent(
    model="computer-use-preview",
    instructions="You are a helpful web navigation assistant.",
    options={"apiKey": os.getenv("OPENAI_API_KEY")}
)

# Anthropic agent
agent = stagehand.agent(
    model="claude-sonnet-4-20250514",
    instructions="You are a helpful web navigation assistant.",
    options={"apiKey": os.getenv("ANTHROPIC_API_KEY")}
)
```

### Agent Execution

```python
# Simple task
result = await agent.execute("Play a game of 2048")

# Complex multi-step task with options
result = await agent.execute(
    instruction="Apply for the first engineer position with mock data",
    max_steps=20,
    auto_screenshot=True,
    wait_between_actions=1000  # milliseconds
)
```

**Best Practices:**
- Be specific with instructions: `"Fill out the contact form with name 'John Doe' and submit it"`
- Break down complex tasks into smaller steps
- Use error handling with try/except blocks
- Combine agents for navigation with traditional methods for precise data extraction

```python
# Good: Specific instructions
await agent.execute("Navigate to products page and filter by 'Electronics'")

# Avoid: Vague instructions
await agent.execute("Do some stuff on this page")
```

## Project Structure Best Practices

- Store configurations in environment variables or config files
- Use async/await patterns consistently
- Implement main automation logic in async functions
- Use async context managers for resource management
- Use type hints and Pydantic models for data validation
- Handle exceptions appropriately with try/except blocks
``````

</Accordion>

## Security notes

- Do not embed secrets in docs or rule files; use env vars in MCP configs.
- Avoid broad actions that may trigger unintended navigation; prefer `observe` first.

## Resources/references

- Context7 MCP (Upstash)
  - https://github.com/upstash/context7
- DeepWiki MCP
  - https://mcp.deepwiki.com/
- Stagehand Docs MCP (Mintlify)
  - https://docs.stagehand.dev/mcp


================================================
FILE: packages/docs/v2/first-steps/installation.mdx
================================================
---
title: Installation
description: Integrate Stagehand into an existing project.
---

Install Stagehand in your current app with the TypeScript or Python SDK.

<Tip>
For TypeScript/Node.js: We highly recommend using the Node.js runtime environment to run Stagehand scripts, as opposed to newer alternatives like Deno or Bun. 

**Bun does not support Stagehand** since it doesn't support [Playwright](https://github.com/search?q=repo:oven-sh/bun+playwright&type=issues).

For Python: We require Python 3.9+ and recommend using [uv](https://docs.astral.sh/uv/) to manage your virtual environment.
</Tip>

<Tabs>
<Tab title="TypeScript">

### Install dependencies

<CodeGroup>
```bash npm
npm install @browserbasehq/stagehand playwright zod
```

```bash pnpm
pnpm add @browserbasehq/stagehand playwright zod
```

```bash yarn
yarn add @browserbasehq/stagehand playwright zod
```
</CodeGroup>

<Tip>
If you plan to run locally, install browsers once: `npx playwright install`.
For cloud browser sessions, skip this.
</Tip>

### Configure environment

Set environment variables (or a `.env` via your framework):

<CodeGroup>
```bash Bash
OPENAI_API_KEY=your_api_key
BROWSERBASE_API_KEY=your_api_key
BROWSERBASE_PROJECT_ID=your_project_id
```
</CodeGroup>

### Use in your codebase

Add Stagehand where you need browser automation.

<CodeGroup>
```typescript TypeScript
import "dotenv/config";
import { Stagehand } from "@browserbasehq/stagehand";
import { z } from "zod/v3";

async function main() {
  const stagehand = new Stagehand({
    env: "BROWSERBASE"
  });

  await stagehand.init();
  const page = stagehand.page;

  await page.goto("https://example.com");
  
  // Act on the page
  await page.act("Click the sign in button");
  
  // Extract structured data
  const { title } = await page.extract({
    instruction: "extract the page title",
    schema: z.object({
      title: z.string(),
    }),
  });

  console.log(title);
  await stagehand.close();
}

main().catch((err) => {
  console.error(err);
  process.exit(1);
});
```
</CodeGroup>

</Tab>

<Tab title="Python">

### Add dependencies

<CodeGroup>

```bash uv
uv add stagehand
```

```bash pip
pip install stagehand
```

</CodeGroup>

### Configure environment

Set environment variables (or a `.env` via your framework):

<CodeGroup>
```bash Bash
MODEL_API_KEY=your_api_key
BROWSERBASE_API_KEY=your_api_key
BROWSERBASE_PROJECT_ID=your_project_id
```
</CodeGroup>

### Use in your codebase

<CodeGroup>
```python Python
import os
import asyncio
from stagehand import Stagehand

async def main():
    stagehand = Stagehand(
        env="BROWSERBASE",
        model_api_key=os.getenv("MODEL_API_KEY")
    )
    await stagehand.init()
    page = stagehand.page
    
    await page.goto("https://example.com")
    
    # Act on the page
    await page.act("Click the sign in button")
    
    # Extract structured data
    result = await page.extract({
        "instruction": "extract the page title",
        "schema": {
            "title": {
                "type": "string"
            }
        }
    })
    
    print(result["title"])
    await stagehand.close()

if __name__ == "__main__":
    asyncio.run(main())
```
</CodeGroup>

</Tab>

</Tabs>

## Next steps

<CardGroup cols={2}>
  <Card 
    title="Configuration"
    icon="gear"
    href="/v2/configuration/browser"
  >
    Environment, Browserbase vs Local, logging, timeouts, LLM customization
  </Card>
  <Card 
    title="Act"
    icon="arrow-pointer"
    href="/v2/basics/act"
  >
    Perform precise actions with natural language
  </Card>
  <Card 
    title="Extract"
    icon="download"
    href="/v2/basics/extract"
  >
    Typed data extraction with Zod schemas
  </Card>
  <Card 
    title="Observe"
    icon="eye"
    href="/v2/basics/observe"
  >
    Discover elements and suggested actions
  </Card>
</CardGroup>

================================================
FILE: packages/docs/v2/first-steps/introduction.mdx
================================================
---
title: Introducing Stagehand
sidebarTitle: Introduction
description: Developers use Stagehand to reliably automate the web.
---

Stagehand is a browser automation framework used to control web browsers with natural language and code. By combining the power of AI with the precision of code, Stagehand makes web automation flexible, maintainable, and actually reliable.

## The Problem with Browser Automation

Traditional frameworks like Playwright and Puppeteer force you to write brittle scripts that break with every UI change. Web agents promise to solve this with AI, but leave you at the mercy of unpredictable behavior.

**You're stuck between two bad options:**
- **Too brittle**: Traditional selectors break when websites change
- **Too agentic**: AI agents are unpredictable and impossible to debug

## Enter Stagehand

Stagehand gives you the best of both worlds through four powerful primitives that let you choose exactly how much AI to use:

<CardGroup cols={2}>
  <Card title="Act" icon="play" href="/v2/basics/act">
    Execute actions using natural language
  </Card>
  <Card title="Extract" icon="database" href="/v2/basics/extract">
    Pull structured data with schemas
  </Card>
  <Card title="Observe" icon="eye" href="/v2/basics/observe">
    Discover available actions on any page
  </Card>
  <Card title="Agent" icon="robot" href="/v2/basics/agent">
    Automate entire workflows autonomously
  </Card>
</CardGroup>

<CodeGroup>
```typescript TypeScript
// Act - Execute natural language actions
await page.act("click the login button");

// Extract - Pull structured data
const { price } = await page.extract({
  schema: z.object({ price: z.number() })
});

// Observe - Discover available actions
const actions = await page.observe("find submit buttons");

// Agent - Automate entire workflows
const agent = stagehand.agent({
    provider: "anthropic",
    model: "claude-sonnet-4-20250514",
    options: {
      apiKey: process.env.ANTHROPIC_API_KEY,
    },
})
await agent.execute("apply for this job");
```
```python Python
# Act - Execute natural language actions
await page.act("click the login button")

# Extract - Pull structured data
result = await page.extract(
  schema={"price": float}
)

# Observe - Discover available actions
actions = await page.observe("find submit buttons")

# Agent - Automate entire workflows
await agent.execute("apply for this job")
```
</CodeGroup>


## Why Developers Choose Stagehand

- **Precise Control**: Mix AI-powered actions with deterministic code. You decide exactly how much AI to use.

- **Actually Repeatable**: Save and replay actions exactly. No more "it worked on my machine" with browser automations.

- **Maintainable at Scale**: One script can automate multiple websites. When sites change, your automations adapt.

- **Composable Tools**: Choose your level of automation with Act, Extract, Observe, and Agent.

## Built for Modern Development
Stagehand is designed for developers building production browser automations and AI agents that need reliable web access.

<AccordionGroup>
  <Accordion title="Full Playwright Compatibility">
    Use any Playwright API alongside Stagehand. You're never locked into our abstractions.
  </Accordion>
  <Accordion title="TypeScript & Python SDKs">
    First-class support for both ecosystems with type safety and IDE autocomplete.
  </Accordion>
  <Accordion title="Works Everywhere">
    Compatible with all Chromium-based browsers: Chrome, Edge, Arc, Brave, and more.
  </Accordion>
  <Accordion title="Built by Browserbase">
    Created and maintained by the team behind enterprise browser infrastructure.
  </Accordion>
</AccordionGroup>

## Get Started in 60 Seconds
<Info>
  **Pro tip**: For best results, we recommend using Stagehand with [Browserbase](https://www.browserbase.com) for reliable cloud browser infrastructure.
</Info>
<CardGroup cols={2}>
  <Card
    title="Quickstart"
    icon="rocket"
    href="/v2/first-steps/quickstart"
  >
    Build your first automation in under a minute
  </Card>
  <Card
    title="Try Director"
    icon="wand-magic-sparkles"
    href="https://www.director.ai"
  >
    Generate Stagehand scripts with AI
  </Card>
  <Card
    title="View Templates"
    icon="code"
    href="https://www.browserbase.com/templates"
  >
    See real-world automation examples
  </Card>
  <Card
    title="Join Discord"
    icon="discord"
    href="https://stagehand.dev/discord"
  >
    Get help from the community
  </Card>
</CardGroup>


================================================
FILE: packages/docs/v2/first-steps/quickstart.mdx
================================================
---
title: Quickstart
description: 'Stagehand allows you to build web automations with natural language and code.'
---

If this is your **first time using Stagehand**, you should try [Director](https://director.ai) first. It's an agent that allows you to build Stagehand workflows using natural language. You can also try Stagehand using our [MCP server](/v2/integrations/mcp/introduction).

Otherwise, the quickest way to start with Stagehand is with our CLI. It scaffolds a ready‑to‑run Stagehand app with sensible defaults and an example script.

<Note>
This quickstart is for **TypeScript**. For **Python**, see the [installation guide](/v2/first-steps/installation).
</Note>

## 1) Create a sample project

<CodeGroup>
```bash Bash
npx create-browser-app
```
</CodeGroup>

## 2) Run it

Follow the CLI prompts to enter the project directory and add your API keys. Then run the example script.

<CodeGroup>
```bash Bash
cd my-stagehand-app # Enter the project directory
cp .env.example .env  # Add your API keys
npm start # Run the example script
```
</CodeGroup>

## 3) Use Stagehand (act, extract, observe)

The scaffold includes an `index.ts` file that contains the example script. Here's what it looks like:

<CodeGroup>
```typescript TypeScript
import "dotenv/config";
import { Stagehand } from "@browserbasehq/stagehand";

async function main() {
  const stagehand = new Stagehand({
    env: "BROWSERBASE"
  });

  await stagehand.init();

  console.log(`Stagehand Session Started`);
  console.log(`Watch live: https://browserbase.com/sessions/${stagehand.browserbaseSessionID}`);

  const page = stagehand.page;

  await page.goto("https://stagehand.dev");

  const extractResult = await page.extract("Extract the value proposition from the page.");
  console.log(`Extract result:\n`, extractResult);

  const actResult = await page.act("Click the 'Evals' button.");
  console.log(`Act result:\n`, actResult);

  const observeResult = await page.observe("What can I click on this page?");
  console.log(`Observe result:\n`, observeResult);

  const agent = await stagehand.agent({
    instructions: "You're a helpful assistant that can control a web browser.",
  });

  const agentResult = await agent.execute("What is the most accurate model to use in Stagehand?");
  console.log(`Agent result:\n`, agentResult);

  await stagehand.close();
}

main().catch((err) => {
  console.error(err);
  process.exit(1);
});

```
</CodeGroup>

<Tip>
To use, set provider keys in `.env` (e.g., `OPENAI_API_KEY`). For cloud browsers, add `BROWSERBASE_API_KEY` and `BROWSERBASE_PROJECT_ID`.
</Tip>

## Next steps

Learn about the Stagehand primitives: act, extract, observe, and agent.

<CardGroup cols={2}>
  <Card 
    title="Act" 
    icon="arrow-pointer" 
    href="/v2/basics/act"
  >
    Perform actions on web pages with natural language
  </Card>
  
  <Card 
    title="Extract" 
    icon="download" 
    href="/v2/basics/extract"
  >
    Get structured data with Zod schemas
  </Card>
  
  <Card 
    title="Observe" 
    icon="eye" 
    href="/v2/basics/observe"
  >
    Discover available elements and actions
  </Card>
  
  <Card 
    title="Agent" 
    icon="robot" 
    href="/v2/basics/agent"
  >
    Autonomous multi-step browser workflows
  </Card>
</CardGroup>


================================================
FILE: packages/docs/v2/integrations/crew-ai/configuration.mdx
================================================
---
title: "Use CrewAI to Automate Browser Tasks"
sidebarTitle: Configuration
description: "Create intelligent agents that can interact with websites and automate browser tasks using natural language instructions"
---

This guide walks you through setting up CrewAI with Browserbase to create agents that can perform web automation tasks using natural language instructions.

## Step 1: Install Dependencies

Install the required packages for CrewAI and Stagehand integration:

```bash
pip install stagehand-py crewai crewai-tools
```

## Step 2: Configure Environment Variables

You'll need API keys from two services:

1. **Browserbase API Key and Project ID**: Get these from your [Browserbase dashboard](https://www.browserbase.com/)
2. **LLM API Key**: Get an API key from [OpenAI](https://platform.openai.com/api-keys) or [Anthropic](https://console.anthropic.com/)

Store your API keys securely as environment variables:

```bash
BROWSERBASE_API_KEY="your-browserbase-api-key"
BROWSERBASE_PROJECT_ID="your-browserbase-project-id"
OPENAI_API_KEY="your-openai-api-key"
ANTHROPIC_API_KEY="your-anthropic-api-key"
```

## Step 3: Create Your First Agent

Create a Python script with a basic CrewAI agent:

```python
import os
from crewai import Agent, Task, Crew
from crewai_tools import StagehandTool
from stagehand.schemas import AvailableModel

# Get API keys from environment
browserbase_api_key = os.environ.get("BROWSERBASE_API_KEY")
browserbase_project_id = os.environ.get("BROWSERBASE_PROJECT_ID")
model_api_key = os.environ.get("OPENAI_API_KEY")  # or ANTHROPIC_API_KEY

# Initialize the StagehandTool
stagehand_tool = StagehandTool(
    api_key=browserbase_api_key,
    project_id=browserbase_project_id,
    model_api_key=model_api_key,
    model_name=AvailableModel.GPT_4O,  # or AvailableModel.CLAUDE_3_7_SONNET_LATEST
)

# Create an agent with the tool
researcher = Agent(
    role="Web Researcher",
    goal="Find and summarize information from websites",
    backstory="I'm an expert at finding information online.",
    verbose=True,
    tools=[stagehand_tool],
)
```

## Step 4: Create and Run a Task

Define a task for your agent and execute it:

```python
# Create a task that uses the tool
research_task = Task(
    description="Go to https://www.example.com and tell me what you see on the homepage.",
    agent=researcher,
)

# Run the crew
crew = Crew(
    agents=[researcher],
    tasks=[research_task],
    verbose=True,
)

try:
    result = crew.kickoff()
    print(result)
finally:
    # Clean up resources
    stagehand_tool.close()
```

## Step 5: Run Your Script

Execute your Python script:

```bash
python your_crew_script.py
```

## Advanced Configuration

Customize the StagehandTool behavior with additional parameters:

```python
stagehand_tool = StagehandTool(
    api_key=browserbase_api_key,
    project_id=browserbase_project_id, 
    model_api_key=model_api_key,
    model_name=AvailableModel.CLAUDE_3_7_SONNET_LATEST,
    dom_settle_timeout_ms=5000,  # Wait longer for DOM to settle
    headless=True,  # Run browser in headless mode
    self_heal=True,  # Attempt to recover from errors
    wait_for_captcha_solves=True,  # Wait for CAPTCHA solving
    verbose=1,  # Control logging verbosity (0-3)
)
```

## Example Tasks

<Tabs>
  <Tab title="Form Submission" value="form-submission" label="Python">
    ```python
    form_task = Task(
        description="""
        Submit a contact form:
        1. Go to https://example.com/contact
        2. Fill out the form with name 'John Doe', email 'john@example.com'
        3. Submit and confirm success
        """,
        agent=researcher,
    )
    ```
  </Tab>
  <Tab title="Data Extraction" value="data-extraction" label="Python">
    ```python
    extraction_task = Task(
        description="""
        Extract product information:
        1. Go to the products page
        2. Extract all product names, prices, and descriptions
        3. Format as structured data
        """,
        agent=researcher,
    )
    ```
  </Tab>
  <Tab title="Multi-step Navigation" value="multi-step-navigation" label="Python">
    ```python
    navigation_task = Task(
        description="""
        Navigate and analyze:
        1. Start at homepage
        2. Navigate to products section  
        3. Filter by 'Electronics' category
        4. Find and extract details of highest-rated product
        """,
        agent=researcher,
    )
    ```
  </Tab>
</Tabs>

<CardGroup cols={2}>
  <Card title="CrewAI Documentation" icon="book" href="https://docs.crewai.com/">
    Dive into the CrewAI documentation to learn more about its capabilities and integrations.
  </Card>
  <Card title="Browserbase Documentation" icon="book" href="https://docs.browserbase.com/">
    Access the Browserbase documentation for comprehensive guides and resources.
  </Card>
</CardGroup>

================================================
FILE: packages/docs/v2/integrations/crew-ai/introduction.mdx
================================================
---
title: "CrewAI Introduction"
sidebarTitle: Introduction
description: "Automate browser tasks using natural language instructions with CrewAI"
---

## Overview

This guide shows you how to use CrewAI with Browserbase to create intelligent agents that can automate web interactions. By the end of this guide, you'll know how to:

- Set up CrewAI with the StagehandTool
- Create agents that can interact with websites
- Automate browser tasks using natural language instructions
- Extract structured data from web pages

## When You'd Use This

The CrewAI integration is perfect for scenarios where you need intelligent web automation:

- **Research automation**: Have agents research information across multiple websites
- **Data collection**: Extract structured data from e-commerce sites, job boards, or news sites
- **Form automation**: Automatically fill out and submit forms based on specific criteria
- **Multi-step workflows**: Execute complex browser workflows that require decision-making

The StagehandTool wraps the Stagehand Python SDK to provide CrewAI agents with the ability to control a real web browser and interact with websites using three core primitives:

1. **Act**: Perform actions like clicking, typing, or navigating
2. **Extract**: Extract structured data from web pages
3. **Observe**: Identify and analyze elements on the page

<CardGroup cols={1}>
<Card title="CrewAI Configuration" icon="gear" href="/v2/integrations/crew-ai/configuration">
  Learn how to configure and use the StagehandTool with CrewAI agents for web automation tasks
</Card>
</CardGroup>

================================================
FILE: packages/docs/v2/integrations/langchain/configuration.mdx
================================================
---
title: "LangChain JS Configuration"
sidebarTitle: Configuration
description: "Set up Stagehand with LangChain JS to create intelligent web automation agents"
---

This guide walks you through integrating Stagehand with LangChain JS to build powerful web automation workflows using natural language instructions.

## Step 1: Install Dependencies

Install the required packages for LangChain JS and Stagehand integration:

```bash
npm install @langchain/langgraph @langchain/community @langchain/core @browserbasehq/stagehand
```

## Step 2: Configure Environment Variables

For remote browser automation, set up your Browserbase credentials:

```bash
BROWSERBASE_API_KEY="your-browserbase-api-key"
BROWSERBASE_PROJECT_ID="your-browserbase-project-id"
```

## Step 3: Create a Stagehand Instance

Initialize Stagehand with your preferred configuration:

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

// For local development
const stagehand = new Stagehand({
    env: "LOCAL",
    verbose: 2,
    enableCaching: false,
});

// For production with Browserbase
const stagehand = new Stagehand({
    env: "BROWSERBASE",
    verbose: 1,
    enableCaching: true,
});
```

## Step 4: Generate the StagehandToolkit

Create the toolkit that provides LangChain-compatible tools:

```typescript
import { StagehandToolkit } from '@langchain/community/agents/toolkits/stagehand';

const stagehandToolkit = await StagehandToolkit.fromStagehand(stagehand);
```

## Step 5: Use Individual Tools

The toolkit provides four specialized tools for web automation:

### Available Tools

- **stagehand_navigate**: Navigate to specific URLs
- **stagehand_act**: Perform browser actions (clicking, typing, etc.)
- **stagehand_extract**: Extract structured data using schemas  
- **stagehand_observe**: Analyze page elements and possible actions

### Basic Tool Usage

```typescript
import { z } from "zod";

// Navigate to a website
const navigateTool = stagehandToolkit.tools.find(
    (t) => t.name === "stagehand_navigate"
);
await navigateTool.invoke("https://www.google.com");

// Perform an action
const actionTool = stagehandToolkit.tools.find(
    (t) => t.name === "stagehand_act"
);
await actionTool.invoke('Search for "OpenAI"');

// Observe the page
const observeTool = stagehandToolkit.tools.find(
    (t) => t.name === "stagehand_observe"
);
const result = await observeTool.invoke(
    "What actions can be performed on the current page?"
);
console.log(JSON.parse(result));

// Extract structured data
const extractTool = stagehandToolkit.tools.find(
    (t) => t.name === "stagehand_extract"
);
const extractResult = await extractTool.invoke({
    instruction: "Extract the main heading and description",
    schema: z.object({
        heading: z.string(),
        description: z.string(),
    }),
});
console.log(extractResult);
```

## Step 6: Build LangGraph Agents

Integrate with LangGraph for complex automation workflows:

```typescript
import { createReactAgent } from "@langchain/langgraph/prebuilt";
import { ChatOpenAI } from "@langchain/openai";

// Create an LLM
const llm = new ChatOpenAI({
    model: "gpt-4",
    temperature: 0,
});

// Create an agent with Stagehand tools
const agent = createReactAgent({
    llm,
    tools: stagehandToolkit.tools,
});

// Execute a complex workflow
const result = await agent.invoke({
    messages: [
        {
            role: "user", 
            content: "Go to example.com, find the contact form, and extract all the form fields"
        }
    ]
});
```

## Advanced Configuration

### Custom Stagehand Configuration

```typescript
const stagehand = new Stagehand({
    env: "BROWSERBASE",
    verbose: 2,
    enableCaching: true,
    headless: true,
    domSettleTimeoutMs: 5000,
});
```

### Error Handling

```typescript
try {
    const result = await agent.invoke({
        messages: [{ role: "user", content: "Navigate to invalid-url.com" }]
    });
} catch (error) {
    console.error("Automation failed:", error);
} finally {
    // Clean up resources
    await stagehand.close();
}
```

## Example Workflows

<Tabs>
  <Tab title="Data Extraction" value="data-extraction" label="TypeScript">
    ```typescript
    const extractionAgent = createReactAgent({
        llm,
        tools: stagehandToolkit.tools,
    });

    const result = await extractionAgent.invoke({
        messages: [{
            role: "user",
            content: `
                Go to news-website.com and extract:
                1. All article headlines
                2. Publication dates  
                3. Author names
                Format as structured JSON
            `
        }]
    });
    ```
  </Tab>
  <Tab title="Form Automation" value="form-automation" label="TypeScript">
    ```typescript
    const formAgent = createReactAgent({
        llm,
        tools: stagehandToolkit.tools,
    });

    const result = await formAgent.invoke({
        messages: [{
            role: "user", 
            content: `
                Navigate to contact-form.com and:
                1. Fill out the contact form with:
                   - Name: John Doe
                   - Email: john@example.com
                   - Message: Inquiry about services
                2. Submit the form
                3. Confirm submission success
            `
        }]
    });
    ```
  </Tab>
  <Tab title="Multi-site Research" value="multi-site-research" label="TypeScript">
    ```typescript
    const researchAgent = createReactAgent({
        llm,
        tools: stagehandToolkit.tools,
    });

    const result = await researchAgent.invoke({
        messages: [{
            role: "user",
            content: `
                Research product pricing by:
                1. Visit competitor1.com and extract pricing info
                2. Visit competitor2.com and extract pricing info  
                3. Compare features and prices
                4. Provide summary analysis
            `
        }]
    });
    ```
  </Tab>
</Tabs>

<CardGroup cols={1}>
  <Card title="LangChain JS Documentation" icon="book" href="https://js.langchain.com/docs/integrations/tools/stagehand/">
    Official LangChain JS documentation for the Stagehand integration
  </Card>
</CardGroup>

================================================
FILE: packages/docs/v2/integrations/langchain/introduction.mdx
================================================
---
title: "LangChain JS Introduction"
sidebarTitle: Introduction
description: "Integrate Stagehand with LangChain JS for intelligent web automation"
---

## Overview

This guide shows you how to use Stagehand with LangChain JS to create intelligent agents that can automate web interactions. By the end of this guide, you'll know how to:

- Set up the StagehandToolkit with LangChain JS
- Create agents that can navigate and interact with websites
- Extract structured data using natural language instructions
- Build complex automation workflows with LangGraph

## When You'd Use This

The LangChain JS integration is perfect for scenarios where you need intelligent web automation with advanced reasoning:

- **AI-driven research**: Create agents that can research information across multiple websites and synthesize findings
- **Dynamic form filling**: Automatically fill out complex forms based on contextual requirements
- **Data extraction workflows**: Extract and transform data from multiple sources with intelligent navigation
- **Multi-step web processes**: Execute complex browser workflows that require decision-making and adaptation

<CardGroup cols={1}>
<Card title="LangChain JS Configuration" icon="gear" href="/integrations/langchain/configuration">
  Learn how to set up and configure the StagehandToolkit with LangChain JS agents
</Card>
</CardGroup>

================================================
FILE: packages/docs/v2/integrations/mcp/configuration.mdx
================================================
---
title: "Browserbase MCP Server Configuration"
sidebarTitle: "Configuration"
description: "Configure your browser automation with command-line flags, environment variables, and advanced options"
---

## Configuration Overview

The Browserbase MCP server supports extensive configuration options through command-line flags and environment variables. Configure browser behavior, proxy settings, stealth modes, model selection, and more to customize your browser automation workflows.

<Note>
Command-line flags are only available when running the server locally (`npx @browserbasehq/mcp-server-browserbase` with flags or local development setup).
</Note>

## Environment Variables

Configure the essential Browserbase credentials below. The optional `DEBUG` variable is shown under [Development Configuration](#development-configuration).

<CardGroup cols={2}>
<Card title="BROWSERBASE_API_KEY" icon="key">
Your Browserbase API key for authentication
</Card>

<Card title="BROWSERBASE_PROJECT_ID" icon="key">
Your Browserbase project ID
</Card>

</CardGroup>

## Command-Line Flags

### Available Flags

| Flag | Description |
|------|-------------|
| `--proxies` | Enable Browserbase proxies for the session |
| `--advancedStealth` | Enable Browserbase Advanced Stealth (Scale Plan only) |
| `--keepAlive` | Enable Browserbase Keep Alive Session |
| `--contextId <contextId>` | Specify a Browserbase Context ID to use |
| `--persist [boolean]` | Whether to persist the Browserbase context (default: true) |
| `--port <port>` | Port to listen on for HTTP/SHTTP transport |
| `--host <host>` | Host to bind server to (default: localhost, use 0.0.0.0 for all interfaces) |
| `--cookies [json]` | JSON array of cookies to inject into the browser |
| `--browserWidth <width>` | Browser viewport width (default: 1024) |
| `--browserHeight <height>` | Browser viewport height (default: 768) |
| `--modelName <model>` | The model to use for Stagehand (default: google/gemini-2.5-flash-lite) |
| `--modelApiKey <key>` | API key for the custom model provider (required when using custom models) |
| `--experimental` | Enable experimental features (default: false) |

## Configuration Examples

### Basic Configuration

<Tabs>
<Tab title="Remote URL (SHTTP)">


<CodeGroup>
```json Direct SHTTP
{
  "mcpServers": {
    "browserbase": {
      "url": "your-smithery-url.com"
    }
  }
}
```
</CodeGroup>

When using our remote hosted server, we cover the LLM costs for Gemini, the [best performing model](https://www.stagehand.dev/evals) in [Stagehand](https://www.stagehand.dev).
</Tab>

<Tab title="NPM Package">

```json
{
  "mcpServers": {
    "browserbase": {
      "command": "npx",
      "args": ["@browserbasehq/mcp-server-browserbase"],
      "env": {
        "BROWSERBASE_API_KEY": "your_api_key",
        "BROWSERBASE_PROJECT_ID": "your_project_id",
        "GEMINI_API_KEY": "your_gemini_api_key"
      }
    }
  }
}
```
</Tab>

<Tab title="Local STDIO">
```json
{
  "mcpServers": {
    "browserbase": {
      "command": "node",
      "args": ["/path/to/mcp-server-browserbase/cli.js"],
      "env": {
        "BROWSERBASE_API_KEY": "your_api_key",
        "BROWSERBASE_PROJECT_ID": "your_project_id",
        "GEMINI_API_KEY": "your_gemini_api_key"
      }
    }
  }
}
```
</Tab>

<Tab title="Local SHTTP">
```bash
# Start server
node cli.js --port 8931
```

```json
{
  "mcpServers": {
    "browserbase": {
      "url": "http://localhost:8931/mcp",
      "env": {
        "BROWSERBASE_API_KEY": "your_api_key",
        "BROWSERBASE_PROJECT_ID": "your_project_id",
        "GEMINI_API_KEY": "your_gemini_api_key"
      }
    }
  }
}
```
</Tab>
</Tabs>

### Advanced Features

<Tabs>
<Tab title="Proxies">
Enable Browserbase proxies for IP rotation and geo-location testing.

<Panel>
[Learn more about Browserbase Proxies](https://docs.browserbase.com/features/proxies)
</Panel>

```json
{
  "mcpServers": {
    "browserbase": {
      "command": "npx",
      "args": ["@browserbasehq/mcp-server-browserbase", "--proxies"],
      "env": {
        "BROWSERBASE_API_KEY": "your_api_key",
        "BROWSERBASE_PROJECT_ID": "your_project_id",
        "GEMINI_API_KEY": "your_gemini_api_key"
      }
    }
  }
}
```
</Tab>

<Tab title="Advanced Stealth">
Enable advanced anti-detection features for enhanced stealth browsing.

<Panel>
[Learn more about Advanced Stealth](https://docs.browserbase.com/features/stealth-mode#advanced-stealth-mode)

**Note:** Advanced Stealth is only available for Scale Plan users.
</Panel>

```json
{
  "mcpServers": {
    "browserbase": {
      "command": "npx",
      "args": ["@browserbasehq/mcp-server-browserbase", "--advancedStealth"],
      "env": {
        "BROWSERBASE_API_KEY": "your_api_key",
        "BROWSERBASE_PROJECT_ID": "your_project_id",
        "GEMINI_API_KEY": "your_gemini_api_key"
      }
    }
  }
}
```
</Tab>

<Tab title="Contexts">
Use persistent browser contexts to maintain authentication and state across sessions.

<Panel>
[Learn more about Browserbase Contexts](https://docs.browserbase.com/features/contexts)
</Panel>

```json
{
  "mcpServers": {
    "browserbase": {
      "command": "npx",
      "args": ["@browserbasehq/mcp-server-browserbase", "--contextId", "your_context_id"],
      "env": {
        "BROWSERBASE_API_KEY": "your_api_key",
        "BROWSERBASE_PROJECT_ID": "your_project_id"
      }
    }
  }
}
```
</Tab>
</Tabs>

### Browser Customization

<Tabs>
<Tab title="Viewport Sizing">
Customize browser window dimensions. Default is 1024x768. Recommended aspect ratio: 16:9.

```json
{
  "mcpServers": {
    "browserbase": {
      "command": "npx",
      "args": [
        "@browserbasehq/mcp-server-browserbase",
        "--browserWidth", "1920",
        "--browserHeight", "1080"
      ],
      "env": {
        "BROWSERBASE_API_KEY": "your_api_key",
        "BROWSERBASE_PROJECT_ID": "your_project_id",
        "GEMINI_API_KEY": "your_gemini_api_key"
      }
    }
  }
}
```

**Common Resolutions:**
- Desktop: 1920x1080, 1280x720, 1024x768
- Mobile: 375x667 (iPhone), 360x640 (Android)
- Tablet: 768x1024 (iPad)
</Tab>

<Tab title="Cookie Injection">
Inject session cookies for authentication. Useful when persistent contexts don't handle session cookies.

<Panel>
Cookies must be in [Playwright Cookie format](https://playwright.dev/docs/api/class-browsercontext#browser-context-cookies).
</Panel>

```json
{
  "mcpServers": {
    "browserbase": {
      "command": "npx",
      "args": [
        "@browserbasehq/mcp-server-browserbase",
        "--cookies",
        "[{\"name\": \"session\", \"value\": \"abc123\", \"domain\": \".example.com\", \"path\": \"/\", \"httpOnly\": true, \"secure\": true}]"
      ],
      "env": {
        "BROWSERBASE_API_KEY": "your_api_key",
        "BROWSERBASE_PROJECT_ID": "your_project_id",
        "GEMINI_API_KEY": "your_gemini_api_key"
      }
    }
  }
}
```
</Tab>
</Tabs>

## Model Configuration

Configure AI models for enhanced browser automation. Stagehand defaults to Google's Gemini 2.5 Flash Lite but supports multiple providers.

<Warning>
When using any custom model (non-default), you must provide your own API key for that model provider using the `--modelApiKey` flag.
</Warning>

<Tabs>
<Tab title="Available Models">
**Google Gemini** (Default)
- `google/gemini-2.5-flash-lite` (default)
- `google/gemini-1.5-pro`
- `google/gemini-1.5-flash`

**OpenAI**
- `openai/gpt-4o`
- `openai/gpt-4o-mini`
- `openai/o1-mini`
- `openai/o1-preview`
- `openai/o3-mini`

**Anthropic Claude**
- `anthropic/claude-sonnet-4-6`
- `anthropic/claude-sonnet-4-5-20250929`

[View full list of supported models](https://docs.stagehand.dev/examples/custom_llms#supported-llms)
</Tab>

<Tab title="Configuration Examples">
<CodeGroup>
```json OpenAI GPT-4o
{
  "mcpServers": {
    "browserbase": {
      "command": "npx",
      "args": [
        "@browserbasehq/mcp-server-browserbase",
        "--modelName", "openai/gpt-4o",
        "--modelApiKey", "your_openai_api_key"
      ],
      "env": {
        "BROWSERBASE_API_KEY": "your_api_key",
        "BROWSERBASE_PROJECT_ID": "your_project_id"
      }
    }
  }
}
```

```json Claude Sonnet
{
  "mcpServers": {
    "browserbase": {
      "command": "npx",
      "args": [
        "@browserbasehq/mcp-server-browserbase",
        "--modelName", "anthropic/claude-sonnet-4-6",
        "--modelApiKey", "your_anthropic_api_key"
      ],
      "env": {
        "BROWSERBASE_API_KEY": "your_api_key",
        "BROWSERBASE_PROJECT_ID": "your_project_id"
      }
    }
  }
}
```
</CodeGroup>
</Tab>
</Tabs>

## Development Configuration

<Tabs>
<Tab title="Debug Mode">
Enable detailed logging for troubleshooting and development.

```json
{
  "mcpServers": {
    "browserbase": {
      "command": "npx",
      "args": ["@browserbasehq/mcp-server-browserbase"],
      "env": {
        "BROWSERBASE_API_KEY": "your_api_key",
        "BROWSERBASE_PROJECT_ID": "your_project_id",
        "GEMINI_API_KEY": "your_gemini_api_key",
        "DEBUG": "true"
      }
    }
  }
}
```
</Tab>

<Tab title="Custom Host/Port">
Configure custom host and port for SHTTP transport.

```json
{
  "mcpServers": {
    "browserbase": {
      "command": "npx",
      "args": [
        "@browserbasehq/mcp-server-browserbase",
        "--host", "0.0.0.0",
        "--port", "8080"
      ],
      "env": {
        "BROWSERBASE_API_KEY": "your_api_key",
        "BROWSERBASE_PROJECT_ID": "your_project_id",
        "GEMINI_API_KEY": "your_gemini_api_key"
      }
    }
  }
}
```
</Tab>
</Tabs>

## Best Practices

<Accordion title="Performance - How can I optimize browser automation performance?">
- Use appropriate viewport sizes for your use case
- Enable proxies only when needed for geo-location
- Choose efficient models (Gemini Flash for speed, GPT-4o for accuracy)
- Reuse contexts for authentication persistence
</Accordion>

<Accordion title="Security - What security measures should I implement?">
- Store API keys securely in environment variables
- Use Advanced Stealth for sensitive operations
- Implement proper session management
- Rotate cookies and contexts regularly
</Accordion>

<Accordion title="Development - What are the recommended development practices?">
- Enable debug mode during development
- Use context persistence for faster iteration
- Test with different viewport sizes
- Monitor session usage and quotas
</Accordion>

<Accordion title="Production - How should I configure for production environments?">
- Use NPM installation for reliability
- Configure appropriate timeouts
- Implement error handling and retries
- Monitor performance and resource usage
</Accordion>

## Further Reading

<CardGroup cols={3}>
<Card title="Browserbase Documentation" icon="globe" href="https://docs.browserbase.com">
Complete platform documentation
</Card>

<Card title="Stagehand Docs" icon="robot" href="https://docs.stagehand.dev/">
AI-powered browser automation
</Card>

<Card title="Support" icon="headset" href="mailto:support@browserbase.com">
Get help from our team
</Card>
</CardGroup>


================================================
FILE: packages/docs/v2/integrations/mcp/introduction.mdx
================================================
---
title: "Browserbase MCP Server"
sidebarTitle: "Introduction"
description: "AI-powered browser automation through Model Context Protocol integration with Stagehand"
---

## Overview

The Browserbase MCP Server brings powerful browser automation capabilities to MCP clients through the Model Context Protocol (MCP). Built on top of [Stagehand](https://docs.stagehand.dev/), this integration provides AI-powered web automation using natural language commands.

<Info>
  The hosted [Streamable HTTP](https://modelcontextprotocol.io/specification/2025-03-26/basic/transports#streamable-http)
  endpoint is served on Browserbase infrastructure.
  You can also run the MCP server locally with STDIO, but we recommend the
  hosted [Streamable HTTP](https://modelcontextprotocol.io/specification/2025-03-26/basic/transports#streamable-http)
  endpoint for most users.
</Info>

## Key Features

<CardGroup cols={2}>
<Card title="Natural Language Automation" icon="wand-magic-sparkles">
Control browsers using plain English commands like "click the login button" or "fill out the contact form"
</Card>

<Card title="Web Interaction" icon="browser">
  Navigate, click, and fill forms with ease
</Card>

<Card title="Data Extraction" icon="download">
  Extract structured data from any website automatically
</Card>

<Card title="Session Lifecycle" icon="route">
  Create, reuse, and close browser sessions with explicit MCP tools
</Card>

</CardGroup>

## Core Benefits

<Tabs>
<Tab title="Ease of Use">
<CardGroup cols={2}>
<Card title="Intuitive Commands" icon="wand-magic-sparkles">
No need to learn complex selectors or automation syntax. Simply describe what you want to do in natural language.
</Card>

<Card title="Quick Setup" icon="rocket">
  Get started in minutes with either hosted [Streamable HTTP](https://modelcontextprotocol.io/specification/2025-03-26/basic/transports#streamable-http) or local STDIO.
</Card>

<Card title="Smart Automation" icon="brain">
Stagehand's AI understands web page context and can adapt to different layouts and designs.
</Card>
</CardGroup>
</Tab>

<Tab title="Powerful Capabilities">
<CardGroup cols={2}>
<Card title="Full Browser Control" icon="browser">
Navigate, click, type, scroll, and interact with any web element.
</Card>

<Card title="Data Intelligence" icon="chart-line">
  Extract structured information from complex web pages automatically.
</Card>

<Card title="Session Persistence" icon="cookie-bite">
Maintain authentication states and cookies across multiple interactions.
</Card>
</CardGroup>
</Tab>

<Tab title="Enterprise Ready">
<CardGroup cols={2}>
<Card title="Reliable Infrastructure" icon="server">
Hosted [Streamable HTTP](https://modelcontextprotocol.io/specification/2025-03-26/basic/transports#streamable-http) runs on Browserbase infrastructure for consistent performance.
</Card>

<Card title="Scalable Architecture" icon="arrows-up-to-line">
  Handle multiple concurrent sessions and high-volume automation tasks.
</Card>

<Card title="Security Features" icon="shield-check">
  Stealth mode, proxy support, and advanced anti-detection capabilities.
</Card>

<Card title="Comprehensive Logging" icon="file-lines">
Detailed session recordings and debugging information.
</Card>
</CardGroup>
</Tab>
</Tabs>

## Use Cases

<Tabs>
<Tab title="Web Scraping & Data Collection">
<CardGroup cols={2}>
<Card title="E-commerce Monitoring" icon="store">
Track product prices, availability, and competitor information
</Card>

<Card title="Market Research" icon="chart-bar">
  Gather data from multiple sources for analysis and reporting
</Card>

<Card title="Content Aggregation" icon="newspaper">
  Collect articles, posts, and media from various websites
</Card>

<Card title="Lead Generation" icon="users">
Extract contact information and business data from directories
</Card>
</CardGroup>
</Tab>

<Tab title="Testing">
<CardGroup cols={2}>
<Card title="Automated Testing" icon="flask">
Create comprehensive test suites for web applications
</Card>

<Card title="Cross-Browser Validation" icon="browsers">
  Test functionality across different browser environments
</Card>

<Card title="User Journey Testing" icon="route">
  Simulate real user interactions and workflows
</Card>

<Card title="Performance Monitoring" icon="gauge">
Track page load times and user experience metrics
</Card>
</CardGroup>
</Tab>

<Tab title="Workflow Automation">
<CardGroup cols={2}>
<Card title="Form Automation" icon="file-contract">
Automatically fill and submit complex web forms
</Card>

<Card title="Report Generation" icon="chart-line">
  Extract data and generate automated reports
</Card>

<Card title="Social Media Management" icon="share-nodes">
  Schedule posts and monitor engagement across platforms
</Card>

<Card title="Administrative Tasks" icon="clipboard-check">
Automate repetitive web-based business processes
</Card>
</CardGroup>
</Tab>
</Tabs>

## Getting Started

<Steps>
<Step title="Install the MCP Server">
Choose hosted [Streamable HTTP](https://modelcontextprotocol.io/specification/2025-03-26/basic/transports#streamable-http) (recommended) or local STDIO based on your needs.
</Step>

<Step title="Configure Authentication">
  Set up your Browserbase API credentials in MCP configuration. Get API keys
  from the [Browserbase Dashboard](https://www.browserbase.com/overview).
</Step>

<Step title="Start Automating">
Begin using natural language commands to control browsers through your MCP client.
</Step>
</Steps>

<Tip>
  Ready to get started? Check out the [Setup Guide](/v2/integrations/mcp/setup).
</Tip>

## Further Reading

<CardGroup cols={3}>
<Card title="Setup Guide" icon="rocket" href="/v2/integrations/mcp/setup">
Get started with installation and configuration
</Card>

<Card title="MCP Docs" icon="book" href="https://modelcontextprotocol.io/introduction">
Learn more about the MCP protocol
</Card>

<Card title="Browserbase Docs" icon="globe" href="https://docs.browserbase.com">
Explore Browserbase features and capabilities
</Card>
</CardGroup>


================================================
FILE: packages/docs/v2/integrations/mcp/setup.mdx
================================================
---
title: "Browserbase MCP Server Setup"
sidebarTitle: "Setup"
description: "Add the Browserbase MCP Server to your MCP client"
---

## Quick Installation

<Card title="Install with Cursor" icon="arrow-pointer" href="cursor://anysphere.cursor-deeplink/mcp/install?name=browserbase&config=eyJ1cmwiOiJodHRwczovL21jcC5icm93c2VyYmFzZS5jb20vbWNwP2Jyb3dzZXJiYXNlQXBpS2V5PVlPVVJfQlJPV1NFUkJBU0VfQVBJX0tFWSJ9">
  One-click installation directly in Cursor
</Card>

You can also add Browserbase MCP to Claude Code with a single command:

```bash
claude mcp add --transport http browserbase "https://mcp.browserbase.com/mcp?browserbaseApiKey=YOUR_BROWSERBASE_API_KEY"
```

We support both local STDIO and hosted [Streamable HTTP](https://modelcontextprotocol.io/specification/2025-03-26/basic/transports#streamable-http) (SHTTP). We recommend hosted [Streamable HTTP](https://modelcontextprotocol.io/specification/2025-03-26/basic/transports#streamable-http) for most users.

## Endpoint

Hosted [Streamable HTTP](https://modelcontextprotocol.io/specification/2025-03-26/basic/transports#streamable-http) endpoint (served on Browserbase infrastructure):

```text
https://mcp.browserbase.com/mcp
```

## Prerequisites

<Steps>
<Step title="Get your Browserbase credentials">
Get your Browserbase API key from the [Browserbase Dashboard](https://www.browserbase.com/overview).

<Frame>
<img src="/images/quickstart/api-key.png" alt="Browserbase API Key settings" />
</Frame>

Then copy your API Key directly from the input.
</Step>
</Steps>

## Query Parameters (Hosted [Streamable HTTP](https://modelcontextprotocol.io/specification/2025-03-26/basic/transports#streamable-http))

### Required for tool calls

<CardGroup cols={1}>
<Card title="browserbaseApiKey" icon="key">
Browserbase API key.
</Card>
</CardGroup>

### Optional

| Query Param       | Type           | Behavior                                   |
| ----------------- | -------------- | ------------------------------------------ |
| `modelName`       | string         | Defaults to `google/gemini-2.5-flash-lite` |
| `modelApiKey`     | string         | Required when `modelName` is non-default   |
| `keepAlive`       | boolean string | `"true"` or `"false"`                      |
| `proxies`         | boolean string | `"true"` or `"false"`                      |
| `advancedStealth` | boolean string | `"true"` or `"false"`                      |

<Warning>
  Boolean query values must be exact strings: `"true"` or `"false"`.
</Warning>

## Available Tools

<Accordion title="navigate">
Navigate to any URL in the browser

<ParamField path="url" type="string" required>
  The URL to navigate to
</ParamField>
</Accordion>

<Accordion title="act">
Perform an action on the web page using natural language

<ParamField path="action" type="string" required>
  The action to perform (e.g., "click the login button", "fill form field")
</ParamField>
</Accordion>

<Accordion title="observe">
Observe and find actionable elements on the page.

<ParamField path="instruction" type="string" required>
  Specific instruction for observation (e.g., "find the login button", "locate search form")
</ParamField>
</Accordion>

<Accordion title="extract">
Extract data from the current page.

<ParamField path="instruction" type="string">
Optional extraction instruction.
</ParamField>
</Accordion>

<Accordion title="start">
Create or reuse a Browserbase session and set it as active for the current MCP transport session.

<Info>No input parameters required.</Info>

<ResponseField name="sessionId" type="string">
Browserbase session ID.
</ResponseField>
</Accordion>

<Accordion title="end">
Close the active Browserbase session for the current MCP transport session.

<Info>No input parameters required.</Info>
</Accordion>

## Local Command-Line Flags

<Note>
Command-line flags are only available when running the server locally (`npx @browserbasehq/mcp-server-browserbase` with flags or local development setup).
</Note>

| Flag | Description |
|------|-------------|
| `--proxies` | Enable Browserbase proxies for the session |
| `--advancedStealth` | Enable Browserbase Advanced Stealth (Scale Plan only) |
| `--keepAlive` | Enable Browserbase Keep Alive Session |
| `--contextId <contextId>` | Specify a Browserbase Context ID to use |
| `--persist [boolean]` | Whether to persist the Browserbase context (default: true) |
| `--port <port>` | Port to listen on for HTTP or [Streamable HTTP](https://modelcontextprotocol.io/specification/2025-03-26/basic/transports#streamable-http) transport |
| `--host <host>` | Host to bind server to (default: localhost, use 0.0.0.0 for all interfaces) |
| `--browserWidth <width>` | Browser viewport width (default: 1024) |
| `--browserHeight <height>` | Browser viewport height (default: 768) |
| `--modelName <model>` | The model to use for Stagehand (default: google/gemini-2.5-flash-lite) |
| `--modelApiKey <key>` | API key for the custom model provider (required when using custom models) |
| `--experimental` | Enable experimental features (default: false) |

## Installation Methods

<Tabs>
<Tab title="Hosted (recommended)">

Use your MCP client config:

```json
{
  "mcpServers": {
    "browserbase": {
      "url": "https://mcp.browserbase.com/mcp?browserbaseApiKey=YOUR_BROWSERBASE_API_KEY"
    }
  }
}
```

For custom models, include `modelName` and `modelApiKey`:

```json
{
  "mcpServers": {
    "browserbase": {
      "url": "https://mcp.browserbase.com/mcp?browserbaseApiKey=YOUR_BROWSERBASE_API_KEY&modelName=openai/gpt-4.1&modelApiKey=YOUR_MODEL_API_KEY"
    }
  }
}
```

</Tab>

<Tab title="NPM Package (STDIO)">
The easiest way to get started locally is using our NPM package.

<Note>
If you would like to use a different model, you have to pass the model name and keys in the args. More info in the [Local Command-Line Flags](#local-command-line-flags) section.
</Note>

<Steps>
<Step title="Add to MCP Config">
Go into your MCP Config JSON and add the Browserbase Server:

<CodeGroup>
```json Claude Desktop
{
  "mcpServers": {
    "browserbase": {
      "command": "npx",
      "args": ["@browserbasehq/mcp-server-browserbase"],
      "env": {
        "BROWSERBASE_API_KEY": "your_api_key",
        "GEMINI_API_KEY": "your_gemini_api_key"
      }
    }
  }
}
```
</CodeGroup>
</Step>

<Step title="Restart your MCP client">
<Check>
That's it! Reload your MCP client and you will be able to use Browserbase.
</Check>
</Step>
</Steps>

</Tab>

<Tab title="Local Development">
For local development or customization, you can run the server locally.

<Steps>
<Step title="Clone and build">
```bash
# Clone the Repo
git clone https://github.com/browserbase/mcp-server-browserbase.git
cd mcp-server-browserbase

# Install the dependencies and build the project
npm install && npm run build
```
</Step>

<Step title="Choose your transport method">
You can run locally using either STDIO or [Streamable HTTP](https://modelcontextprotocol.io/specification/2025-03-26/basic/transports#streamable-http).

<Tabs>
<Tab title="STDIO">
Add the following to your MCP Config JSON file:

```json
{
  "mcpServers": {
    "browserbase": {
      "command": "node",
      "args": ["/path/to/mcp-server-browserbase/cli.js"],
      "env": {
        "BROWSERBASE_API_KEY": "your_api_key",
        "GEMINI_API_KEY": "your_gemini_api_key"
      }
    }
  }
}
```
</Tab>

<Tab title="Self-hosted Streamable HTTP">
First, run the server:

```bash
node cli.js --port 8931
```

Then add this to your MCP Config JSON file:

```json
{
  "mcpServers": {
    "browserbase": {
      "url": "http://localhost:8931/mcp",
      "env": {
        "BROWSERBASE_API_KEY": "your_api_key",
        "GEMINI_API_KEY": "your_gemini_api_key"
      }
    }
  }
}
```
</Tab>
</Tabs>
</Step>

<Step title="Restart your client">
<Check>
Reload your MCP client and you should be good to go!
</Check>
</Step>
</Steps>
</Tab>
</Tabs>

## Verify Installation

<Steps>
<Step title="Restart your MCP client">
Restart/refresh your MCP client app and verify tools are available.
</Step>

<Step title="Test the integration">
Get started with our MCP Server by asking your MCP client to navigate to any page, then watch your Browserbase browser in action on the [dashboard](https://www.browserbase.com/sessions).

<Tip>
Try: "Navigate to example.com and extract the main heading"
</Tip>
</Step>
</Steps>

## Further Reading

<CardGroup cols={3}>
<Card title="Model Context Protocol (MCP) Docs" icon="book" href="https://modelcontextprotocol.io/introduction">
Learn more about the MCP protocol
</Card>

<Card title="Browserbase Documentation" icon="globe" href="https://docs.browserbase.com">
Explore Browserbase features and capabilities
</Card>

<Card title="Support" icon="headset" href="mailto:support@browserbase.com">
Get help from our support team
</Card>
</CardGroup>


================================================
FILE: packages/docs/v2/integrations/mcp/tools.mdx
================================================
---
title: "Browserbase MCP Server Tools"
sidebarTitle: "Tools"
description: "This guide covers the specialized tools available in the Browserbase MCP server for browser automation and interaction."
---

## Overview

The Browserbase MCP server provides tools for browser automation and session management. Tools operate on the active Browserbase session, which is scoped to the current MCP transport session.

## Core Browser Automation Tools

These are the primary tools for modern web automation using natural language commands.

<Accordion title="navigate">
Navigate to any URL in the browser

<ParamField path="url" type="string" required>
  The URL to navigate to
</ParamField>
</Accordion>

<Accordion title="act">
Perform an action on the web page using natural language

<ParamField path="action" type="string" required>
  The action to perform (e.g., "click the login button", "fill form field")
</ParamField>

</Accordion>

<Accordion title="observe">
Observe and find actionable elements on the page

<ParamField path="instruction" type="string" required>
  Specific instruction for observation (e.g., "find the login button", "locate search form")
</ParamField>
</Accordion>

<Accordion title="extract">
Extract data from the current page.

<ParamField path="instruction" type="string">
  Optional extraction instruction.
</ParamField>
</Accordion>

## Session Management

<Accordion title="start">
Create or reuse a Browserbase session and set it as active for the current MCP transport session.

<Info>No input parameters required.</Info>

<ResponseField name="sessionId" type="string">
  Browserbase session ID.
</ResponseField>
</Accordion>

<Accordion title="end">
Close the active Browserbase session for the current MCP transport session.

<Info>No input parameters required.</Info>

</Accordion>

## Further Reading

<CardGroup cols={3}>
<Card title="Model Context Protocol (MCP) Docs" icon="book" href="https://modelcontextprotocol.io/introduction">
Learn more about the MCP protocol
</Card>

<Card title="Stagehand Documentation" icon="robot" href="https://docs.stagehand.dev/">
Explore Stagehand's AI-powered browser automation
</Card>

<Card title="Support" icon="headset" href="mailto:support@browserbase.com">
Get help from our support team
</Card>
</CardGroup>


================================================
FILE: packages/docs/v2/integrations/vercel/configuration.mdx
================================================
---
title: Use Stagehand in Next.js
sidebarTitle: Configuration
description: Next.js is a popular framework for developing web-based applications in production. It powers Stagehand apps like [Director](https://director.ai), [Brainrot](https://brainrot.run) and [Open Operator](https://operator.browserbase.com).
---

<Card
  title="Check out the Stagehand Next.js Quickstart"
  icon="github"
  href="https://github.com/browserbase/stagehand-nextjs-quickstart"
>
  Clone our [GitHub repo](https://github.com/browserbase/stagehand-nextjs-quickstart) to get started with Stagehand in Next.js.
</Card>

## Add Stagehand to an existing Next.js project
If you'd like to add Stagehand to an existing Next.js project, you can do so by installing the dependencies:
<Tabs>
	<Tab title="npm">
	```bash
	npm install @browserbasehq/stagehand @browserbasehq/sdk playwright zod
	```
	</Tab>

	<Tab title="pnpm">
	```bash
	pnpm add @browserbasehq/stagehand @browserbasehq/sdk playwright zod
	```
	</Tab>

	<Tab title="yarn">
	```bash
	yarn add @browserbasehq/stagehand @browserbasehq/sdk playwright zod
	```
	</Tab>
</Tabs>

### Write a server action
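Next, let's define our server actions in `app/stagehand/main.ts`. `runStagehand` and `startBBSSession` are exported as server actions, while `main` is a private helper that contains the automation script. This file will have the following three functions: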

1. **`main`: Run the main Stagehand script**
2. **`runStagehand`: Initialize and run the `main` function**
3. **`startBBSSession`: Start a Browserbase session**

```ts app/stagehand/main.ts
// 🤘 Welcome to Stagehand!
// This file is from the [Stagehand docs](https://docs.stagehand.dev/sections/examples/nextjs).

"use server";

import { Stagehand } from "@browserbasehq/stagehand";
import { z } from "zod/v3";
import { Browserbase } from "@browserbasehq/sdk";

/**
 * Run the main Stagehand script
 */
async function main(stagehand: Stagehand) {
  // You can use the `page` instance to write any Playwright code
  // For more info: https://playwright.dev/docs/pom
  const page = stagehand.page;

  // In this example, we'll get the title of the Stagehand quickstart page
  await page.goto("https://docs.stagehand.dev/");
  await page.act("click the quickstart link");
  const { title } = await page.extract({
    instruction: "extract the main heading of the page",
    schema: z.object({
      title: z.string(),
    }),
  });

  return title;
}

/**
 * Initialize and run the main() function
 */
export async function runStagehand(sessionId?: string) {
  const stagehand = new Stagehand({
    env: "BROWSERBASE",
    apiKey: process.env.BROWSERBASE_API_KEY,
    projectId: process.env.BROWSERBASE_PROJECT_ID,
    verbose: 1,
    logger: console.log,
    browserbaseSessionID: sessionId,
    disablePino: true,
  });
  await stagehand.init();
  await main(stagehand);
  await stagehand.close();
}

/**
 * Start a Browserbase session
 */
export async function startBBSSession() {
  const browserbase = new Browserbase();
  const session = await browserbase.sessions.create({
    projectId: process.env.BROWSERBASE_PROJECT_ID!,
  });
  const debugUrl = await browserbase.sessions.debug(session.id);
  return {
    sessionId: session.id,
    debugUrl: debugUrl.debuggerFullscreenUrl,
  };
}
```

### Create a client component
Next, let's create a client component that uses the server actions we just defined. It first starts a Browserbase session and embeds the session's debug view in an iframe, then calls `runStagehand` to run the `main` function against that session.

```tsx app/components/stagehandEmbed.tsx
"use client";

import { useCallback, useState } from "react";
import { runStagehand, startBBSSession } from "@/app/stagehand/main";

export function StagehandEmbed() {
  const [sessionId, setSessionId] = useState<string | null>(null);
  const [debugUrl, setDebugUrl] = useState<string | null>(null);

  const startSession = useCallback(async () => {
    const { sessionId, debugUrl } = await startBBSSession();
    setSessionId(sessionId);
    setDebugUrl(debugUrl);
    await runStagehand(sessionId);
  }, []);

  return (
    <div>
      {!sessionId && <button onClick={startSession}>Start Session</button>}
      {sessionId && debugUrl && (
        <iframe src={debugUrl} className="w-full h-full" />
      )}
    </div>
  );
}
```

### Use the `StagehandEmbed` component
Now, we can use the `StagehandEmbed` component in our app.

```tsx app/page.tsx
import { StagehandEmbed } from "@/app/components/stagehandEmbed";

export default function Home() {
	return (
		<main>
			<StagehandEmbed />
		</main>
	)
}
```

## References

<CardGroup cols={2}>
  <Card title="Deploy Template" icon="rocket" href="https://vercel.com/templates/ai/stagehand-next-js-quickstart">
    One‑click deploy the Stagehand Next.js template on Vercel
  </Card>
  
  <Card title="Source Code" icon="github" href="https://github.com/browserbase/stagehand-nextjs-quickstart">
    Browse the complete template repository on GitHub
  </Card>
</CardGroup>

================================================
FILE: packages/docs/v2/integrations/vercel/introduction.mdx
================================================
---
title: "Next.js + Vercel"
sidebarTitle: "Introduction"
description: "Build and deploy a Stagehand‑powered Next.js app to Vercel"
---

## Overview

The Stagehand + Next.js Quickstart is a production‑ready template that pairs Stagehand's AI browser automation with a modern Next.js app, deployable in one click on Vercel.

<CardGroup cols={3}>
  <Card title="Deploy Template" icon="rocket" href="https://vercel.com/templates/ai/stagehand-next-js-quickstart">
    One‑click deploy to Vercel with environment setup
  </Card>

  <Card title="Live Demo" icon="globe" href="https://stagehand-nextjs-quickstart.vercel.app">
    See the deployed template in action
  </Card>

  <Card title="Source Code" icon="github" href="https://github.com/browserbase/stagehand-nextjs-quickstart">
    Browse the repository on GitHub
  </Card>
</CardGroup>

## What you get

<CardGroup cols={2}>
  <Card title="App Router project" icon="browser">
    Next.js App Router scaffold with Tailwind styling
  </Card>
  <Card title="Server‑safe automation" icon="shield-check">
    Uses Browserbase for cloud browsers (works on Vercel functions)
  </Card>
  <Card title="Prewired config" icon="gear">
    `stagehand.config.ts` with model + provider switching
  </Card>
  <Card title="Automation ready" icon="robot">
    Example usage of Stagehand primitives
  </Card>
</CardGroup>

## Requirements

- **Node 18+** locally
- **Model key**: OpenAI or Anthropic (or plug in a custom client)
- **Browserbase keys**: `BROWSERBASE_API_KEY` and `BROWSERBASE_PROJECT_ID` for cloud browsers

<Tip>
Local Playwright browsers are not available on Vercel. Configure Stagehand with `env: "BROWSERBASE"` when deploying.
</Tip>

## Links

<CardGroup cols={2}>
  <Card title="Quickstart" icon="rocket" href="/integrations/vercel/quickstart">
    Run locally and deploy to Vercel in minutes
  </Card>
  <Card title="TypeScript Quickstart" icon="code" href="/first-steps/quickstart">
    More templates, including Vercel deployment examples
  </Card>
</CardGroup>


================================================
FILE: packages/docs/v2/references/act.mdx
================================================
---
title: act()
description: 'Complete API reference for the act() method'
icon: 'arrow-pointer'
---

<CardGroup cols={1}>
<Card title="Act" icon="arrow-pointer" href="/v2/basics/act">
  See how to use act() to perform browser actions
</Card>
</CardGroup>

### Method Signatures

<Tabs>
<Tab title="TypeScript">

```typescript
// String instruction
await page.act(instruction: string): Promise<ActResult>

// With ActOptions
await page.act(options: ActOptions): Promise<ActResult>

// Execute observed action
await page.act(observeResult: ObserveResult): Promise<ActResult>
```

**ActOptions Interface:**
```typescript
interface ActOptions {
  action: string;
  modelName?: AvailableModel;
  modelClientOptions?: ClientOptions;
  variables?: Record<string, string>;
  domSettleTimeoutMs?: number;
  timeoutMs?: number;
  iframes?: boolean;
}
```

</Tab>
<Tab title="Python">

```python
# String instruction
await page.act(instruction: str) -> ActResult

# With parameters
await page.act(
    instruction: str,
    variables: Dict[str, str] = None,
    dom_settle_timeout_ms: int = None,
    timeout_ms: int = None,
    model_name: AvailableModel = None,
    model_client_options: Dict = None,
    iframes: bool = None,
) -> ActResult

# Execute observed action
await page.act(observe_result: ObserveResult) -> ActResult
```

</Tab>
</Tabs>

### Parameters

<ParamField path="action" type="string" required>
  Natural language description of the action to perform.
</ParamField>

<ParamField path="variables" type="Record<string, string>" optional>
  Key-value pairs for variable substitution using `%variable%` syntax. Prevents sensitive data from appearing in logs.
</ParamField>

<ParamField path="modelName" type="AvailableModel" optional>
  Override the default LLM model for this action.
</ParamField>

<ParamField path="modelClientOptions" type="ClientOptions" optional>
  Model-specific configuration options.
  
  **Options:** `temperature`, `maxTokens`, `apiKey`
</ParamField>

<ParamField path="domSettleTimeoutMs" type="number" optional>
  Maximum time to wait for DOM to stabilize before attempting action.
  
  **Default:** `30000`
</ParamField>

<ParamField path="timeoutMs" type="number" optional>
  Maximum time to wait for the action to complete.
</ParamField>

<ParamField path="iframes" type="boolean" optional>
  Set to `true` if target element is within an iframe.
  
  **Default:** `false`
</ParamField>

<ParamField path="observeResult" type="ObserveResult" optional>
  Previously observed action to execute directly (enables self-healing).
</ParamField>

### Returns `Promise<ActResult>`

<ParamField path="success" type="boolean" required>
  Whether the action was completed successfully.
</ParamField>

<ParamField path="message" type="string" required>
  Details about the action's execution.
</ParamField>

<ParamField path="action" type="string" required>
  The action that was performed.
</ParamField>

```typescript Example Response
{
  success: true,
  message: 'Action [scrollTo] performed successfully on selector: /html[1]',
  action: 'Scrollable area of the page where user can navigate to the pricing section or other parts of the page'
}
```

### Error Types

- **TimeoutError** - Action exceeded timeout limits
- **ElementNotFoundError** - Target element could not be located  
- **ActionFailedError** - Action could not be completed
- **StagehandError** - General Stagehand-specific errors

================================================
FILE: packages/docs/v2/references/agent.mdx
================================================
---
title: agent()
description: 'Complete API reference for the agent() method'
icon: 'robot'
---

<CardGroup cols={1}>
<Card title="Agent" icon="robot" href="/v2/basics/agent">
  See how to use agent() to create autonomous AI agents for multi-step browser workflows
</Card>
</CardGroup>

### Agent Creation

<Tabs>
<Tab title="TypeScript">

```typescript
// Create agent instance
const agent = stagehand.agent(config: AgentConfig): AgentInstance
```

**AgentConfig Interface:**
```typescript
interface AgentConfig {
  provider?: AgentProviderType;  // "openai" | "anthropic"
  model?: string;
  instructions?: string;
  options?: Record<string, unknown>;
  integrations?: (Client | string)[];
  tools?: ToolSet;
}
```

**AgentInstance Interface:**
```typescript
interface AgentInstance {
  execute: (instructionOrOptions: string | AgentExecuteOptions) => Promise<AgentResult>;
}
```

</Tab>
<Tab title="Python">

```python
# Create agent instance
agent = stagehand.agent(
    model: str,
    instructions: str = None,
    options: Dict[str, Any] = None
)
```

</Tab>
</Tabs>

### Agent Configuration

<ParamField path="provider" type="AgentProviderType" optional>
  AI provider for agent functionality.
  
  **Options:** `"anthropic"`, `"openai"`
</ParamField>

<ParamField path="model" type="string" optional>
  Specific model for agent execution.
  
  **Anthropic:** `"claude-sonnet-4-6"`, `"claude-sonnet-4-5-20250929"`
  
  **OpenAI:** `"computer-use-preview"`, `"gpt-4o"`
</ParamField>

<ParamField path="instructions" type="string" optional>
  System instructions defining agent behavior.
</ParamField>

<ParamField path="options" type="Record<string, unknown>" optional>
  Provider-specific configuration.
  
  **Common:** `apiKey`, `baseURL`, `organization`
</ParamField>

<ParamField path="integrations" type="(Client | string)[]" optional>
  MCP (Model Context Protocol) integrations for external tools and services.
  
  **Array of:** MCP server URLs (strings) or connected Client objects
</ParamField>

<ParamField path="tools" type="ToolSet" optional>
  Custom tool definitions to extend agent capabilities.
  
  **Format:** Object with tool name keys and tool definition values
</ParamField>

### Execute Method

<Tabs>
<Tab title="TypeScript">

```typescript
// String instruction
await agent.execute(instruction: string): Promise<AgentResult>

// With options
await agent.execute(options: AgentExecuteOptions): Promise<AgentResult>
```

**AgentExecuteOptions Interface:**
```typescript
interface AgentExecuteOptions {
  instruction: string;
  maxSteps?: number;
  autoScreenshot?: boolean;
  waitBetweenActions?: number;
  context?: string;
}
```

</Tab>
<Tab title="Python">

```python
# String instruction
await agent.execute(instruction: str) -> AgentResult

# With options dictionary
await agent.execute({
    "instruction": str,
    "max_steps": int = 20,
    "auto_screenshot": bool = True,
    "wait_between_actions": int = 0,
    "context": str = None
}) -> AgentResult
```

</Tab>
</Tabs>

### Execute Parameters

<ParamField path="instruction" type="string" required>
  High-level task description in natural language.
</ParamField>

<ParamField path="maxSteps" type="number" optional>
  Maximum number of actions the agent can take.
  
  **Default:** `20`
</ParamField>

<ParamField path="autoScreenshot" type="boolean" optional>
  Whether to take screenshots before each action.
  
  **Default:** `true`
</ParamField>

<ParamField path="waitBetweenActions" type="number" optional>
  Delay in milliseconds between actions.
  
  **Default:** `0`
</ParamField>

<ParamField path="context" type="string" optional>
  Additional context or constraints for the agent.
</ParamField>

### Response

**Returns:** `Promise<AgentResult>`

**AgentResult Interface:**
```typescript
interface AgentResult {
  success: boolean;
  message: string;
  actions: AgentAction[];
  completed: boolean;
  metadata?: Record<string, unknown>;
  usage?: {
    input_tokens: number;
    output_tokens: number;
    reasoning_tokens?: number;
    cached_input_tokens?: number;
    inference_time_ms: number;
  };
}
```

<Tabs>
<Tab title="TypeScript">

<ParamField path="success" type="boolean">
  Whether the task was completed successfully.
</ParamField>

<ParamField path="message" type="string">
  Description of the execution result and status.
</ParamField>

<ParamField path="actions" type="AgentAction[]">
  Array of individual actions taken during execution.
</ParamField>

<ParamField path="completed" type="boolean">
  Whether the agent believes the task is fully complete.
</ParamField>

<ParamField path="metadata" type="Record<string, unknown>" optional>
  Additional execution metadata and debugging information.
</ParamField>

<ParamField path="usage" type="object" optional>
  Token usage and performance metrics.
</ParamField>

</Tab>
<Tab title="Python">

<ParamField path="success" type="boolean">
  Whether the task was completed successfully.
</ParamField>

<ParamField path="message" type="string">
  Description of the execution result and status.
</ParamField>

<ParamField path="actions" type="AgentAction[]">
  Array of individual actions taken during execution.
</ParamField>

<ParamField path="completed" type="boolean">
  Whether the agent believes the task is fully complete.
</ParamField>

</Tab>
</Tabs>

### Example Response
```json
{
  "success": true,
  "message": "Task completed successfully",
  "actions": [
    {
      "action": "click",
      "selector": "button.primary",
      "text": "Submit"
    }
  ],
  "completed": true,
  "metadata": {
    "execution_time": 1000
  },
  "usage": {
    "input_tokens": 100,
    "output_tokens": 50,
    "reasoning_tokens": 12,
    "cached_input_tokens": 0,
    "inference_time_ms": 100
  }
}
```

================================================
FILE: packages/docs/v2/references/extract.mdx
================================================
---
title: extract()
description: 'Complete API reference for the extract() method'
icon: 'ufo-beam'
---

<CardGroup cols={1}>
<Card title="Extract" icon="ufo-beam" href="/v2/basics/extract">
  See how to use extract() to extract structured data from web pages
</Card>
</CardGroup>

### Method Signatures

<Tabs>
<Tab title="TypeScript">

```typescript
// With schema and options
await page.extract<T extends z.AnyZodObject>(options: ExtractOptions<T>): Promise<ExtractResult<T>>

// String instruction only
await page.extract(instruction: string): Promise<{ extraction: string }>

// No parameters (raw page content)
await page.extract(): Promise<{ pageText: string }>
```

**ExtractOptions Interface:**
```typescript
interface ExtractOptions<T extends z.AnyZodObject> {
  instruction?: string;
  schema?: T;
  modelName?: AvailableModel;
  modelClientOptions?: ClientOptions;
  domSettleTimeoutMs?: number;
  selector?: string;
  iframes?: boolean;
}

type ExtractResult<T> = z.infer<T>;
```

</Tab>
<Tab title="Python">

```python
# With schema and parameters
await page.extract(
    instruction: str = None,
    schema: BaseModel = None,
    selector: str = None,
    iframes: bool = None,
    model_name: AvailableModel = None,
    model_client_options: Dict = None,
    dom_settle_timeout_ms: int = None
) -> ExtractResult

# String instruction only
await page.extract(instruction: str) -> Dict[str, str]

# No parameters (raw page content)
await page.extract() -> Dict[str, str]
```

</Tab>
</Tabs>

### Parameters

<ParamField path="instruction" type="string" optional>
  Natural language description of what data to extract.
</ParamField>

<ParamField path="schema" type="z.ZodSchema | BaseModel" optional>
  Type schema defining the structure of data to extract. Ensures type safety and validation.
</ParamField>

<ParamField path="selector" type="string" optional>
  XPath selector to limit extraction scope. Reduces token usage and improves accuracy.
</ParamField>

<ParamField path="iframes" type="boolean" optional>
  Set to `true` if content exists within iframes.
  
  **Default:** `false`
</ParamField>

<ParamField path="modelName" type="AvailableModel" optional>
  Override the default LLM model for this extraction.
</ParamField>

<ParamField path="modelClientOptions" type="ClientOptions" optional>
  Model-specific configuration options.
</ParamField>

<ParamField path="domSettleTimeoutMs" type="number" optional>
  Maximum time to wait for DOM to stabilize.
  
  **Default:** `30000`
</ParamField>

### Response Types

<Tabs>
<Tab title="With Schema">
**Returns:** `Promise<ExtractResult<T>>` where T matches your schema

The returned object will be strictly typed according to your schema definition.
</Tab>

<Tab title="String Only">
**Returns:** `Promise<{ extraction: string }>`

Simple string extraction without schema validation.
</Tab>

<Tab title="No Parameters">
**Returns:** `Promise<{ pageText: string }>`

Raw accessibility tree representation of page content.
</Tab>
</Tabs>

### Code Examples

<Tabs>
<Tab title="Single Object">

<CodeGroup>
```typescript TypeScript
import { z } from 'zod';

// Schema definition
const ProductSchema = z.object({
  name: z.string(),
  price: z.number(),
  inStock: z.boolean()
});

// Extraction
const product = await page.extract({
  instruction: "extract product details",
  schema: ProductSchema
});
```

```python Python
from pydantic import BaseModel

# Schema definition
class Product(BaseModel):
    name: str
    price: float
    in_stock: bool

# Extraction
product = await page.extract(
    instruction="extract product details",
    schema=Product
)
```
</CodeGroup>

#### Example Response
```json
{
  "name": "Product Name",
  "price": 100,
  "inStock": true
}
```

</Tab>
<Tab title="Arrays">

<CodeGroup>
```typescript TypeScript
import { z } from 'zod';

// Schema definition
const ApartmentListingsSchema = z.object({
  apartments: z.array(z.object({
    address: z.string(),
    price: z.string(),
    bedrooms: z.number()
  }))
});

// Extraction
const listings = await page.extract({
  instruction: "extract all apartment listings", 
  schema: ApartmentListingsSchema
});
```

```python Python
from pydantic import BaseModel
from typing import List

# Schema definition
class Apartment(BaseModel):
    address: str
    price: str
    bedrooms: int

class ApartmentListings(BaseModel):
    apartments: List[Apartment]

# Extraction
listings = await page.extract(
    instruction="extract all apartment listings",
    schema=ApartmentListings
)
```
</CodeGroup>

#### Example Response
```json
{
  "apartments": [
    {
      "address": "123 Main St",
      "price": "$100,000",
      "bedrooms": 3
    },
    {
      "address": "456 Elm St",
      "price": "$150,000",
      "bedrooms": 2
    }
  ]
}
```

</Tab>
<Tab title="URLs">

<CodeGroup>
```typescript TypeScript
import { z } from 'zod';

// Schema definition
const NavigationSchema = z.object({
  links: z.array(z.object({
    text: z.string(),
    url: z.string().url()  // URL validation
  }))
});

// Extraction
const links = await page.extract({
  instruction: "extract navigation links",
  schema: NavigationSchema
});
```

```python Python
from pydantic import BaseModel, HttpUrl
from typing import List

# Schema definition
class NavLink(BaseModel):
    text: str
    url: HttpUrl  # URL validation

class Navigation(BaseModel):
    links: List[NavLink]

# Extraction
links = await page.extract(
    instruction="extract navigation links", 
    schema=Navigation
)
```
</CodeGroup>

#### Example Response
```json
{
  "links": [
    {
      "text": "Home",
      "url": "https://example.com"
    }
  ]
}
```

</Tab>
<Tab title="Scoped">

<CodeGroup>
```typescript TypeScript
import { z } from 'zod';

const ProductSchema = z.object({
  name: z.string(),
  price: z.number(),
  description: z.string()
});

// Extract from specific page section
const data = await page.extract({
  instruction: "extract product info from this section",
  selector: "xpath=/html/body/div/div",
  schema: ProductSchema
});
```

```python Python
from pydantic import BaseModel

class Product(BaseModel):
    name: str
    price: float
    description: str

# Extract from specific page section
data = await page.extract(
    instruction="extract product info from this section",
    selector="xpath=/html/body/div/div",
    schema=Product
)
```
</CodeGroup>

#### Example Response
```json
{
  "name": "Product Name",
  "price": 100,
  "description": "Product description"
}
```

</Tab>
<Tab title="Schema-less">

<CodeGroup>
```typescript TypeScript
// String only extraction
const title = await page.extract("get the page title");
// Returns: { extraction: "Page Title" }

// Raw page content
const content = await page.extract();
// Returns: { pageText: "Accessibility Tree: ..." }
```

```python Python
# String only extraction
title = await page.extract("get the page title")
# Returns: {"extraction": "Page Title"}

# Raw page content
content = await page.extract()
# Returns: {"pageText": "Accessibility Tree: ..."}
```
</CodeGroup>

#### Example Response
```json
{
  "extraction": "Page Title"
}
```

</Tab>
<Tab title="Advanced">

<CodeGroup>
```typescript TypeScript
import { z } from 'zod';

// Schema with descriptions and validation
const ProductSchema = z.object({
  price: z.number().describe("Product price in USD"),
  rating: z.number().min(0).max(5).describe("Customer rating out of 5"),
  available: z.boolean().describe("Whether product is in stock"),
  tags: z.array(z.string()).optional()
});

// Nested schema
const EcommerceSchema = z.object({
  product: z.object({
    name: z.string(),
    price: z.object({
      current: z.number(),
      original: z.number().optional()
    })
  }),
  reviews: z.array(z.object({
    rating: z.number(),
    comment: z.string()
  }))
});
```

```python Python
from pydantic import BaseModel, Field
from typing import Optional, List

# Schema with descriptions and validation
class Product(BaseModel):
    price: float = Field(description="Product price in USD")
    rating: float = Field(ge=0, le=5, description="Customer rating out of 5")
    available: bool = Field(description="Whether product is in stock")
    tags: Optional[List[str]] = None

# Nested schema
class Price(BaseModel):
    current: float
    original: Optional[float] = None

class Review(BaseModel):
    rating: int
    comment: str

class ProductDetails(BaseModel):
    name: str
    price: Price

class EcommerceData(BaseModel):
    product: ProductDetails
    reviews: List[Review]
```
</CodeGroup>

#### Example Response
```json
{
  "product": {
    "name": "Product Name",
    "price": {
      "current": 100,
      "original": 120
    }
  },
  "reviews": [
    {
      "rating": 4,
      "comment": "Great product!"
    }
  ]
}
```

</Tab>
</Tabs>

================================================
FILE: packages/docs/v2/references/observe.mdx
================================================
---
title: observe()
description: 'Complete API reference for the observe() method'
icon: 'magnifying-glass'
---

<CardGroup cols={1}>
<Card title="Observe" icon="magnifying-glass" href="/v2/basics/observe">
  See how to use observe() to discover actionable elements and analyze web page structure
</Card>
</CardGroup>

### Method Signatures

<Tabs>
<Tab title="TypeScript">

```typescript
// With ObserveOptions
await page.observe(options: ObserveOptions): Promise<ObserveResult[]>

// String instruction shorthand
await page.observe(instruction: string): Promise<ObserveResult[]>
```

**ObserveOptions Interface:**
```typescript
interface ObserveOptions {
  instruction?: string;
  modelName?: AvailableModel;
  modelClientOptions?: ClientOptions;
  domSettleTimeoutMs?: number;
  drawOverlay?: boolean;
  iframes?: boolean;
}
```

</Tab>
<Tab title="Python">

```python
# With parameters
await page.observe(
    instruction: str,
    dom_settle_timeout_ms: int = None,
    iframes: bool = None,
    model_name: AvailableModel = None,
    model_client_options: Dict = None
) -> List[ObserveResult]
```

</Tab>
</Tabs>

### Parameters

<ParamField path="instruction" type="string" optional>
  Natural language description of elements or actions to discover.
</ParamField>

<ParamField path="modelName" type="AvailableModel" optional>
  Override the default LLM model for this observation.
</ParamField>

<ParamField path="modelClientOptions" type="ClientOptions" optional>
  Model-specific configuration options.
</ParamField>

<ParamField path="domSettleTimeoutMs" type="number" optional>
  Maximum time to wait for DOM to stabilize before analysis.
  
  **Default:** `30000`
</ParamField>

<ParamField path="drawOverlay" type="boolean" optional>
  Whether to draw visual overlays on discovered elements (debugging).
  
  **Default:** `false`
</ParamField>

<ParamField path="iframes" type="boolean" optional>
  Set to `true` to search within iframes.
  
  **Default:** `false`
</ParamField>

### Response

**Returns:** `Promise<ObserveResult[]>`

Array of discovered actionable elements, ordered by relevance.

**ObserveResult Interface:**
```typescript
interface ObserveResult {
  selector: string;        // XPath selector to locate element
  description: string;     // Human-readable description
  method?: string;         // Suggested action method
  arguments?: string[];    // Additional action parameters
}
```

<ParamField path="selector" type="string">
  XPath selector that precisely locates the element.
</ParamField>

<ParamField path="description" type="string">
  Human-readable description of the element and its purpose.
</ParamField>

<ParamField path="method" type="string" optional>
  Suggested interaction method: `"click"`, `"fill"`, `"selectOptionFromDropdown"`, `"nextChunk"`, `"scrollTo"`, `"prevChunk"`.
</ParamField>

<ParamField path="arguments" type="string[]" optional>
  Additional parameters for the suggested action.
</ParamField>


### Code Examples

<CodeGroup>
```typescript TypeScript
// Basic element discovery
const buttons = await page.observe("find all clickable buttons");
const formFields = await page.observe("locate form input fields");

// Advanced configuration
const elements = await page.observe({
  instruction: "find important call-to-action buttons",
  modelName: "gpt-4.1-mini",
  domSettleTimeoutMs: 45000,
  drawOverlay: true
});

// Working with results
const [loginButton] = await page.observe("find the login button");
if (loginButton) {
  console.log("Found:", loginButton.description);
  console.log("Selector:", loginButton.selector);
  await page.act(loginButton); // Execute the action
}

// Filter results
const submitButtons = await page.observe("find all submit buttons");
const primarySubmit = submitButtons.find(btn => 
  btn.description.toLowerCase().includes('primary')
);

// Iframe search
const iframeElements = await page.observe({
  instruction: "find form fields inside the iframe",
  iframes: true
});
```

```python Python
# Basic element discovery
buttons = await page.observe("find all clickable buttons")
form_fields = await page.observe("locate the form fields")

# Advanced configuration  
elements = await page.observe(
    instruction="find important call-to-action buttons",
    model_name="gpt-4.1-mini",
    dom_settle_timeout_ms=45000
)

# Working with results
login_buttons = await page.observe("find the login button")
if login_buttons:
    button = login_buttons[0]
    print("Found:", button.description)
    print("Selector:", button.selector)
    await page.act(button)  # Execute the action

# Filter results
submit_buttons = await page.observe("find all submit buttons")
primary_submit = next((
    btn for btn in submit_buttons 
    if 'primary' in btn.description.lower()
), None)

# Iframe search
iframe_elements = await page.observe(
    instruction="find the form fields inside the iframe",
    iframes=True
)
```
</CodeGroup>

### Integration Patterns

<CodeGroup>
```typescript TypeScript
// Observe → Act workflow
const actions = await page.observe("find checkout elements");
for (const action of actions) {
  await page.act(action);
  await page.waitForTimeout(1000);
}

// Observe → Extract workflow
const tables = await page.observe("find data tables");
if (tables.length > 0) {
  const data = await page.extract({
    instruction: "extract the table data",
    selector: tables[0].selector,
    schema: DataSchema
  });
}

// Element validation
const requiredElements = await page.observe("find the login form");
if (requiredElements.length === 0) {
  throw new Error("Login form not found");
}
```

```python Python
# Observe → Act workflow  
actions = await page.observe("find checkout elements")
for action in actions:
    await page.act(action)
    await page.wait_for_timeout(1000)

# Observe → Extract workflow
tables = await page.observe("find data tables")
if tables:
    data = await page.extract(
        instruction="extract the table data",
        selector=tables[0].selector,
        schema=DataSchema
    )

# Element validation
required_elements = await page.observe("find login form")
if not required_elements:
    raise Exception("Login form not found")
```
</CodeGroup>

================================================
FILE: packages/docs/v2/references/stagehand.mdx
================================================
---
title: 'Stagehand'
description: 'Complete API reference for initializing Stagehand'
icon: 'wand-magic-sparkles'
---

### Constructor Signature

<Tabs>
<Tab title="TypeScript">

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "BROWSERBASE",
  // ... other options
});
await stagehand.init();
```

**ConstructorParams Interface:**
```typescript
interface ConstructorParams {
  env: "BROWSERBASE" | "LOCAL";
  apiKey?: string;
  projectId?: string;
  verbose?: 0 | 1 | 2;
  llmProvider?: LLMProvider;
  logger?: (message: LogLine) => void | Promise<void>;
  domSettleTimeoutMs?: number;
  browserbaseSessionCreateParams?: Omit<Browserbase.Sessions.SessionCreateParams, "projectId"> & { projectId?: string };
  enableCaching?: boolean;
  browserbaseSessionID?: string;
  modelName?: AvailableModel;
  llmClient?: LLMClient;
  modelClientOptions?: ClientOptions;
  systemPrompt?: string;
  useAPI?: boolean;
  waitForCaptchaSolves?: boolean;
  localBrowserLaunchOptions?: LocalBrowserLaunchOptions;
  logInferenceToFile?: boolean;
  selfHeal?: boolean;
  disablePino?: boolean;
  experimental?: boolean;
}
```

</Tab>
<Tab title="Python">

```python
from stagehand import Stagehand

stagehand = Stagehand(
    env: Literal["BROWSERBASE", "LOCAL"] = "BROWSERBASE",
    api_key: str = None,
    project_id: str = None,
    api_url: str = None,
    model_name: str = None,
    model_api_key: str = None,
    model_client_options: Dict[str, Any] = None,
    verbose: int = 1,
    logger: Callable = None,
    use_rich_logging: bool = True,
    dom_settle_timeout_ms: int = 3000,
    browserbase_session_create_params: Dict = None,
    browserbase_session_id: str = None,
    enable_caching: bool = False,
    self_heal: bool = True,
    wait_for_captcha_solves: bool = False,
    system_prompt: str = None,
    local_browser_launch_options: Dict[str, Any] = None,
    use_api: bool = True,
    experimental: bool = False,
)
await stagehand.init()
```

</Tab>
</Tabs>

<CardGroup cols={1}>
<Card title="Model Configuration" icon="brain" href="/configuration/models">
  Learn how to configure different LLM models for Stagehand
</Card>
</CardGroup>

### Parameters

#### Required Parameters

<ParamField path="env" type="'BROWSERBASE' | 'LOCAL'" required>
  The environment to use for Stagehand.

  - `BROWSERBASE` - Run browser on Browserbase cloud infrastructure
  - `LOCAL` - Run browser locally on your machine

  **Default:** `"BROWSERBASE"` (Python only)
</ParamField>

#### Browserbase Configuration

<ParamField path="apiKey" type="string" optional>
  Your Browserbase API key. Required when `env` is `BROWSERBASE`.
</ParamField>

<ParamField path="projectId" type="string" optional>
  Your Browserbase project ID. Required when `env` is `BROWSERBASE`.
</ParamField>

<ParamField path="browserbaseSessionID" type="string" optional>
  The ID of an existing Browserbase session to resume. Useful for continuing previous browser sessions.
</ParamField>

<ParamField path="browserbaseSessionCreateParams" type="object" optional>
  Parameters to use when creating a Browserbase session. See [Browserbase API documentation](https://docs.browserbase.com/reference/api/create-a-session) for available options.
</ParamField>

<ParamField path="waitForCaptchaSolves" type="boolean" optional>
  Wait for captchas to be solved after navigation when using Browserbase environment.

  **Default:** `false`
</ParamField>

#### Local Browser Configuration

<ParamField path="localBrowserLaunchOptions" type="LocalBrowserLaunchOptions" optional>
  Configuration options for launching a local browser. Only used when `env` is `LOCAL`.

  See the [full interface definition](https://github.com/browserbase/stagehand/blob/v2/types/stagehand.ts#L174) for all available options.
</ParamField>

#### LLM Configuration

<CardGroup cols={1}>
<Card title="Model Configuration" icon="brain" href="/configuration/models">
  Learn how to configure different LLM models for Stagehand
</Card>
</CardGroup>

<ParamField path="modelName" type="AvailableModel" optional>
  The LLM model to use for Stagehand operations.

  **Examples:** `gpt-4o`, `gpt-4o-mini`, `claude-sonnet-4-6`

  **Python Default:** `"gpt-4o"`
</ParamField>

<ParamField path="modelApiKey" type="string" optional>
  API key for the LLM model provider. **Python only.**

  In TypeScript, use `modelClientOptions.apiKey` instead.
</ParamField>

<ParamField path="llmProvider" type="LLMProvider" optional>
  A custom LLM provider implementation for Stagehand to use. **TypeScript only.**
</ParamField>

<ParamField path="llmClient" type="LLMClient" optional>
  Custom LLM client instance to use for Stagehand operations. **TypeScript only.**
</ParamField>

<ParamField path="modelClientOptions" type="ClientOptions" optional>
  LLM client configuration options. Useful for parameterizing LLM API keys and other settings.

  **Common options:** `apiKey` (TypeScript), `api_base`, `temperature`, `maxTokens`
</ParamField>

<ParamField path="enableCaching" type="boolean" optional>
  Enable caching of LLM responses to reduce API calls and costs.

  **TypeScript Default:** `true`

  **Python Default:** `false`
</ParamField>

#### Logging and Debugging

<Note>
**Security tip:** Use `verbose: 0` when your automation handles secrets to prevent sensitive data from appearing in logs.
</Note>

<ParamField path="verbose" type="0 | 1 | 2" optional>
  The verbosity level of the Stagehand logger.

  - `0` - Minimal (ERROR only)
  - `1` - Medium (INFO level)
  - `2` - Detailed (DEBUG level)

  **Default:** `1`
</ParamField>

<ParamField path="logger" type="(message: LogLine) => void | Promise<void>" optional>
  Custom logger function to handle log messages from Stagehand.
</ParamField>

<ParamField path="useRichLogging" type="boolean" optional>
  Whether to use Rich for colorized logging output. **Python only.**

  **Default:** `true`
</ParamField>

<ParamField path="disablePino" type="boolean" optional>
  Disable Pino logger. Helpful for Next.js or test environments where Pino causes issues. **TypeScript only.**

  **Default:** `false`
</ParamField>

<ParamField path="logInferenceToFile" type="boolean" optional>
  Log LLM inference details to a file for debugging purposes. **TypeScript only.**

  **Default:** `false`
</ParamField>

#### Performance and Behavior

<ParamField path="domSettleTimeoutMs" type="number" optional>
  Default timeout to wait for the DOM to settle before performing operations.

  **TypeScript Default:** `10000` (10 seconds)

  **Python Default:** `3000` (3 seconds)
</ParamField>

<ParamField path="selfHeal" type="boolean" optional>
  Enable self-healing capabilities to automatically recover from failures.

  **Python Default:** `true`
</ParamField>

<ParamField path="systemPrompt" type="string" optional>
  Customize the Stagehand system prompt used for LLM interactions.
</ParamField>

<ParamField path="useAPI" type="boolean" optional>
  Offload Stagehand method calls to the Stagehand API.

  **Default:** `true`
</ParamField>

<ParamField path="experimental" type="boolean" optional>
  Enable the latest experimental features. Use with caution in production.

  **Default:** `false`
</ParamField>

### Returns `InitResult`

After calling `stagehand.init()`, you receive an `InitResult` object:

<ParamField path="debugUrl" type="string" required>
  URL for debugging the browser session (e.g., Chrome DevTools).
</ParamField>

<ParamField path="sessionUrl" type="string" required>
  URL of the browser session (especially useful with Browserbase).
</ParamField>

<ParamField path="sessionId" type="string" required>
  Unique identifier for the browser session.
</ParamField>

================================================
FILE: packages/docs/v3/basics/act.mdx
================================================
---
title: Act
description: 'Interact with a web page'
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


## What is `act()`?
``` typescript
await stagehand.act("click on add to cart")
```
`act` enables Stagehand to perform **individual** actions on a web page. Use it to build self-healing and deterministic automations that adapt to website changes. 

## Why use `act()`?

<CardGroup cols={2}>
  <Card title="Natural Language Instructions" icon="wand-magic-sparkles" href="#using-act">
    Write automation in plain English. No selectors or complex syntax.
  </Card>
  <Card title="Precise Control" icon="crosshairs" href="#best-practices">
    Build automations step by step. Define exactly what happens at every moment.
  </Card>
  <Card title="Self-Healing" icon="bandage" href="#ensure-reliable-actions">
    Actions automatically adapt when websites change.
  </Card>
  <Card title="Caching" icon="repeat" href="#reduce-model-costs">
    Cache actions to avoid LLM calls and ensure consistent execution across runs.
  </Card>
</CardGroup>


## Using `act()`

Use `act` to perform single actions in your automation. Here's how to click a button:

```typescript
await page.goto("https://example-store.com");
await stagehand.act("click the add to cart button");
```

<Note>
**iFrame and Shadow DOM Support** Stagehand automatically handles iFrame traversal and shadow DOM elements without requiring additional configuration.
</Note>

With `act`, breaking complex actions into small, single-step actions works best. If you need to orchestrate multi-step flows, use multiple `act` commands or `agent`.

<Accordion title="Suggested actions">

| Action | Example instruction |
|--------|---------------------|
| Click | `click the button` |
| Fill | `fill the field with <value>` |
| Type | `type <text> into the search box` |
| Press | `press <key> in the search field` |
| Scroll | `scroll to <position>` |
| Select from dropdown | `select <value> from the dropdown` |
</Accordion>

### Return value of `act()`
When you use `act()`, Stagehand will return a `Promise<ActResult>` with the following structure:
``` typescript
{
  success: true,
  message: 'Action [click] performed successfully on selector: xpath=/html[1]/body[1]/div[1]/span[1] → Action [click] performed successfully on selector: xpath=/html[1]/body[1]/div[2]/div[1]/section[1]/div[1]/div[1]/div[25]',
  actionDescription: 'Favorite Colour',
  actions: [
    {
      selector: 'xpath=/html[1]/body[1]/div[1]/span[1]',
      description: 'Favorite Colour',
      method: 'click',
      arguments: []
    },
    {
      selector: 'xpath=/html[1]/body[1]/div[2]/div[1]/section[1]/div[1]/div[1]/div[25]',
      description: 'Peach',
      method: 'click',
      arguments: []
    }
  ]
}
```


<Tabs>
<Tab title="Do this" icon="check">
Break your task into single-step actions.

```typescript
// Break it into single-step actions
await stagehand.act("open the filters panel");
await stagehand.act("choose 4-star rating");
await stagehand.act("click the apply button");
```
</Tab>

<Tab title="Don't do this" icon="xmark">
For multi-step tasks, use [`agent()`](/v3/basics/agent) instead.

```typescript
// Too complex - trying to do multiple things at once
await stagehand.act("open the filters panel, choose 4-star rating, and click apply");
```
</Tab>
</Tabs>

## Advanced Configuration

You can pass additional options to configure the model, timeout, variables, and target page:

```typescript
// Custom model configuration
await stagehand.act("choose 'Peach' from the favorite color dropdown", {
  model: {
    modelName: "google/gemini-2.5-flash",
    apiKey: process.env.GEMINI_API_KEY
  },
  timeout: 10000
});
```

### Server-side Caching

<Note>
`serverCache` only works when running with `env: "BROWSERBASE"`. It has no effect in local environments.
</Note>

When running on Browserbase, Stagehand automatically caches `act()` results server-side. Repeated calls with the same inputs return instantly without consuming LLM tokens. Caching is enabled by default and can be controlled globally on the constructor or overridden per call:

```typescript
// Disable server-side caching for the entire instance
const stagehand = new Stagehand({
  env: "BROWSERBASE",
  serverCache: false,
});

// Or disable it for a single call
await stagehand.act("click the login button", { serverCache: false });

// Check whether a result was served from cache
const result = await stagehand.act("click the login button");
console.log(result.cacheStatus); // "HIT", "MISS", or undefined
```

### Using with Custom Pages

You can use `act()` with pages from other browser automation libraries like Puppeteer, Playwright, or Patchright by passing the `page` option:

```typescript
import { Stagehand } from "@browserbasehq/stagehand";
import puppeteer from "puppeteer-core";

const stagehand = new Stagehand({
  env: "BROWSERBASE",
});
await stagehand.init();

// Connect with Puppeteer
const browser = await puppeteer.connect({
  browserWSEndpoint: stagehand.connectURL(),
  defaultViewport: null,
});

const pages = await browser.pages();
const customPage = pages[0];

await customPage.goto("https://www.example.com/blog");

// Use act with the custom Puppeteer page
await stagehand.act("click the next page button", {
  page: customPage
});
```

This works with:
- **Puppeteer**: Pass Puppeteer Page objects
- **Playwright**: Pass Playwright Page objects
- **Patchright**: Pass Patchright Page objects
- **Stagehand Page**: Use `stagehand.context.pages()[0]` or `context.activePage()` (default)

<Card title="Complete API Reference" icon="book" href="/v3/references/act">
  See the full `act()` reference for detailed parameter documentation, return values, and advanced examples.
</Card>


## Best practices

### Ensure reliable actions

Use `observe()` to discover candidate actions on the current page and plan reliably. It returns a list of suggested actions (with selector, description, method, and arguments). You can pass an observed action directly to `act` to execute it.

```typescript
const [action] = await stagehand.observe("click the login button");

if (action) {
  await stagehand.act(action);
}
```

<Card title="Analyze pages with observe()" icon="magnifying-glass" iconType="sharp-solid" href="/v3/basics/observe">
  Plan actions with `observe()` before executing with `act`.
</Card>

### Reduce model costs

Enable automatic action caching by specifying a `cacheDir` when initializing Stagehand. The first time an action runs, it's cached. Subsequent runs reuse the cached action without LLM calls.

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

// Enable caching by specifying a cache directory
const stagehand = new Stagehand({
  env: "BROWSERBASE",
  cacheDir: "act-cache" // Actions are automatically cached here
});

await stagehand.init();
const page = stagehand.context.pages()[0];

// First run - makes LLM call and caches the action
await stagehand.act("click the login button");
```

<Note>
Caching persists across script executions. The first time you run your script, actions are cached to your local filesystem. On subsequent runs, cached actions are reused automatically, significantly reducing costs and improving performance.
</Note>

<Card title="Complete caching guide" icon="database" iconType="sharp-solid" href="/v3/best-practices/caching">
  Learn advanced caching techniques and patterns for optimal performance.
</Card>

### Secure your automations

Variables are **not shared with LLM providers**. Use them for passwords, API keys, and other sensitive data.

<Note>
Load sensitive data from environment variables using `.env` files. Never hardcode API keys, passwords, or other secrets directly in your code.
</Note>

```typescript
// Variables use %variableName% syntax in the instruction
await stagehand.act("type %username% into the email field", {
  variables: { username: "user@example.com" }
});

await stagehand.act("type %password% into the password field", {
  variables: { password: process.env.USER_PASSWORD }
});

await stagehand.act("click the login button");
```

<Warning>
When handling sensitive data, set `verbose: 0` in your Stagehand configuration to prevent secrets from appearing in logs. See the [configuration guide](/configuration/browser) for more details.
</Warning>

<Card title="User Data Best Practices" icon="shield-check" iconType="sharp-solid" href="/v3/best-practices/user-data">
  Complete guide to securing your browser automations with best practices and configurations.
</Card>

## Troubleshooting

<AccordionGroup>


<Accordion title="Method not supported">
**Problem**: `act` fails with a "method not supported" error

**Solutions**:
- Use clear and detailed instructions for what you want to accomplish
- Review our [evals](https://stagehand.dev/evals) to find the best models for your use case
- Use [`observe()`](/v3/basics/observe) and verify the resulting action is within a list of expected actions

**Solution 1: Validate with observe**

```typescript
const prompt = "click the submit button";
const expectedMethod = "click";

try {
  await stagehand.act(prompt);
} catch (error) {
  if (error.message.includes("method not supported")) {
    // Observe the same prompt to get the planned action
    const [action] = await stagehand.observe(prompt);

    if (action && action.method === expectedMethod) {
      await stagehand.act(action);
    } else {
      throw new Error(`Unsupported method: expected "${expectedMethod}", got "${action?.method}"`);
    }
  } else {
    throw error;
  }
}
```

**Solution 2: Retry with exponential backoff**

```typescript
// Retry with exponential backoff for intermittent issues
const prompt = "click the submit button";
const maxRetries = 3;

for (let attempt = 0; attempt <= maxRetries; attempt++) {
  try {
    await stagehand.act(prompt, { timeout: 10000 + (attempt * 5000) });
    break; // Success, exit retry loop
  } catch (error) {
    if (error.message.includes("method not supported") && attempt < maxRetries) {
      // Exponential backoff: wait 2^attempt seconds
      const delay = Math.pow(2, attempt) * 1000;
      console.log(`Retry ${attempt + 1}/${maxRetries} after ${delay}ms`);
      await new Promise(resolve => setTimeout(resolve, delay));
    } else {
      throw error;
    }
  }
}
```

</Accordion>

<Accordion title="Action failed or timed out">
**Problem**: `act` times out or fails to complete the action (often because the element was not found)

**Solutions**:
- Ensure page has fully loaded
- Check if content is in iframes: [Learn more about working with iframes](/best-practices/working-with-iframes)
- Increase action timeout
- Use `observe()` first to verify element exists

```typescript
// Handle timeout and element not found issues
try {
  await stagehand.act("click the submit button", { timeout: 30000 });
} catch (error) {
  // Check if page is fully loaded
  await page.waitForLoadState('domcontentloaded');

  // Use observe to check element state
  const [element] = await stagehand.observe("find the submit button");

  if (element) {
    console.log("Element found, trying more specific instruction");
    await stagehand.act("click the submit button at the bottom of the form");
  } else {
    console.log("Element not found, trying alternative selector");
    await stagehand.act("click the button with text 'Submit'");
  }
}
```
</Accordion>

<Accordion title="Incorrect element selected">
**Problem**: `act` performs the action on the wrong element

**Solutions**:
- Be more specific in instructions: include visual cues, position, or context
- Use `observe()` to preview which element will be selected
- Add contextual information: "the search button in the header"
- Use unique identifiers when available

```typescript
// More precise element targeting
// Instead of:
await stagehand.act("click the button");

// Use specific context:
await stagehand.act("click the red 'Delete' button next to the user John Smith");

// Or preview with observe first:
const [action] = await stagehand.observe("click the submit button in the checkout form");
if (action.description.includes("checkout")) {
  await stagehand.act(action);
}
```
</Accordion>


</AccordionGroup>

## Next steps

<CardGroup cols={2}>

  <Card title="Orchestrate complex workflows with Agent" icon="robot" iconType="sharp-solid" href="/v3/basics/agent">
    Use `Agent` to autonomously execute multi-step tasks and complex workflows.
  </Card>

   <Card title="Caching actions" icon="bolt" iconType="sharp-solid" href="/v3/best-practices/caching">
    Speed up repeated automations by caching actions.
  </Card>

  <Card title="Extract data with extract()" icon="table" iconType="sharp-solid" href="/v3/basics/extract">
    Use `extract` with a data schema to pull clean, typed data from any page.
  </Card>

  <Card title="Preview actions with observe()" icon="magnifying-glass" iconType="sharp-solid" href="/v3/basics/observe">
    Preview actions with `observe()` before executing them.
  </Card>
</CardGroup>

================================================
FILE: packages/docs/v3/basics/agent.mdx
================================================
---
title: Agent
description: 'Automate complex workflows with AI-powered browser agents'
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


## What is `agent()`?

``` typescript
await agent.execute("apply for a job at browserbase")
```
`agent` turns high-level tasks into **fully autonomous** browser workflows. You can customize the agent by specifying the LLM provider and model, setting custom instructions for behavior, and configuring max steps.

<img src="/images/agent.gif" alt="Agent" />

## Why use `agent()`?

<CardGroup cols={2}>
  <Card title="Multi-Step Workflows" icon="route" href="#agent-execution-configuration">
    Execute complex sequences automatically.
  </Card>
  <Card title="Visual Understanding" icon="eye" href="/v3/best-practices/computer-use">
    Sees and understands web interfaces like humans do using computer vision.
  </Card>
</CardGroup>

## Using `agent()`

There are three ways to create agents in Stagehand:
1. Use a Computer Use Agent (CUA mode)
2. Use Agent with any LLM (DOM mode)
3. Use Agent with vision and DOM (Hybrid mode)

### Feature Availability

Some advanced features are only available with certain agent modes:

| Feature                  | CUA | DOM | Hybrid |
|:-------------------------|:---:|:---:|:------:|
| Basic execution          | ✅  | ✅  | ✅     |
| Custom tools             | ✅  | ✅  | ✅     |
| MCP integrations         | ✅  | ✅  | ✅     |
| System prompt            | ✅  | ✅  | ✅     |
| Variables                | ❌  | ✅  | ✅     |
| Streaming                | ❌  | ✅  | ✅     |
| Callbacks                | ❌  | ✅  | ✅     |
| Abort signal             | ❌  | ✅  | ✅     |
| Message continuation     | ❌  | ✅  | ✅     |
| Exclude tools            | ❌  | ✅  | ✅     |
| Structured output        | ❌  | ✅  | ✅     |
| DOM-based actions        | ❌  | ✅  | ✅     |
| Coordinate-based actions | ✅  | ❌  | ✅     |
| Visual cursor highlight  | ✅  | ❌  | ✅     |

### Computer Use Agents

You can use specialized computer use models from Google, OpenAI, Anthropic, or Microsoft as shown below, with `mode` set to `"cua"`. To compare the performance of different computer use models, you can visit our [evals page](https://www.stagehand.dev/agent-evals).

<Warning>
**Deprecation Notice:** The `cua: true` option is deprecated and will be removed in a future version. Use `mode: "cua"` instead.
</Warning>

<CodeGroup>
```typescript Google
const agent = stagehand.agent({
    mode: "cua",
    model: {
        modelName: "google/gemini-2.5-computer-use-preview-10-2025",
        apiKey: process.env.GOOGLE_GENERATIVE_AI_API_KEY
    },
    systemPrompt: "You are a helpful assistant...",
});

await agent.execute({
    instruction: "Go to Hacker News and find the most controversial post from today, then read the top 3 comments and summarize the debate.",
    maxSteps: 20,
    highlightCursor: true
})
```

```typescript OpenAI
const agent = stagehand.agent({
    mode: "cua",
    model: {
        modelName: "openai/computer-use-preview",
        apiKey: process.env.OPENAI_API_KEY
    },
    systemPrompt: "You are a helpful assistant...",
});

await agent.execute({
    instruction: "Go to Hacker News and find the most controversial post from today, then read the top 3 comments and summarize the debate.",
    maxSteps: 20,
    highlightCursor: true
})
```
```typescript Anthropic
const agent = stagehand.agent({
    mode: "cua",
    model: {
        modelName: "anthropic/claude-sonnet-4-20250514",
        apiKey: process.env.ANTHROPIC_API_KEY
    },
    systemPrompt: "You are a helpful assistant...",
});

await agent.execute({
    instruction: "Go to Hacker News and find the most controversial post from today, then read the top 3 comments and summarize the debate.",
    maxSteps: 20,
    highlightCursor: true
})
```
</CodeGroup>

<Callout icon="code" color="#6ec202" iconType="regular">View or run the example template [here](https://www.browserbase.com/templates/gemini-cua)</Callout>

### Use Stagehand Agent with Any LLM

Use the agent without specifying a provider to utilize any model or LLM provider:

<Note>Non-CUA agents are currently only supported in TypeScript.</Note>

```typescript TypeScript
const agent = stagehand.agent();
await agent.execute("apply for a job at Browserbase")
```
<Card title="Available Agent Models" icon="robot" href="/v3/configuration/models#agent-models-with-cua-support">
  Check out the guide on how to use different models with Stagehand Agent.
</Card>

### Hybrid Mode

Both DOM and CUA modes have their strengths and weaknesses. Hybrid mode combines them, giving the agent access to both coordinate-based and DOM-based tools to better account for where each may fall short.

<Warning>
**Model Requirements:** Hybrid mode requires models that can reliably perform coordinate-based actions from screenshots. The following models are recommended:
- **Google:** `google/gemini-3-flash-preview`
- **Anthropic:** `anthropic/claude-sonnet-4-20250514`, `anthropic/claude-sonnet-4-5-20250929`, `anthropic/claude-haiku-4-5-20251001`

Other models may not reliably produce accurate coordinates for clicking and typing.

</Warning>

<Note>Hybrid mode requires `experimental: true` in your Stagehand constructor.</Note>

<CodeGroup>
```typescript Hybrid Mode with Google
const stagehand = new Stagehand({
  env: "BROWSERBASE",
  experimental: true, // Required for hybrid mode
});
await stagehand.init();

const agent = stagehand.agent({
  mode: "hybrid",
  model: "google/gemini-3-flash-preview",
});

const page = stagehand.context.pages()[0];
await page.goto("https://example.com");

await agent.execute({
  instruction: "Click the sign up button and fill out the registration form",
  maxSteps: 20,
});
```

```typescript Hybrid Mode with Anthropic
const stagehand = new Stagehand({
  env: "BROWSERBASE",
  experimental: true, // Required for hybrid mode
});
await stagehand.init();

const agent = stagehand.agent({
  mode: "hybrid",
  model: "anthropic/claude-haiku-4-5-20251001",
  systemPrompt: "You are a helpful assistant that interacts with web pages visually.",
});

await agent.execute({
  instruction: "Navigate the page and interact with the form elements",
  maxSteps: 15,
  highlightCursor: true, // Enabled by default in hybrid mode
});
```
</CodeGroup>

### Return value of `agent()`

When you call `agent.execute()`, Stagehand returns a `Promise<AgentResult>` with the following structure:

```typescript
{
  success: true,
  message: "The first name and email fields have been filled successfully with 'John' and 'john@example.com'.",
  actions: [
    {
      type: 'ariaTree',
      reasoning: undefined,
      taskCompleted: true,
      pageUrl: 'https://example.com',
      timestamp: 1761598722055
    },
    {
      type: 'act',
      reasoning: undefined,
      taskCompleted: true,
      action: 'type "John" into the First Name textbox',
      playwrightArguments: {...},
      pageUrl: 'https://example.com',
      timestamp: 1761598731643
    },
    {
      type: 'close',
      reasoning: "The first name and email fields have been filled successfully.",
      taskCompleted: true,
      taskComplete: true,
      pageUrl: 'https://example.com',
      timestamp: 1761598732861
    }
  ],
  completed: true,
  // Only populated when `output` schema is provided (DOM/Hybrid modes only)
  output: {
    price: "$199",
    airline: "Delta"
  },
  usage: {
    input_tokens: 2040,
    output_tokens: 28,
    reasoning_tokens: 12,
    cached_input_tokens: 0,
    inference_time_ms: 14079
  }
}
```

## Customizing Agent Tools

Stagehand agents come with built-in tools for browser automation, but you can customize the toolset by adding your own custom tools or excluding built-in ones.

### Adding Custom Tools

Custom tools enhance agents with additional capabilities for more granular control and better performance. Unlike MCP integrations, custom tools are defined inline and execute directly within your application.

<Note>Custom tools provide a cleaner, more performant alternative to MCP integrations when you need specific functionality.</Note>

#### Defining Custom Tools

Use the `tool` helper exported from `@browserbasehq/stagehand` to define custom tools:

<CodeGroup>
```typescript Basic Tool
import { tool } from "@browserbasehq/stagehand";
import { z } from "zod";

const agent = stagehand.agent({
  model: "openai/gpt-5",
  tools: {
    getWeather: tool({
      description: 'Get the current weather in a location',
      inputSchema: z.object({
        location: z.string().describe('The location to get weather for'),
      }),
      execute: async ({ location }) => {
        // Your custom logic here
        const weather = await fetchWeatherAPI(location);
        return {
          location,
          temperature: weather.temp,
          conditions: weather.conditions,
        };
      },
    }),
  },
  systemPrompt: 'You are a helpful assistant with access to weather data.',
});

await agent.execute("What's the weather in San Francisco and should I bring an umbrella?");
```

```typescript Multiple Tools
import { tool } from "@browserbasehq/stagehand";
import { z } from "zod";

const agent = stagehand.agent({
  mode: "cua",
  model: "anthropic/claude-sonnet-4-20250514",
  tools: {
    searchDatabase: tool({
      description: 'Search for records in the database',
      inputSchema: z.object({
        query: z.string().describe('The search query'),
        limit: z.number().optional().describe('Max results to return'),
      }),
      execute: async ({ query, limit = 10 }) => {
        const results = await db.search(query, limit);
        return { results };
      },
    }),

    calculatePrice: tool({
      description: 'Calculate the total price with tax',
      inputSchema: z.object({
        amount: z.number().describe('The base amount'),
        taxRate: z.number().describe('Tax rate as decimal (e.g., 0.08 for 8%)'),
      }),
      execute: async ({ amount, taxRate }) => {
        const total = amount * (1 + taxRate);
        return { total: total.toFixed(2) };
      },
    }),
  },
});

await agent.execute("Find products under $50 and calculate the total with 8% tax");
```

```typescript Tool with API Integration
import { tool } from "@browserbasehq/stagehand";
import { z } from "zod";

const agent = stagehand.agent({
  model: "google/gemini-2.0-flash",
  tools: {
    sendEmail: tool({
      description: 'Send an email via SendGrid',
      inputSchema: z.object({
        to: z.string().email().describe('Recipient email address'),
        subject: z.string().describe('Email subject'),
        body: z.string().describe('Email body content'),
      }),
      execute: async ({ to, subject, body }) => {
        const response = await fetch('https://api.sendgrid.com/v3/mail/send', {
          method: 'POST',
          headers: {
            'Authorization': `Bearer ${process.env.SENDGRID_API_KEY}`,
            'Content-Type': 'application/json',
          },
          body: JSON.stringify({
            personalizations: [{ to: [{ email: to }] }],
            from: { email: 'noreply@example.com' },
            subject,
            content: [{ type: 'text/plain', value: body }],
          }),
        });

        return {
          sent: response.ok,
          messageId: response.headers.get('X-Message-Id'),
        };
      },
    }),
  },
});

await agent.execute("Fill out the contact form and send me a confirmation email at user@example.com");
```
</CodeGroup>

#### Custom Tools vs MCP Integrations

| Custom Tools                           | MCP Integrations                        |
|----------------------------------------|-----------------------------------------|
| Defined inline with your code          | Connect to external services            |
| Direct function execution              | Standard protocol                       |
| Better performance & optimized context | Reusable across applications            |
| Type-safe with TypeScript              | Access to pre-built integrations        |
| Granular control                       | Network-based communication             |

<Tip>
Use custom tools when you need specific functionality within your application. Use MCP integrations when connecting to external services or when you need standardized cross-application tools.
</Tip>

### Excluding Built-in Tools

Prevent the agent from using specific built-in tools during execution. This is useful when you want to restrict the agent's capabilities or avoid certain behaviors.

<Note>**Non-CUA agents only.** Requires `experimental: true`. Not available with `mode: "cua"`.</Note>

#### Basic Usage

```typescript
const stagehand = new Stagehand({
  env: "LOCAL",
  experimental: true, // Required for excludeTools
});
await stagehand.init();

const agent = stagehand.agent({
  model: "anthropic/claude-sonnet-4-5-20250929",
});

const page = stagehand.context.pages()[0];
await page.goto("https://example.com");

// Exclude screenshot and extract tools
const result = await agent.execute({
  instruction: "Navigate through the website and click the submit button",
  maxSteps: 15,
  excludeTools: ["screenshot", "extract"],
});
```

#### Available Tools by Mode

The tools you can exclude depend on the agent mode:

<Tabs>
<Tab title="DOM Mode (default)">

| Tool | Description |
|------|-------------|
| `act` | Perform semantic actions (click, type, etc.) |
| `fillForm` | Fill form fields using DOM selectors |
| `ariaTree` | Get accessibility tree of the page |
| `extract` | Extract structured data from page |
| `goto` | Navigate to a URL |
| `scroll` | Scroll using semantic directions (up/down/left/right) |
| `keys` | Press keyboard keys |
| `navback` | Navigate back in history |
| `screenshot` | Take a screenshot |
| `think` | Agent reasoning/planning step |
| `wait` | Wait for time or condition |
| `search` | Web search (requires `useSearch: true` and `BROWSERBASE_API_KEY`) |

</Tab>

<Tab title="Hybrid Mode">

| Tool | Description |
|------|-------------|
| `click` | Click at specific coordinates |
| `type` | Type text at coordinates |
| `dragAndDrop` | Drag from one point to another |
| `clickAndHold` | Click and hold at coordinates |
| `fillFormVision` | Fill forms using vision/coordinates |
| `act` | Perform semantic actions |
| `ariaTree` | Get accessibility tree |
| `extract` | Extract data from page |
| `goto` | Navigate to URL |
| `scroll` | Scroll using coordinates |
| `keys` | Press keyboard keys |
| `navback` | Navigate back |
| `screenshot` | Take screenshot |
| `think` | Agent reasoning step |
| `wait` | Wait for time/condition |
| `search` | Web search (requires `useSearch: true` and `BROWSERBASE_API_KEY`) |

</Tab>
</Tabs>

#### Use Cases

```typescript
// Prevent the agent from taking screenshots during execution
const result = await agent.execute({
  instruction: "Fill out the contact form",
  excludeTools: ["screenshot"],
});

// Prevent the agent from extracting data
const result = await agent.execute({
  instruction: "Click through the signup flow",
  excludeTools: ["extract"],
});

// Disable web search capability
const result = await agent.execute({
  instruction: "Find information on the current page",
  excludeTools: ["search"],
});
```

## Web Search

Enable the `search` tool by setting `useSearch: true` in `agent.execute()`. This gives the agent the ability to perform web searches using the Browserbase Search API, which is useful when the agent needs to find URLs or gather information before navigating.

<Note>Requires a valid Browserbase API key. Set `BROWSERBASE_API_KEY` in your environment, or pass `apiKey` in the Stagehand constructor.</Note>

```typescript
const result = await agent.execute({
  instruction: "Find the latest pricing for Browserbase",
  useSearch: true,
  maxSteps: 20,
});
```

## Variables

Use variables to pass sensitive data (like passwords, API keys, or personal information) to the agent without exposing the actual values to the LLM. The agent sees only variable names and descriptions, while the actual values are substituted at runtime.

<Note>**Non-CUA agents only.** Variables require `experimental: true` and are not available with Computer Use Agents.</Note>

### Basic Usage

```typescript
const stagehand = new Stagehand({
  env: "LOCAL",
  experimental: true, // Required for variables
});
await stagehand.init();

const agent = stagehand.agent({
  model: "anthropic/claude-sonnet-4-5-20250929",
});

const page = stagehand.context.pages()[0];
await page.goto("https://example.com/login");

const result = await agent.execute({
  instruction: "Log into the website using my credentials",
  maxSteps: 10,
  variables: {
    username: {
      value: "john@example.com",
      description: "The user's email address for login"
    },
    password: {
      value: process.env.USER_PASSWORD,
      description: "The user's password for login"
    }
  }
});
```

Variables use the same type as `act()`. You can pass simple values or rich objects with descriptions:

```typescript
// Simple values (same format as act)
variables: {
  username: "john@example.com",
  password: "secret123",
}

// Rich values with descriptions (helps the agent understand context)
variables: {
  username: { value: "john@example.com", description: "The login email" },
  password: { value: "secret123", description: "The login password" },
}
```

### How Variables Work

1. **LLM receives descriptions only**: The agent sees variable names and descriptions in its system prompt, but never the actual values
2. **Placeholder syntax**: The LLM uses `%variableName%` syntax when it needs to use a variable (e.g., "type %password% into the password field")
3. **Runtime substitution**: Actual values are substituted just before the action executes
4. **Secure logging**: Variable values are never logged or returned in tool outputs

### Supported Tools

Variables work with the following agent tools:

<Tabs>
<Tab title="DOM Mode">

| Tool | Usage |
|------|-------|
| `act` | Use `%variableName%` in the action description |
| `fillForm` | Use `%variableName%` in field values |

</Tab>

<Tab title="Hybrid Mode">

| Tool | Usage |
|------|-------|
| `type` | Use `%variableName%` in the text to type |
| `fillFormVision` | Use `%variableName%` in field values |
| `act` | Use `%variableName%` in the action description |

</Tab>
</Tabs>

### Cache Optimization

Variables are cache-friendly by design:
- Cache keys use only variable names, not values
- Changing variable values (e.g., different passwords) won't invalidate cached executions
- This enables efficient replay of the same workflow with different credentials

### Best Practices

<Tabs>
<Tab title="Do this">
```typescript
// Use variables for sensitive data
variables: {
  apiKey: {
    value: process.env.API_KEY,
    description: "API key for authentication"
  }
}
```
</Tab>

<Tab title="Don't do this">
```typescript
// Don't hardcode sensitive values in instructions
instruction: "Log in with password 'secret123'"
```
</Tab>
</Tabs>

<Tip>
Use descriptive names and descriptions for variables. The LLM relies on the description to understand when and how to use each variable.
</Tip>

## MCP Integrations

Agents can be enhanced with external tools and services through MCP (Model Context Protocol) integrations. This allows your agent to access external APIs and data sources beyond just browser interactions.

<CodeGroup>
```typescript Pass URL
const agent = stagehand.agent({
    mode: "cua",
    model: {
        modelName: "openai/computer-use-preview",
        apiKey: process.env.OPENAI_API_KEY
    },
    integrations: [
      `https://mcp.exa.ai/mcp?exaApiKey=${process.env.EXA_API_KEY}`,
    ],
    systemPrompt: `You have access to web search through Exa. Use it to find current information before browsing.`
});

await agent.execute("Search for the best headphones of 2025 and go through checkout for the top recommendation");
```

```typescript Create Connection
import { connectToMCPServer } from "@browserbasehq/stagehand";

const supabaseClient = await connectToMCPServer(
  `https://server.smithery.ai/@supabase-community/supabase-mcp/mcp?api_key=${process.env.SMITHERY_API_KEY}`
);

const agent = stagehand.agent({
    mode: "cua",
    model: {
        modelName: "openai/computer-use-preview",
        apiKey: process.env.OPENAI_API_KEY
    },
    integrations: [supabaseClient],
    systemPrompt: `You can interact with Supabase databases. Use these tools to store and retrieve data.`
});

await agent.execute("Search for restaurants and save the first result to the database");
```
</CodeGroup>

<Tip>
MCP integrations enable agents to be more powerful by combining browser automation with external APIs, databases, and services. The agent can intelligently decide when to use browser actions versus external tools.
</Tip>

## Streaming

Enable streaming mode to receive incremental responses from the agent. This is useful for building real-time UIs that show the agent's reasoning as it progresses.

<Warning>
**Non-CUA agents only.** Streaming, callbacks, abort signals, and message continuation are only available when using the standard agent (without `mode: "cua"`). These features are not supported with Computer Use Agents.
</Warning>

<Note>These are experimental features. Set `experimental: true` in your Stagehand constructor to enable them.</Note>

### Enabling Streaming Mode

Set `stream: true` in the agent configuration to enable streaming:

```typescript
const stagehand = new Stagehand({
  env: "LOCAL",
  experimental: true, // Required for streaming
});
await stagehand.init();

const agent = stagehand.agent({
  model: "anthropic/claude-sonnet-4-5-20250929",
  stream: true, // Enable streaming mode
});

const streamResult = await agent.execute({
  instruction: "Search for headphones on Amazon",
  maxSteps: 20,
});

// Stream the text output incrementally
for await (const delta of streamResult.textStream) {
  process.stdout.write(delta);
}

// Get the final result after streaming completes
const finalResult = await streamResult.result;
console.log("Completed:", finalResult.completed);
```

### Stream Properties

When streaming is enabled, `execute()` returns an `AgentStreamResult` with:

| Property | Type | Description |
|----------|------|-------------|
| `textStream` | `AsyncIterable<string>` | Incremental text output from the agent |
| `fullStream` | `AsyncIterable<StreamPart>` | All stream events including tool calls and messages |
| `result` | `Promise<AgentResult>` | Final result after streaming completes |

```typescript
// Stream everything (tool calls, messages, etc.)
for await (const event of streamResult.fullStream) {
  console.log(event);
}
```

## Callbacks

Callbacks let you hook into the agent's execution lifecycle to monitor progress, log events, or modify behavior.

<Note>**Non-CUA agents only.** Callbacks require `experimental: true` and are not available with Computer Use Agents.</Note>

### Available Callbacks

<Tabs>
<Tab title="Non-Streaming">

When `stream: false` (default), these callbacks are available:

| Callback | Description |
|----------|-------------|
| `prepareStep` | Called before each LLM step to modify settings |
| `onStepFinish` | Called when each step completes |

```typescript
const agent = stagehand.agent({
  model: "anthropic/claude-sonnet-4-5-20250929",
});

await agent.execute({
  instruction: "Fill out the contact form",
  maxSteps: 10,
  callbacks: {
    prepareStep: async (stepContext) => {
      console.log(`Starting step ${stepContext.stepNumber}`);
      return stepContext; // Return modified or original context
    },
    onStepFinish: async (event) => {
      console.log(`Step finished: ${event.finishReason}`);
      if (event.toolCalls) {
        for (const tc of event.toolCalls) {
          console.log(`Tool called: ${tc.toolName}`);
        }
      }
    },
  },
});
```

</Tab>

<Tab title="Streaming">

When `stream: true`, additional callbacks are available:

| Callback | Description |
|----------|-------------|
| `prepareStep` | Called before each LLM step to modify settings |
| `onStepFinish` | Called when each step completes |
| `onChunk` | Called for each stream chunk |
| `onFinish` | Called when streaming completes |
| `onError` | Called when an error occurs |
| `onAbort` | Called when the stream is aborted |

```typescript
const agent = stagehand.agent({
  model: "anthropic/claude-sonnet-4-5-20250929",
  stream: true,
});

const streamResult = await agent.execute({
  instruction: "Search for products",
  maxSteps: 15,
  callbacks: {
    onChunk: async (chunk) => {
      // Called for each incremental chunk
      console.log("Chunk received:", chunk);
    },
    onStepFinish: async (event) => {
      console.log(`Step completed: ${event.finishReason}`);
    },
    onFinish: (event) => {
      console.log("Stream finished!");
      console.log("Total steps:", event.steps.length);
    },
    onError: ({ error }) => {
      console.error("Stream error:", error);
    },
    onAbort: (event) => {
      console.log("Stream aborted after", event.steps.length, "steps");
    },
  },
});

// Don't forget to consume the stream
for await (const delta of streamResult.textStream) {
  process.stdout.write(delta);
}

await streamResult.result;
```

</Tab>
</Tabs>

<Warning>
Streaming-only callbacks (`onChunk`, `onFinish`, `onError`, `onAbort`) will throw an error if used without `stream: true`. If you need these callbacks, enable streaming in your agent configuration.
</Warning>

## Abort Signal

Cancel agent execution at any time using an `AbortSignal`. This is useful for implementing timeouts or allowing users to stop long-running tasks.

<Note>**Non-CUA agents only.** Abort signals require `experimental: true` and are not available with Computer Use Agents.</Note>

### Basic Usage

```typescript
const stagehand = new Stagehand({
  env: "LOCAL",
  experimental: true, // Required for abort signal
});
await stagehand.init();

const agent = stagehand.agent({
  model: "anthropic/claude-sonnet-4-5-20250929",
});

const controller = new AbortController();

// Set a 30 second timeout
setTimeout(() => controller.abort(), 30000);

try {
  const result = await agent.execute({
    instruction: "Complete a complex multi-step task",
    maxSteps: 50,
    signal: controller.signal,
  });
} catch (error) {
  if (error.name === "AgentAbortError") {
    console.log("Task was cancelled");
  }
}
```

### Abort with Streaming

Abort signals also work with streaming mode:

```typescript
const agent = stagehand.agent({
  model: "anthropic/claude-sonnet-4-5-20250929",
  stream: true,
});

const controller = new AbortController();

const streamResult = await agent.execute({
  instruction: "Describe every element on the page",
  maxSteps: 50,
  signal: controller.signal,
  callbacks: {
    onAbort: (event) => {
      console.log(`Aborted after ${event.steps.length} steps`);
    },
  },
});

// Abort after receiving 10 chunks
let chunkCount = 0;
for await (const delta of streamResult.textStream) {
  process.stdout.write(delta);
  chunkCount++;
  if (chunkCount >= 10) {
    controller.abort();
    break;
  }
}

// The result promise will reject with AgentAbortError
try {
  await streamResult.result;
} catch (error) {
  console.log("Stream was aborted:", error.message);
}
```

### Custom Abort Reasons

You can pass a reason when aborting:

```typescript
controller.abort("User cancelled the operation");

// The error message will include your reason
// Error: "User cancelled the operation"
```

## Message Continuation

Continue a conversation across multiple agent executions by passing the `messages` from a previous result. This is useful for multi-turn interactions or breaking complex tasks into steps while maintaining context.

<Note>**Non-CUA agents only.** Message continuation requires `experimental: true` and is not available with Computer Use Agents.</Note>

### Basic Continuation

```typescript
const stagehand = new Stagehand({
  env: "LOCAL",
  experimental: true, // Required for message continuation
});
await stagehand.init();

const agent = stagehand.agent({
  model: "anthropic/claude-sonnet-4-5-20250929",
});

const page = stagehand.context.pages()[0];
await page.goto("https://example.com/products");

// First execution: search for products
const firstResult = await agent.execute({
  instruction: "Search for wireless headphones and note the top 3 results",
  maxSteps: 10,
});

console.log("First task:", firstResult.message);

// Continue with the same context: ask follow-up
const secondResult = await agent.execute({
  instruction: "Now filter by price under $100 and tell me which of those 3 are still available",
  maxSteps: 10,
  messages: firstResult.messages, // Pass previous conversation
});

console.log("Follow-up:", secondResult.message);

// Continue further: take action based on conversation history
const thirdResult = await agent.execute({
  instruction: "Add the cheapest one to the cart",
  maxSteps: 10,
  messages: secondResult.messages, // Chain the conversation
});

console.log("Final action:", thirdResult.message);
```

## Structured Output

Define a Zod schema to receive structured data when the agent completes its task. This is useful when you need specific information extracted from the agent's execution, such as prices, dates, or other structured data.

<Note>**Non-CUA agents only.** Structured output requires `experimental: true` and is not available with Computer Use Agents.</Note>

<Tip>Use `.describe()` on schema fields to help the agent understand what data to extract.</Tip>

<CodeGroup>
```typescript Basic Usage
import { z } from "zod";

const stagehand = new Stagehand({
  env: "LOCAL",
  experimental: true, // Required for structured output
});
await stagehand.init();

const agent = stagehand.agent({
  model: "anthropic/claude-sonnet-4-5-20250929",
});

const page = stagehand.context.pages()[0];
await page.goto("https://www.google.com/flights");

const result = await agent.execute({
  instruction: "Find the cheapest flight from NYC to LA for next week",
  maxSteps: 20,
  output: z.object({
    price: z.string().describe("The price of the flight"),
    airline: z.string().describe("The airline name"),
    departureTime: z.string().describe("Departure time"),
    arrivalTime: z.string().describe("Arrival time"),
  }),
});

// Access the structured output
console.log(result.output);
// { price: "$199", airline: "Delta", departureTime: "8:00 AM", arrivalTime: "11:30 AM" }
```

```typescript Complex Schema
const result = await agent.execute({
  instruction: "Extract all items from the shopping cart",
  output: z.object({
    items: z.array(z.object({
      name: z.string().describe("Product name"),
      quantity: z.number().describe("Quantity in cart"),
      unitPrice: z.string().describe("Price per item"),
      totalPrice: z.string().describe("Total price for this item"),
    })).describe("List of items in the cart"),
    subtotal: z.string().describe("Cart subtotal before tax"),
    tax: z.string().optional().describe("Tax amount if shown"),
    total: z.string().describe("Final total"),
  }),
});

console.log(`Found ${result.output?.items.length} items in cart`);
console.log(`Total: ${result.output?.total}`);
```

```typescript With Streaming
const agent = stagehand.agent({
  model: "anthropic/claude-sonnet-4-5-20250929",
  stream: true,
});

const streamResult = await agent.execute({
  instruction: "Find the top 3 search results",
  output: z.object({
    results: z.array(z.object({
      title: z.string().describe("The title of the search result"),
      url: z.string().url().describe("The URL of the search result"),
      snippet: z.string().describe("A brief description or snippet"),
    })).max(3).describe("Top 3 search results"),
  }),
});

// Stream the text output
for await (const delta of streamResult.textStream) {
  process.stdout.write(delta);
}

// Get the structured output from the final result
const finalResult = await streamResult.result;
console.log(finalResult.output?.results);
```
</CodeGroup>

## Agent Execution Configuration

<Warning>
Stagehand uses a 1288x711 viewport by default. Other viewport sizes may reduce performance. If you need to modify the viewport, you can change it in the [Browser Configuration](/v3/configuration/browser).
</Warning>

Control the maximum number of steps the agent can take to complete the task using the `maxSteps` parameter.

<CodeGroup>
```typescript TypeScript
// Set maxSteps to control how many actions the agent can take
await agent.execute({
  instruction: "Sign me up for a library card",
  maxSteps: 15 // Agent will stop after 15 steps if task isn't complete
});
```

For complex tasks, increase the `maxSteps` limit and check task success.

```typescript
// Complex multi-step task requiring more actions
const result = await agent.execute({
  instruction: "Find and apply for software engineering jobs, filtering by remote work and saving 3 applications",
  maxSteps: 30, // Higher limit for complex workflows
});

// Check if the task completed successfully
if (result.success === true) {
  console.log("Task completed successfully!");
} else {
  console.log("Task failed or was incomplete");
}
```
</CodeGroup>

## Best Practices

Following these best practices will improve your agent's success rate, reduce execution time, and minimize unexpected errors during task completion.

### Start on the Right Page
Navigate to your target page before executing tasks:

<Tabs>
<Tab title="Do this">
```typescript
await page.goto('https://github.com/browserbase/stagehand');
await agent.execute('Get me the latest PR on the stagehand repo');
```
</Tab>

<Tab title="Don't do this">
```typescript
await agent.execute('Go to GitHub and find the latest PR on browserbase/stagehand');
```
</Tab>
</Tabs>


### Be Specific
Provide detailed instructions for better results:

<Tabs>
<Tab title="Do this">
```typescript
await agent.execute("Find Italian restaurants in Brooklyn that are open after 10pm and have outdoor seating");
```
</Tab>

<Tab title="Don't do this">
```typescript
await agent.execute("Find a restaurant");
```
</Tab>
</Tabs>

## Troubleshooting

<AccordionGroup>


<Accordion title="Agent is stopping before completing the task">
**Problem**: Agent stops before finishing the requested task

**Solutions**:
- Check if the agent is hitting the maxSteps limit (default is 20)
- Increase maxSteps for complex tasks: `maxSteps: 30` or higher
- Break very complex tasks into smaller sequential executions

```typescript
// Increase maxSteps for complex tasks
await agent.execute({
  instruction: "Complete the multi-page registration form with all required information",
  maxSteps: 40 // Increased limit for complex task
});

// Or break into smaller tasks with success checking
const firstResult = await agent.execute({
  instruction: "Fill out page 1 of the registration form", 
  maxSteps: 15
});

// Only proceed if the first task was successful
if (firstResult.success === true) {
  await agent.execute({
    instruction: "Navigate to page 2 and complete remaining fields",
    maxSteps: 15
  });
} else {
  console.log("First task failed, stopping execution");
}
```
</Accordion>

<Accordion title="Agent is failing to click the proper elements">
**Problem**: Agent clicks on wrong elements or fails to interact with the correct UI components

**Solutions**:
- Ensure proper viewport size: Stagehand uses `1288x711` by default (optimal for Computer Use models)
- Avoid changing viewport dimensions as other sizes may reduce performance
</Accordion>


</AccordionGroup>


## Next steps

<CardGroup cols={2}>
<Card title="Act" icon="play" href="/v3/basics/act">
  Execute actions efficiently using observe results
</Card>

<Card title="Extract" icon="download" href="/v3/basics/extract">
  Extract structured data from observed elements
</Card>
</CardGroup>

================================================
FILE: packages/docs/v3/basics/evals.mdx
================================================
---
title: Evaluations & Metrics
sidebarTitle: Evals
description: Monitor performance, optimize costs, and evaluate LLM effectiveness
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


Evaluations help you understand how well your automation performs, which models work best for your use cases, and how to optimize for cost and reliability. This guide covers both monitoring your own workflows and running comprehensive evaluations.

## Why Evaluations Matter

- **Performance Optimization**: Identify which models and settings work best for your specific automation tasks
- **Cost Control**: Track token usage and inference time to optimize spending
- **Reliability**: Measure success rates and identify failure patterns
- **Model Selection**: Compare different LLMs on real-world tasks to make informed decisions

<Card
  title="Live Model Comparisons"
  icon="scale-balanced"
  href="https://www.stagehand.dev/evals"
>
  View real-time performance comparisons across different LLMs on the [Stagehand Evals Dashboard](https://www.stagehand.dev/evals)
</Card>

## Comprehensive Evaluations

Evaluations help you systematically test and improve your automation workflows. Stagehand provides both built-in evaluations and tools to create your own.

### Evals CLI
![Evals CLI](/media/evals-cli.png)

<Tip>
To run evals, you'll need to clone the [Stagehand repo](https://github.com/browserbase/stagehand) and set up the CLI.

We recommend using [Braintrust](https://www.braintrust.dev/docs/) to help visualize evals results and metrics.
</Tip>

The Stagehand CLI provides a powerful interface for running evaluations. You can run specific evals, categories, or external benchmarks with customizable settings.

Evals are grouped into:
1. **Act Evals** - These are evals that test the functionality of the `act` method.
2. **Extract Evals** - These are evals that test the functionality of the `extract` method.
3. **Observe Evals** - These are evals that test the functionality of the `observe` method.
4. **Combination Evals** - These are evals that test the functionality of the `act`, `extract`, and `observe` methods together.
5. **Experimental Evals** - These are experimental custom evals that test the functionality of the stagehand primitives.
6. **Agent Evals** - These are evals that test the functionality of `agent`.
7. **(NEW) External Benchmarks** - Run external benchmarks like WebBench, GAIA, WebVoyager, OnlineMind2Web, and OSWorld.

#### Installation

<Steps> 
<Step title="Install Dependencies">
```bash
# From the stagehand root directory
pnpm install
```
</Step>

<Step title="Build the CLI">
```bash
pnpm run build:cli
```
</Step>

<Step title="Verify Installation">
```bash
evals help
```
</Step>
</Steps>

#### CLI Commands and Options

##### Basic Commands

```bash
# Run all evals
evals run all

# Run specific category
evals run act
evals run extract
evals run observe
evals run agent

# Run specific eval
evals run extract/extract_text

# List available evals
evals list
evals list --detailed

# Configure defaults
evals config
evals config set env browserbase
evals config set trials 5
```

##### Command Options

- **`-e, --env`**: Environment (`local` or `browserbase`)
- **`-t, --trials`**: Number of trials per eval (default: 3)
- **`-c, --concurrency`**: Max parallel sessions (default: 10)
- **`-m, --model`**: Model override
- **`-p, --provider`**: Provider override
- **`--api`**: Use Stagehand API instead of SDK

##### Running External Benchmarks

The CLI supports several industry-standard benchmarks:

```bash
# WebBench with filters
evals run benchmark:webbench -l 10 -f difficulty=easy -f category=READ

# GAIA benchmark
evals run b:gaia -s 100 -l 25 -f level=1

# WebVoyager
evals run b:webvoyager -l 50

# OnlineMind2Web
evals run b:onlineMind2Web

# OSWorld
evals run b:osworld -f source=Mind2Web
```

#### Configuration Files

You can view the specific evals in [`evals/tasks`](https://github.com/browserbase/stagehand/tree/main/packages/evals/tasks). Each eval is grouped into eval categories based on [`evals/evals.config.json`](https://github.com/browserbase/stagehand/blob/main/packages/evals/evals.config.json).


#### Viewing eval results
![Eval results](/images/evals.png)

Eval results are viewable on Braintrust. You can view the results of a specific eval by going to the Braintrust URL specified in the terminal when you run `npm run evals`.

By default, each eval will run five times per model. The "Exact Match" column shows the percentage of times the eval was correct. The "Error Rate" column shows the percentage of times the eval errored out.

You can use the Braintrust UI to filter by model/eval and aggregate results across all evals.

## Creating Custom Evaluations

### Step-by-Step Guide

<Steps>
<Step title="Create Evaluation File">
Create a new file in `evals/tasks/your-eval.ts`:

```typescript
import { EvalTask } from '../types';

export const customEvalTask: EvalTask = {
  name: 'custom_task_name',
  description: 'Test specific automation workflow',
  
  // Test setup
  setup: async ({ page }) => {
    await page.goto('https://example.com');
  },
  
  // The actual test
  task: async ({ stagehand, page }) => {
    // Your automation logic
    await stagehand.act({ action: 'click the login button' });
    const result = await stagehand.extract({ 
      instruction: 'Get the user name',
      schema: { username: 'string' }
    });
    return result;
  },
  
  // Validation
  validate: (result, expected) => {
    return result.username === expected.username;
  },
  
  // Test cases
  testCases: [
    {
      input: { /* test input */ },
      expected: { username: 'john_doe' }
    }
  ],
  
  // Evaluation criteria
  scoring: {
    exactMatch: true,
    timeout: 30000,
    retries: 2
  }
};
```
</Step>

<Step title="Add to Configuration">
Update `evals/evals.config.json`:

```json
{
  "categories": {
    "custom": ["custom_task_name"],
    "existing_category": ["custom_task_name"]
  }
}
```
</Step>

<Step title="Run Your Evaluation">
```bash
# Test your custom evaluation
evals run custom_task_name

# Run the entire custom category
evals run custom

# Run with specific settings
evals run custom_task_name -e browserbase -t 5 -m gpt-4o
```
</Step>
</Steps>


## Best Practices for Custom Evals

<AccordionGroup>
<Accordion title="Test Design Principles">
- **Atomic**: Each test should validate one specific capability
- **Deterministic**: Tests should produce consistent, measurable results
- **Realistic**: Use real-world scenarios and websites
- **Measurable**: Define clear success/failure criteria
</Accordion>

<Accordion title="Performance Optimization">
- **Parallel Execution**: Design tests to run independently
- **Resource Management**: Clean up after each test
- **Timeout Handling**: Set appropriate timeouts for operations
- **Error Recovery**: Handle failures gracefully
</Accordion>

<Accordion title="Data Quality">
- **Ground Truth**: Establish reliable expected outcomes
- **Edge Cases**: Test boundary conditions and error scenarios
- **Statistical Significance**: Run multiple iterations for reliability
- **Version Control**: Track changes to test cases over time
</Accordion>
</AccordionGroup>

### Troubleshooting Evaluations
<AccordionGroup>
<Accordion title="Evaluation Timeouts">
**Symptoms**: Tests fail with timeout errors

**Solutions**:
- Increase timeout in `taskConfig.ts`
- Use faster models (Gemini 2.5 Flash, Claude Haiku 4.5)
- Optimize test scenarios to be less complex
- Check network connectivity to LLM providers
</Accordion>

<Accordion title="Inconsistent Results">
**Symptoms**: Same test passes/fails randomly

**Solutions**:
- Set temperature to 0 for deterministic outputs
- Increase repetitions for statistical significance
- Use more capable models for complex tasks
- Check for dynamic website content affecting tests
</Accordion>

<Accordion title="High Evaluation Costs">
**Symptoms**: Token usage exceeding budget

**Solutions**:
- Use cost-effective models (Gemini 2.5 Flash, Claude Haiku 4.5)
- Reduce repetitions for initial testing
- Focus on specific evaluation categories
- Use local browser environment to reduce Browserbase costs
</Accordion>

<Accordion title="Braintrust Integration Issues">
**Symptoms**: Results not uploading to dashboard

**Solutions**:
- Check Braintrust API key configuration
- Verify internet connectivity
- Update Braintrust SDK to latest version
- Check project permissions in Braintrust dashboard
</Accordion>
</AccordionGroup>

================================================
FILE: packages/docs/v3/basics/extract.mdx
================================================
---
title: Extract
description: Extract structured data from a webpage
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


## What is `extract()`?

```typescript
await stagehand.extract("extract the name of the repository");
```

`extract()` grabs structured data from a webpage. You can define your schema with [Zod](https://github.com/colinhacks/zod) (TypeScript) or JSON. If you don't want to define a schema, you can also call `extract` with just a [natural language prompt](#instruction-only), or call `extract` [with no parameters](#no-parameters).

## Why use `extract()`?

<CardGroup cols={2}>
  <Card title="Structured" icon="brackets-curly" href="#basic-schema">
    Turn messy webpage data into clean objects that follow a schema.
  </Card>
  <Card title="Resilient" icon="dumbbell" href="#extract-with-context">
    Build resilient extractions that don't break when the website changes.
  </Card>
</CardGroup>

## Return value

When you use `extract()`, Stagehand will return a `Promise<ExtractResult>` with the following structure:
<Tabs>
<Tab title="Basic Schema">

When extracting with a schema, the return type is inferred from your Zod schema:

```typescript
const result = await stagehand.extract(
  "extract product details",
  z.object({
    name: z.string(),
    price: z.number(),
    inStock: z.boolean()
  })
);
```

**Example result:**
```typescript
{
  name: "Wireless Mouse",
  price: 29.99,
  inStock: true
}
```

</Tab>
<Tab title="Array">

When extracting an array, you get an array of objects:

```typescript
const apartments = await stagehand.extract(
  "extract all apartment listings",
  z.array(
    z.object({
      address: z.string(),
      price: z.string(),
      sqft: z.number()
    })
  )
);
```

**Example result:**
```typescript
[
  {
    address: "123 Main St",
    price: "$1,200/mo",
    sqft: 750
  },
  {
    address: "456 Oak Ave",
    price: "$1,500/mo",
    sqft: 900
  }
]
```

</Tab>
<Tab title="Primitive">

When extracting a single primitive value:

```typescript
const price = await stagehand.extract(
  "extract the price",
  z.number()
);
```

**Example result:**
```typescript
19.99
```

You can also extract strings, booleans, etc.:

```typescript
const url = await stagehand.extract(
  "extract the contact page link",
  z.string().url()
);
```

</Tab>
<Tab title="Instruction Only">

When calling with just an instruction (no schema):

```typescript
const result = await stagehand.extract("extract the repository name");
```

**Example result:**
```typescript
{
  extraction: "stagehand"
}
```

</Tab>
<Tab title="No Parameters">

When calling with no parameters:

```typescript
const result = await stagehand.extract();
```

**Example result:**
```typescript
{
  pageText: "Accessibility Tree:\n[0-2] RootWebArea: Page Title\n  [0-37] scrollable\n    [0-118] body\n      ..."
}
```

This returns the accessibility tree representation of the page without LLM processing.

</Tab>
</Tabs>

## Advanced Configuration

You can pass additional options to configure the model, timeout, and selector scope:
```typescript
const result = await stagehand.extract("extract the repository name", {
  model: "anthropic/claude-sonnet-4-5",
  timeout: 30000,
  selector: "//header" // Focus on specific area
});
```

### Server-side Caching

<Note>
`serverCache` only works when running with `env: "BROWSERBASE"`. It has no effect in local environments.
</Note>

When running on Browserbase, Stagehand automatically caches `extract()` results server-side. Repeated calls with the same inputs return instantly without consuming LLM tokens. Caching is enabled by default and can be controlled globally on the constructor or overridden per call:

```typescript
// Disable server-side caching for the entire instance
const stagehand = new Stagehand({
  env: "BROWSERBASE",
  serverCache: false,
});

// Or disable it for a single call
const data = await stagehand.extract("extract the repository name", { serverCache: false });

// Check whether a result was served from cache
const result = await stagehand.extract("extract the page title");
console.log(result.cacheStatus); // "HIT" or "MISS"
```

### Targeted Extract

Pass a selector to `extract` to target a specific element on the page.
<Tip>
This helps reduce the context passed to the LLM, optimizing token usage/speed and improving accuracy.
</Tip>
```typescript
const tableData = await stagehand.extract(
  "Extract the values of the third row",
  z.object({
    values: z.array(z.string())
  }),
  {
    // XPath or CSS selector
    selector: "xpath=/html/body/div/table"
  }
);
```


## Best practices


### Extract with Context

You can provide additional context to your schema to help the model extract the data more accurately.

```typescript
const apartments = await stagehand.extract(
  "Extract ALL the apartment listings and their details, including address, price, and square feet.",
  z.array(
    z.object({
      address: z.string().describe("the address of the apartment"),
      price: z.string().describe("the price of the apartment"),
      square_feet: z.string().describe("the square footage of the apartment"),
    })
  )
);
```

### Link Extraction
<Note>
To extract links or URLs, define the relevant field as `z.string().url()`.
</Note>

Here is how an `extract` call might look for extracting a link or URL. This also works for image links.

```typescript
const contactLink = await stagehand.extract(
  "extract the link to the 'contact us' page",
  z.string().url() // note the usage of z.string().url() for URL validation
);

console.log("the link to the contact us page is: ", contactLink);
```

<Tip>
Inside Stagehand, extracting links works by asking the LLM to select an ID. Stagehand looks up that ID in a mapping of IDs -> URLs. When logging the LLM trace, you should expect to see IDs. The actual URLs will be included in the final `ExtractResult`.
</Tip>

## Troubleshooting

<AccordionGroup>
<Accordion title="Empty or partial results">
**Problem**: `extract()` returns empty or incomplete data

**Solutions**:
- **Check your instruction clarity**: Make sure your instruction is specific and describes exactly what data you want to extract
- **Verify the data exists**: Use `stagehand.observe()` first to confirm the data is present on the page
- **Wait for dynamic content**: If the page loads content dynamically, use `stagehand.act("wait for the content to load")` before extracting

**Solution: Wait for content before extracting**
```typescript
// Wait for content before extracting
await stagehand.act("wait for the product listings to load");
const products = await stagehand.extract(
  "extract all product names and prices",
  z.array(z.object({
    name: z.string(),
    price: z.string()
  }))
);
```
</Accordion>

<Accordion title="Schema validation errors">
**Problem**: Getting schema validation errors or type mismatches

**Solutions**:
- **Use optional fields**: Make fields optional with `z.optional()` if the data might not always be present
- **Use flexible types**: Consider using `z.string()` instead of `z.number()` for prices that might include currency symbols
- **Add descriptions**: Use `.describe()` to help the model understand field requirements

**Solution: More flexible schema**
```typescript
const schema = z.object({
  price: z.string().describe("price including currency symbol, e.g., '$19.99'"),
  availability: z.string().optional().describe("stock status if available"),
  rating: z.number().optional()
});
```
</Accordion>

<Accordion title="Inconsistent results">
**Problem**: Extraction results vary between runs

**Solutions**:
- **Be more specific in instructions**: Instead of "extract prices", use "extract the numerical price value for each item"
- **Use context in schema descriptions**: Add field descriptions to guide the model
- **Combine with observe**: Use `stagehand.observe()` to understand the page structure first

**Solution: Validate with observe first**
```typescript
// First observe to understand the page structure
const elements = await stagehand.observe("find all product listings");
console.log("Found elements:", elements.map(e => e.description));

// Then extract with specific targeting
const products = await stagehand.extract(
  "extract name and price from each product listing shown on the page",
  z.array(z.object({
    name: z.string().describe("the product title or name"),
    price: z.string().describe("the price as displayed, including currency")
  }))
);
```
</Accordion>

<Accordion title="Performance issues">
**Problem**: Extraction is slow or timing out

**Solutions**:
- **Reduce scope**: Extract smaller chunks of data in multiple calls rather than everything at once
- **Use targeted instructions**: Be specific about which part of the page to focus on
- **Consider pagination**: For large datasets, extract one page at a time
- **Increase timeout**: Pass a larger `timeout` (in milliseconds) in the options for complex extractions

**Solution: Break down large extractions**
```typescript
// Instead of extracting everything at once
const allData = [];
const pageNumbers = [1, 2, 3, 4, 5];

for (const pageNum of pageNumbers) {
  await stagehand.act(`navigate to page ${pageNum}`);

  const pageData = await stagehand.extract(
    "extract product data from the current page only",
    z.array(z.object({
      name: z.string(),
      price: z.number()
    })),
    { timeout: 60000 } // 60 second timeout
  );

  allData.push(...pageData);
}
```
</Accordion>
</AccordionGroup>

## Next steps

<CardGroup cols={2}>

  <Card title="Act" icon="play" href="/v3/basics/act">
    Execute actions efficiently
  </Card>

  <Card title="Observe" icon="magnifying-glass" href="/v3/basics/observe">
    Analyze pages and preview actions
  </Card>
</CardGroup>

================================================
FILE: packages/docs/v3/basics/observe.mdx
================================================
---
title: Observe
sidebarTitle: Observe
description: 'Discover and plan executable actions on any web page'
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


## What is `observe()`?

```typescript
await stagehand.observe("find the login button");
```

`observe()` discovers actionable elements on a page and returns structured actions you can execute or validate before acting. Use it to explore pages, plan multi-step workflows, cache actions, and validate elements before acting.

## Why use `observe()`?

<CardGroup cols={2}>
  <Card title="Explore" icon="compass" href="#using-observe">
    Discover what's possible on a page—find buttons, forms, links, and interactive elements
  </Card>
  <Card title="Plan" icon="map" href="#plan-then-execute">
    Map out multi-step workflows by discovering all required actions upfront
  </Card>
  <Card title="Cache" icon="database" href="/v3/best-practices/caching">
    Store discovered actions to skip LLM calls and speed up repeated workflows
  </Card>
  <Card title="Validate" icon="check" href="#validate-before-acting">
    Verify elements exist and check their properties before performing critical actions
  </Card>
</CardGroup>

## Using `observe()`

Use `observe()` to discover actionable elements on a page. Here's how to find a button:

```typescript
const page = stagehand.context.pages()[0];
await page.goto("https://example.com");
const actions = await stagehand.observe("find the learn more button");
```

<Note>
**iFrame and Shadow DOM Support** Stagehand automatically handles iFrame traversal and shadow DOM elements without requiring additional configuration.
</Note>

<Accordion title="Common use cases">

| Use Case | Example instruction |
|----------|---------------------|
| Find buttons | `find the submit button` |
| Locate forms | `find all input fields in the form` |
| Discover links | `find navigation links` |
| Identify tables | `find the pricing table` |
| Map workflows | `find all checkout steps` |
| Validate elements | `find the delete account button` |

</Accordion>


### Return value of `observe()`
When you use `observe()`, Stagehand will return a `Promise<Action[]>` with the following structure:
```typescript
[
  {
    description: 'Learn more button',
    method: 'click',
    arguments: [],
    selector: 'xpath=/html[1]/body[1]/shadow-demo[1]//div[1]/button[1]'
  }
]
```

<Tabs>
<Tab title="Do this">
Use specific, descriptive instructions.

```typescript
// Clear and specific
await stagehand.observe("find the primary call-to-action button in the hero section");
await stagehand.observe("find all input fields in the checkout form");
await stagehand.observe("find the delete account button in settings");
```
</Tab>

<Tab title="Don't do this">
Avoid vague or data-oriented queries.

```typescript
// Too vague
await stagehand.observe("find buttons");

// Use extract() for data instead
await stagehand.observe("what is the page title?");
```
</Tab>
</Tabs>

## Advanced Configuration

You can pass additional options to configure the model, timeout, and selector scope:

```typescript
// Custom model configuration
const actions = await stagehand.observe("find navigation links", {
  model: "openai/gpt-4o",
  timeout: 30000,
  selector: "//header" // Focus on specific area
});
```

### Server-side Caching

<Note>
`serverCache` only works when running with `env: "BROWSERBASE"`. It has no effect in local environments.
</Note>

When running on Browserbase, Stagehand automatically caches `observe()` results server-side. Repeated calls with the same inputs return instantly without consuming LLM tokens. Caching is enabled by default and can be controlled globally on the constructor or overridden per call:

```typescript
// Disable server-side caching for the entire instance
const stagehand = new Stagehand({
  env: "BROWSERBASE",
  serverCache: false,
});

// Or disable it for a single call
const actions = await stagehand.observe("find the login button", { serverCache: false });
```

<Note>
  `observe()` does not currently expose a `cacheStatus` field. To check whether an `observe()` call was served from cache, use the [Browserbase session replay dashboard](https://docs.browserbase.com/features/observability#stagehand) or inspect the session logs.
</Note>

### Using with Custom Pages

You can use `observe()` with pages from other browser automation libraries like Puppeteer, Playwright, or Patchright by passing the `page` option:

```typescript
import { Stagehand } from "@browserbasehq/stagehand";
import puppeteer from "puppeteer-core";

const stagehand = new Stagehand({
  env: "BROWSERBASE",
});
await stagehand.init();

// Connect with Puppeteer
const browser = await puppeteer.connect({
  browserWSEndpoint: stagehand.connectURL(),
  defaultViewport: null,
});

const pages = await browser.pages();
const customPage = pages[0];

await customPage.goto("https://www.example.com/products");

// Use observe with the custom Puppeteer page
const actions = await stagehand.observe("find all product cards", {
  page: customPage
});
```

This works with:
- **Puppeteer**: Pass Puppeteer Page objects
- **Playwright**: Pass Playwright Page objects
- **Patchright**: Pass Patchright Page objects
- **Stagehand Context Pages**: Access pages via `stagehand.context.pages()` (default)

<Card title="Complete API Reference" icon="book" href="/v3/references/observe">
  See the full `observe()` reference for detailed parameter documentation, return values, and advanced examples.
</Card>

## Best practices

### Plan then execute

Discover all actions once, then execute without additional LLM calls. This approach is 2-3x faster than separate `act()` calls.

```typescript
const formFields = await stagehand.observe("find all form input fields");

for (const field of formFields) {
  await stagehand.act(field); // No LLM call
}
```

<Card title="Analyze pages with observe()" icon="magnifying-glass" href="/v3/references/observe">
  Complete guide to planning actions with `observe()`.
</Card>

### Scope extractions

Use `observe()` to narrow extraction scope and reduce token usage by up to 10x.

```typescript
const [table] = await stagehand.observe("find the pricing table");

const pricing = await stagehand.extract(
  "extract all pricing tiers",
  PricingSchema,
  { selector: table.selector }
);
```

<Card title="Extract structured data" icon="table" href="/v3/basics/extract">
  Learn how to use `observe()` with `extract()` for precise data extraction.
</Card>

### Validate before acting

Check elements exist and verify their properties before performing critical operations.

```typescript
const [deleteButton] = await stagehand.observe("find the delete account button");

if (deleteButton?.method === "click") {
  await stagehand.act(deleteButton);
} else {
  throw new Error("Delete button not found");
}
```

<Card title="Execute actions with act()" icon="play" href="/v3/basics/act">
  Learn how to execute observed actions reliably.
</Card>

### Cache observed actions

Store and reuse observed actions to eliminate redundant LLM calls. Build a simple cache:

```typescript
const actionCache = new Map<string, Action[]>();

async function cachedObserve(instruction: string) {
  if (actionCache.has(instruction)) {
    return actionCache.get(instruction)!;
  }

  const actions = await stagehand.observe(instruction);
  actionCache.set(instruction, actions);
  return actions;
}
```

<Card title="Complete caching guide" icon="database" href="/v3/best-practices/caching">
  Learn advanced caching techniques and patterns for optimal performance.
</Card>

## Troubleshooting

<AccordionGroup>

<Accordion title="No elements found">
**Problem**: `observe()` returns an empty array

**Solutions**:
- Verify the element exists on the page
- Use more specific instructions (e.g., "find the blue submit button" instead of "find button")
- Ensure page has fully loaded before calling `observe()`
- Enable verbose logging in Stagehand configuration to inspect detection behavior

```typescript
// Check page state before observing
const page = stagehand.context.pages()[0];
await page.waitForLoadState('domcontentloaded');

const actions = await stagehand.observe("find the submit button");

if (actions.length === 0) {
  console.log("No elements found, trying alternative instruction");
  const altActions = await stagehand.observe("find the button at the bottom of the form");
}
```
</Accordion>

<Accordion title="Inaccurate results">
**Problem**: Descriptions or selectors don't match actual elements

**Solutions**:
- Use more capable models—check [model evals](https://stagehand.dev/evals) for recommendations
- Provide more context in your instruction (e.g., "find the submit button in the checkout form")
- Enable verbose logging and `logInferenceToFile` in Stagehand configuration to inspect LLM reasoning

```typescript
// More specific instructions improve accuracy
// Instead of:
await stagehand.observe("find the button");

// Use context:
await stagehand.observe("find the red 'Delete' button in the user settings panel");
```
</Accordion>

<Accordion title="Wrong method suggested">
**Problem**: The `method` field has an unexpected value

**Solutions**:
- Validate the method before using it: `if (action.method === "click") { ... }`
- Check [supported actions](/v3/basics/act) for valid method names
- Override with a specific method when needed: `await stagehand.act({ ...action, method: "click" })`

```typescript
const [action] = await stagehand.observe("find the submit button");

// Validate method before acting
const validMethods = ["click", "fill", "type", "press"];
if (action && validMethods.includes(action.method || "")) {
  await stagehand.act(action);
} else {
  console.warn(`Unexpected method: ${action?.method}`);
}
```
</Accordion>

</AccordionGroup>

## Next steps

<CardGroup cols={2}>
  <Card title="Execute actions with act()" icon="play" href="/v3/basics/act">
    Use `act()` to execute discovered actions reliably.
  </Card>

  <Card title="Extract structured data" icon="table" href="/v3/basics/extract">
    Combine `observe()` with `extract()` for precise data extraction.
  </Card>

  <Card title="Caching actions" icon="bolt" href="/v3/best-practices/caching">
    Build action caches to eliminate redundant LLM calls.
  </Card>

  <Card title="Complete API Reference" icon="book" href="/v3/references/observe">
    Full `observe()` reference with detailed parameter documentation.
  </Card>
</CardGroup>


================================================
FILE: packages/docs/v3/best-practices/agent-fallbacks.mdx
================================================
---
title: Agent Fallbacks
description: "A failsafe when unexpected page changes add extra steps"
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


## When to use

Use an agent fallback as a failsafe when a one-step action unexpectedly becomes a multi-step flow.

## How it works

1. [`act()`](/v3/basics/act) is attempted for the direct action
2. If it fails, [`agent()`](/v3/basics/agent) figures out the new path
3. Agent completes all needed steps (open menu → click button)

### Example scenario

**Before**: Sign in button was in the header  
**After**: Sign in now requires: Click account menu → Click "Sign in" option

A single `act("click sign in")` can't handle this change. The agent fallback can discover and execute both steps.

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

try {
  await stagehand.act("click the 'Sign In' button");
} catch (err) {
  console.log("Agent fallback triggered");

  const agent = stagehand.agent({
    model: "anthropic/claude-sonnet-4-20250514",
    systemPrompt: "You are a helpful assistant that can use a web browser.",
  });

  const result = await agent.execute({
    instruction: "Find and click Sign In button",
    maxSteps: 10,
  });

  console.log(result.success ? "Agent fallback success" : "Agent fallback failed");

  if (!result.success) throw err;
}
```

See all available agent models on the [models page](/v3/configuration/models#agent-models-with-cua-support).


================================================
FILE: packages/docs/v3/best-practices/caching.mdx
================================================
---
title: Caching Actions
description: Cache actions automatically to reduce costs and improve performance
---

import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />

Stagehand supports two caching strategies to reduce LLM costs and speed up your automations: **Browserbase Cache** and **Local Cache**. They serve different use cases and can be used independently or together.

---

## Browserbase Cache

Browserbase Cache is a managed, server-side caching layer built into the Stagehand API. When you run Stagehand with `env: "BROWSERBASE"`, every `act()` call is automatically cached on Browserbase's servers. Repeated calls with the same inputs return instantly without consuming any LLM tokens. You don't need to configure anything to start benefiting.

The cache key is generated from the instruction, page content, and options you pass. On a cache hit, the response is returned directly from the server with no LLM inference and no token cost. You can inspect cache behavior via the `cacheStatus` field returned by `act()`. Check out the [Browserbase blog](https://www.browserbase.com/blog/stagehand-caching) for more details on how it works under the hood.

### Disabling on the Constructor

Pass `serverCache: false` to disable caching for all requests made by that instance:

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "BROWSERBASE",
  serverCache: false,
});

await stagehand.init();
const page = stagehand.context.pages()[0];

await page.goto("https://example.com");

// Cache is disabled, always hits the LLM
await stagehand.act("click the login button");
```

### Disabling per Call

Override the instance setting for a single call by passing `serverCache: false` in the options:

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({ env: "BROWSERBASE" }); // caching on by default

await stagehand.init();
const page = stagehand.context.pages()[0];
await page.goto("https://example.com");

// This call skips the cache
await stagehand.act("click the login button", { serverCache: false });

// This call uses the cache as normal
await stagehand.act("submit the form");
```

### Inspecting Cache Status

`act()` returns a `cacheStatus` field you can use to verify whether a result was served from cache:

```typescript
const actResult = await stagehand.act("click the login button");
console.log(actResult.cacheStatus); // "HIT" or "MISS"
```

### Limitations

- The page URL factors into the cache key. If the action is performed on a page with a dynamic URL, caching may not work as expected. We do filter out certain query parameters like referral trackers and analytics, but we don't catch everything just yet.
- If the page content or structure changes, the action won't get a cache `HIT` and the LLM will be called. That call creates a new cache entry, which subsequent identical actions will attempt to hit.

---

## Local Cache

Local Cache writes action results to your filesystem so they persist across script runs. It works in both `LOCAL` and `BROWSERBASE` environments. When you specify a `cacheDir`, Stagehand saves every action and agent step to a local file on first run, then replays those cached actions on subsequent runs with no LLM calls, no token cost, and no network round-trip to Browserbase.

This is especially useful for:

- **CI/CD pipelines** - commit your cache directory to version control for consistent, deterministic runs across environments
- **Local development** - iterate on automations without burning tokens on repeated runs
- **Cross-machine sharing** - cache files are portable and can be shared across machines

### Caching with `act()`

Cache actions from `act()` by specifying a cache directory in your Stagehand constructor.

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "BROWSERBASE",
  cacheDir: "act-cache", // Specify a cache directory
});

await stagehand.init();
const page = stagehand.context.pages()[0];

await page.goto("https://browserbase.github.io/stagehand-eval-sites/sites/iframe-same-proc-scroll/");

// First run: uses LLM inference and caches
// Subsequent runs: reuses cached action
await stagehand.act("scroll to the bottom of the iframe");

// Variables work with caching too
await stagehand.act("fill the username field with %username%", {
  variables: {
    username: "fakeUsername",
  },
});
```

### Caching with `agent()`

Cache agent actions (including Computer Use Agent actions) the same way. Just specify a `cacheDir`. The cache key is automatically generated based on the instruction, start URL, agent execution options, and agent configuration. Subsequent runs with the same parameters will reuse cached actions.

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "BROWSERBASE",
  cacheDir: "agent-cache", // Specify a cache directory
});

await stagehand.init();
const page = stagehand.context.pages()[0];

await page.goto("https://browserbase.github.io/stagehand-eval-sites/sites/drag-drop/");

const agent = stagehand.agent({
  mode: "cua",
  model: {
    modelName: "google/gemini-2.5-computer-use-preview-10-2025",
    apiKey: process.env.GOOGLE_GENERATIVE_AI_API_KEY
  },
  systemPrompt: "You are a helpful assistant that can use a web browser.",
});

await page.goto("https://play2048.co/");

// First run: uses LLM inference and caches
// Subsequent runs: reuses cached actions
const result = await agent.execute({
  instruction: "play a game of 2048",
  maxSteps: 20,
});

console.log(JSON.stringify(result, null, 2));
```

### Cache Directory Organization

You can organize your caches by using different directory names for different workflows:

```typescript
// Separate caches for different parts of your automation
const loginStagehand = new Stagehand({
  env: "BROWSERBASE",
  cacheDir: "cache/login-flow"
});

const checkoutStagehand = new Stagehand({
  env: "BROWSERBASE",
  cacheDir: "cache/checkout-flow"
});

const dataExtractionStagehand = new Stagehand({
  env: "BROWSERBASE",
  cacheDir: "cache/data-extraction"
});
```

### Best Practices

<AccordionGroup>

<Accordion title="Use descriptive cache directories">
Organize caches by workflow or feature for easier management:

```typescript
// Good: descriptive cache names
cacheDir: "cache/login-actions"
cacheDir: "cache/search-actions"
cacheDir: "cache/form-submissions"

// Avoid: generic cache names
cacheDir: "cache"
cacheDir: "my-cache"
```
</Accordion>

<Accordion title="Clear cache when DOM changes">
If the website structure changes significantly, clear your cache directory to force fresh inference:

```bash
rm -rf cache/login-actions
```

Or programmatically:

```typescript
import { rmSync } from 'fs';

// Clear cache before running if needed
if (shouldClearCache) {
  rmSync('cache/login-actions', { recursive: true, force: true });
}

const stagehand = new Stagehand({
  env: "BROWSERBASE",
  cacheDir: "cache/login-actions"
});
```
</Accordion>

<Accordion title="Commit cache for CI/CD">
Consider committing your cache directory to version control for consistent behavior across environments:

```gitignore
# .gitignore
# Don't ignore cache directories
!cache/
```

This ensures your CI/CD pipelines use the same cached actions without needing to run inference on first execution.
</Accordion>

</AccordionGroup>


================================================
FILE: packages/docs/v3/best-practices/computer-use.mdx
================================================
---
title: Computer Use Agents
description: Incorporate Computer Use APIs from Google, Anthropic, OpenAI, and Microsoft with one line of code in Stagehand.
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


## What is a Computer Use Agent?

<iframe
  width="100%"
  height="400"
  src="https://www.youtube.com/embed/ODaHJzOyVCQ"
  title="YouTube video player"
  frameborder="0"
  allow="accelerometer; autoplay; clipboard-write; encrypted-media; gyroscope; picture-in-picture"
  allowfullscreen
></iframe>
You might've heard of [Gemini Computer Use](https://blog.google/technology/google-deepmind/gemini-computer-use-model/), [Claude Computer Use](https://www.anthropic.com/news/3-5-models-and-computer-use), or [OpenAI's Computer Using Agent](https://openai.com/index/computer-using-agent/).

These are powerful tools that can convert natural language into actions on the computer. On their own, however, you'd need to write your own code to convert these actions into Playwright commands.

Stagehand not only handles the execution of Computer Use outputs, but also lets you hot-swap between Google, OpenAI, Anthropic, and Microsoft models with one line of code. You can find more information on the performance of different computer use models by visiting our [evals page](https://www.stagehand.dev/agent-evals).

## How to use a Computer Use Agent in Stagehand

Stagehand lets you use Computer Use Agents with one line of code:

<Warning>
**Deprecation Notice:** The `cua: true` option is deprecated and will be removed in a future version. Use `mode: "cua"` instead.
</Warning>

<Note>
**IMPORTANT! Configure your browser dimensions**

Computer Use Agents will often return XY-coordinates to click on the screen, so you'll need to configure your browser dimensions.

If not specified, the default browser dimensions are 1288 x 711. You can also configure the browser dimensions in the `browserbaseSessionCreateParams` or `localBrowserLaunchOptions` options.
</Note>


### Configuring browser dimensions

Browser configuration differs by environment:

<Tabs>
<Tab title="BROWSERBASE">
```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "BROWSERBASE",
  model: "google/gemini-2.5-flash",

  browserbaseSessionCreateParams: {
    projectId: process.env.BROWSERBASE_PROJECT_ID!,
    browserSettings: {
      blockAds: true,
      // Fixed viewport so the XY coordinates returned by the agent line up with the page.
      viewport: {
        width: 1288,
        height: 711,
      },
    },
  },
});

await stagehand.init();
```
</Tab>
<Tab title="LOCAL">
```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "LOCAL",
  localBrowserLaunchOptions: {
    headless: false,
    viewport: {
      width: 1288,
      height: 711,
    },
  }
});

await stagehand.init();
```
</Tab>
</Tabs>

### Direct your Computer Use Agent

Call `execute` on the agent to assign a task to the agent.

<CodeGroup>
```typescript Google
await page.goto("https://www.google.com/");
const agent = stagehand.agent({
    mode: "cua",
    model: {
        modelName: "google/gemini-2.5-computer-use-preview-10-2025",
        apiKey: process.env.GOOGLE_GENERATIVE_AI_API_KEY
    },
    systemPrompt: "You are a helpful assistant...",
});

await agent.execute({
    instruction: "Go to Hacker News and find the most controversial post from today, then read the top 3 comments and summarize the debate.",
    maxSteps: 20,
    highlightCursor: true
})
```

```typescript OpenAI
await page.goto("https://www.google.com/");
const agent = stagehand.agent({
    mode: "cua",
    model: {
        modelName: "openai/computer-use-preview",
        apiKey: process.env.OPENAI_API_KEY
    },
    systemPrompt: "You are a helpful assistant...",
});

await agent.execute({
    instruction: "Go to Hacker News and find the most controversial post from today, then read the top 3 comments and summarize the debate.",
    maxSteps: 20,
    highlightCursor: true
})
```
```typescript Anthropic
await page.goto("https://www.google.com/");
const agent = stagehand.agent({
    mode: "cua",
    model: {
        modelName: "anthropic/claude-sonnet-4-20250514",
        apiKey: process.env.ANTHROPIC_API_KEY
    },
    systemPrompt: "You are a helpful assistant...",
});

await agent.execute({
    instruction: "Go to Hacker News and find the most controversial post from today, then read the top 3 comments and summarize the debate.",
    maxSteps: 20,
    highlightCursor: true
})
```
</CodeGroup>

You can define the maximum number of steps the agent can take with `maxSteps`:

```typescript
// `maxSteps` caps how many steps the agent may take for this task.
await agent.execute({
  instruction: "Apply for a library card at the San Francisco Public Library",
  maxSteps: 10,
});
``` 

### Select Your Computer Use Model

Stagehand supports computer use models from Google, Anthropic, OpenAI, and Microsoft. You can find all supported models on the [models page](/v3/configuration/models#agent-models-with-cua-support).

<Tabs>
<Tab title="Google">
```typescript
const agent = stagehand.agent({
    mode: "cua",
    model: "google/gemini-2.5-computer-use-preview-10-2025",
    // GOOGLE_GENERATIVE_AI_API_KEY is auto-loaded - set in your .env
});
```
</Tab>
<Tab title="Anthropic">
```typescript
const agent = stagehand.agent({
    mode: "cua",
    model: "anthropic/claude-sonnet-4-20250514",
    // ANTHROPIC_API_KEY is auto-loaded - set in your .env
});
```
</Tab>
<Tab title="OpenAI">
```typescript
const agent = stagehand.agent({
    mode: "cua",
    model: "openai/computer-use-preview",
    // OPENAI_API_KEY is auto-loaded - set in your .env
});
```
</Tab>
</Tabs>

<Callout icon="code" color="#6ec202" iconType="regular">View or run the example templates [here](https://www.browserbase.com/templates?category=Computer+Use+Agents)</Callout>


================================================
FILE: packages/docs/v3/best-practices/cost-optimization.mdx
================================================
---
title: Cost Optimization  
sidebarTitle: Cost Optimization
description: Minimize costs while maintaining automation performance
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


Cost optimization in Stagehand involves balancing LLM inference costs and browser infrastructure costs. This guide provides practical strategies to reduce your automation expenses.

## Quick Wins

Start with these simple optimizations that can reduce costs:

### 1. Use the Right Model for the Job

We don't recommend using larger, more premium models for simple tasks. See our [evaluation results](https://stagehand.dev/evals) for model performance and cost comparisons across different task types.

<CardGroup cols={2}>
<Card title="Model Selection Guide" icon="brain" href="/configuration/models">
  Choose the right LLM for your budget and accuracy requirements
</Card>
<Card title="Evaluation Results" icon="chart-line" href="https://www.stagehand.dev/evals">
  See how different models perform on different tasks
</Card>
</CardGroup>

### 2. Implement Caching

Enable automatic action caching to eliminate redundant LLM calls. Simply specify a `cacheDir` when initializing Stagehand:

```typescript
const stagehand = new Stagehand({
  env: "BROWSERBASE",
  cacheDir: "action-cache", // Enable automatic caching
});

await stagehand.init();

// First run: uses LLM inference and caches
// Subsequent runs: reuses cached action (no LLM cost)
await stagehand.act("Click the sign in button");
```

<CardGroup cols={1}>
<Card title="Caching Guide" icon="database" href="/best-practices/caching">
  Learn how to organize caches and manage cache directories
</Card>
</CardGroup>

### 3. Optimize Browser Sessions

Reuse sessions when possible and set appropriate timeouts. See [Browser Configuration](/configuration/browser) for details:

```typescript
const stagehand = new Stagehand({
  env: "BROWSERBASE",
  browserbaseSessionCreateParams: {
    timeout: 1800, // 30 minutes instead of default 1 hour
    keepAlive: true, // Keep session alive between tasks
  }
});
```

<CardGroup cols={1}>
<Card title="Browserbase Cost Optimization" icon="window-maximize" href="https://docs.browserbase.com/guides/cost-optimization">
  Optimize Browserbase infrastructure costs and session management
</Card>
</CardGroup>

## Advanced Strategies

### Intelligent Model Switching

Try cheaper models first and fall back to more expensive ones only when the cheaper model fails:

```typescript
// Use models from least to most expensive based on task complexity
// See stagehand.dev/evals for performance comparisons
/**
 * Attempts `prompt` with each model in order (cheapest first) and stops at the
 * first model that completes the action.
 *
 * A fresh Stagehand instance is created per attempt and is always closed,
 * whether the attempt succeeds or fails.
 *
 * @param prompt Natural-language instruction passed to `observe()`.
 */
async function smartAct(prompt: string) {
  const models = ["google/gemini-2.5-flash", "openai/gpt-4o"];

  for (const [index, model] of models.entries()) {
    // Created outside `try` so it is still in scope for `finally`.
    const stagehand = new Stagehand({
      env: "LOCAL",
      model: model
    });

    try {
      await stagehand.init();
      const [action] = await stagehand.observe(prompt);
      await stagehand.act(action);
      return;
    } catch (error) {
      // Report the model we are moving to, not the one that just failed.
      const nextModel = models[index + 1];
      if (nextModel !== undefined) {
        console.log(`${model} failed, falling back to ${nextModel}...`);
      } else {
        console.log(`${model} failed and no fallback models remain.`);
      }
    } finally {
      // Release the browser on both the success and failure paths.
      await stagehand.close();
    }
  }
}
```

### Session Pooling

Reuse browser sessions across multiple tasks:

```typescript
/**
 * Hands out one initialized Stagehand instance per task type, creating it on
 * first request and returning the same instance afterwards.
 */
class SessionManager {
  private sessions = new Map<string, Stagehand>();

  /**
   * Returns the session registered for `taskType`, creating and initializing
   * one if none exists yet.
   */
  async getSession(taskType: string): Promise<Stagehand> {
    if (!this.sessions.has(taskType)) {
      const created = new Stagehand({ env: "BROWSERBASE" });
      await created.init();
      this.sessions.set(taskType, created);
      return created;
    }

    return this.sessions.get(taskType)!;
  }
}
```

## Cost Monitoring

Track your spending to identify optimization opportunities. See our [Observability Guide](/configuration/observability) for detailed metrics:

```typescript
// Monitor token usage
const metrics = await stagehand.metrics;
console.log(`Total tokens: ${metrics.totalPromptTokens + metrics.totalCompletionTokens}`);
console.log(`Estimated cost: $${(metrics.totalPromptTokens + metrics.totalCompletionTokens) * 0.00001}`);
```

<CardGroup cols={1}>
<Card title="Observability & Metrics" icon="chart-line" href="/configuration/observability">
  Monitor usage patterns and track costs in real-time
</Card>
</CardGroup>

## Budget Controls

Set spending limits to prevent unexpected costs:

```typescript
/**
 * Accumulates estimated spend and rejects any charge that would push the
 * running total past a fixed ceiling. The running total is never reset by
 * this class.
 */
class BudgetGuard {
  private dailySpend = 0;

  /** @param maxDailyBudget Spending ceiling; defaults to 25. */
  constructor(private maxDailyBudget: number = 25) {}

  /**
   * Records `estimatedCost` against the running total.
   *
   * @throws Error when adding the cost would exceed the ceiling; the running
   *         total is left unchanged in that case.
   */
  checkBudget(estimatedCost: number): void {
    const projectedSpend = this.dailySpend + estimatedCost;
    const overBudget = projectedSpend > this.maxDailyBudget;

    if (overBudget) {
      throw new Error(`Daily budget exceeded: $${this.maxDailyBudget}`);
    }

    this.dailySpend = projectedSpend;
  }
}
```


## Related Resources

<CardGroup cols={2}>
<Card title="Model Selection Guide" icon="brain" href="/configuration/models">
  Choose the right LLM for your budget and accuracy requirements
</Card>

<Card title="Caching Strategies" icon="database" href="/best-practices/caching">
  Reduce costs with smart action caching and observe patterns
</Card>

<Card title="Observability & Metrics" icon="chart-line" href="/configuration/observability">
  Monitor usage patterns and track costs in real-time
</Card>

<Card title="Browser Configuration" icon="window-maximize" href="/configuration/browser">
  Optimize Browserbase infrastructure costs and session management
</Card>
</CardGroup>

================================================
FILE: packages/docs/v3/best-practices/deployments.mdx
================================================
---
title: 'Deploying Stagehand'
description: 'Deploy your AI agents and automations to the cloud'
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


<Tip>
**🌟 Preview: Browser Functions** - Deploy your web automation code directly on Browserbase with browser functions. Scale your `act()` automations in the cloud with zero infrastructure setup. Reach out to hello@browserbase.com to get beta access.
</Tip>

## Deploy on Vercel

Securely run Stagehand on Browserbase inside a Vercel Function. This guide shows a minimal, production-safe HTTP endpoint you can call directly or on a schedule.

### 1. Install Vercel CLI

To download and install Vercel CLI, run one of the following commands:

<CodeGroup>
```bash pnpm
pnpm i -g vercel
```
```bash yarn
yarn global add vercel
```
```bash npm
npm i -g vercel
```
```bash bun
bun add -g vercel
```
</CodeGroup>

### 2. Project layout

```text
your-project/
  api/
    run.ts
  package.json
  tsconfig.json
  vercel.json
```

Create the structure with:

```bash
mkdir -p api
touch api/run.ts package.json vercel.json tsconfig.json
```

### 3. `api/run.ts` (Node.js runtime)

```typescript
// api/run.ts
import type { VercelRequest, VercelResponse } from "@vercel/node";
import { Stagehand } from "@browserbasehq/stagehand";
import { z } from "zod";

/**
 * Vercel Function entry point: opens a Browserbase session, runs a short
 * Stagehand flow against stagehand.dev, and returns the extracted value.
 *
 * Responds with 200 `{ ok: true, data }` on success and 500
 * `{ ok: false, error }` on failure. The Stagehand session is closed on both
 * paths before the response is sent, so a failed run does not leave a browser
 * session open.
 */
export default async function handler(req: VercelRequest, res: VercelResponse): Promise<void> {
  let stagehand: Stagehand | undefined;
  let data: unknown;
  let failure: string | undefined;

  try {
    stagehand = new Stagehand({
      env: "BROWSERBASE",
      apiKey: process.env.BROWSERBASE_API_KEY!,
      projectId: process.env.BROWSERBASE_PROJECT_ID!,
      disablePino: true,
      model: {
        modelName: "google/gemini-2.5-flash",
        apiKey: process.env.GOOGLE_API_KEY!,
      },
      // optional session params
      browserbaseSessionCreateParams: {
        projectId: process.env.BROWSERBASE_PROJECT_ID!,
        region: "us-west-2",
        browserSettings: {
          blockAds: true,
        },
      },
    });

    await stagehand.init();
    const page = stagehand.context.pages()[0];

    await page.goto("https://www.stagehand.dev/");
    await stagehand.act("click the evals button");

    data = await stagehand.extract("extract the fastest model", z.string());
  } catch (err: unknown) {
    failure = err instanceof Error ? err.message : String(err);
  } finally {
    // Close on every path; a failure to close must not mask the real outcome.
    try {
      await stagehand?.close();
    } catch (closeErr: unknown) {
      console.error("Failed to close Stagehand session:", closeErr);
    }
  }

  if (failure !== undefined) {
    res.status(500).json({ ok: false, error: failure });
    return;
  }

  res.status(200).json({ ok: true, data });
}
```

### 4. `package.json`

```json
{
    "name": "bb-stagehand-on-vercel",
    "private": true,
    "type": "module",
    "engines": { "node": ">=18" },
    "dependencies": {
      "@browserbasehq/stagehand": "^3.0.0"
    },
    "devDependencies": {
      "@types/node": "^20.12.12",
      "@vercel/node": "^3.2.20",
      "typescript": "^5.2.2"
    }
}
```

### 5. `tsconfig.json`

```json
{
  "compilerOptions": {
    "target": "ES2022",
    "module": "ES2022",
    "moduleResolution": "node",
    "outDir": ".vercel/output/functions",
    "strict": true,
    "esModuleInterop": true,
    "skipLibCheck": true,
    "types": ["node"]
  },
  "include": ["api/**/*.ts"]
}
```

### 6. `vercel.json`

```json
{
  "$schema": "https://openapi.vercel.sh/vercel.json",
  "functions": {
    "api/run.ts": {
      "maxDuration": 60
    }
  }
}
```

See Vercel's [configuring functions](https://vercel.com/docs/functions/configuring-functions) docs for more details.

### 7. Link your project

Link your local folder to a Vercel project before configuring environment variables:

```bash
# authenticate if needed
vercel login

# link the current directory to a Vercel project (interactive)
vercel link
```

### 8. Environment variables

Do not commit your `.env` file. For deployed environments, add variables via the Vercel CLI:

```bash
vercel env add BROWSERBASE_API_KEY
vercel env add BROWSERBASE_PROJECT_ID
# (and your model key if needed)
vercel env add GOOGLE_API_KEY
```

See also: [Browser Environment](/configuration/environment) for details on required variables.

### 9. Test locally

Replicate the Vercel environment locally to exercise your Function before deploying. Run from the project root.

```bash
# ensure dependencies are installed
npm install

# start the local Vercel dev server
vercel dev --listen 5005
```

### 10. Deploy

```bash
vercel
vercel --prod
```

### Execute the function

#### Configure Protection Bypass for Automation

Before invoking the production URL, create a Protection Bypass for Automation:

1. Generate a 32-character secret (you can use `openssl rand -hex 16`)
2. Go to your project in Vercel
3. Navigate to Settings → Deployment Protection
4. Add the secret to "Protection Bypass for Automation"

Then invoke the function with the bypass header:

```bash
curl -X POST \
  -H "x-vercel-protection-bypass: <your-32-character-secret>" \
  https://<your-deployment>/api/run
```

### Optional: Cron on Vercel

Hit the same endpoint on a schedule by extending `vercel.json`:

```json
{
  "$schema": "https://openapi.vercel.sh/vercel.json",
  "functions": {
    "api/run.ts": {
      "maxDuration": 60
    }
  },
  "crons": [
    { "path": "/api/run", "schedule": "0 * * * *" }
  ]
}
```

### Features
- **No local browsers needed** with `env: "BROWSERBASE"`. [Browserbase](https://www.browserbase.com/) provides the browsers.
- **Fast functionality**: Offload browser work to Browserbase and return JSON promptly.
- **Long-running tasks**: Raise `maxDuration` and/or consider Edge runtime limits depending on plan.


================================================
FILE: packages/docs/v3/best-practices/deterministic-agent.mdx
================================================
---
title: Deterministic Agent Scripts
sidebarTitle: Deterministic Agent
description: Use auto-caching to convert agent workflows into fast, deterministic scripts
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


Agent workflows are powerful for exploring and automating complex tasks, but they can be slow and non-deterministic. This guide shows you how to use Stagehand's built-in auto-caching to convert agent-discovered workflows into fast, deterministic scripts that run 10-100x faster.

## Why Use Auto-Caching with Agent?

<CardGroup cols={2}>
  <Card title="Speed" icon="bolt">
    Cached agent workflows run 10-100x faster by skipping LLM inference on subsequent runs
  </Card>
  <Card title="Cost" icon="dollar-sign">
    Eliminate repeated LLM calls—first run uses inference, subsequent runs use cache
  </Card>
  <Card title="Reliability" icon="shield-check">
    Cached actions are deterministic and more predictable than fresh agent exploration
  </Card>
  <Card title="Simplicity" icon="wand-magic-sparkles">
    Works automatically—just specify `cacheDir` and Stagehand handles everything
  </Card>
</CardGroup>

## How Auto-Caching Works

When you specify a `cacheDir`:

1. **First run**: Agent explores and executes workflow using LLM inference
2. **Actions cached**: All actions are automatically saved to local cache
3. **Subsequent runs**: Same workflow reuses cached actions (no LLM calls)
4. **Performance**: 10-100x faster execution, zero LLM tokens

The cache key is automatically generated based on:
- Agent instruction
- Start URL
- Agent execution options
- Agent configuration

## Basic Auto-Caching with Agent

Simply add `cacheDir` when initializing Stagehand:

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

// Enable auto-caching
const stagehand = new Stagehand({
  env: "BROWSERBASE",
  cacheDir: "agent-cache" // Automatic caching enabled
});

await stagehand.init();
const page = stagehand.context.pages()[0];

await page.goto("https://example.com");

const agent = stagehand.agent({
  mode: "cua",
  model: {
    modelName: "google/gemini-2.5-computer-use-preview-10-2025",
    apiKey: process.env.GOOGLE_GENERATIVE_AI_API_KEY
  },
  systemPrompt: "You are a helpful assistant that can use a web browser.",
});

// First run: Uses LLM inference (~20-30 seconds, ~50,000 tokens)
// Subsequent runs: Uses cached actions (~2-3 seconds, 0 tokens)
const result = await agent.execute({
  instruction: "Find the login form, fill in username 'demo' and password 'test123', then click submit",
  maxSteps: 10
});

console.log("Completed:", result.success);
console.log("Actions taken:", result.actions.length);

await stagehand.close();
```

That's it! The second time you run this script, it will reuse the cached agent actions automatically.

## Organizing Caches by Workflow

Use descriptive cache directories for different workflows:

```typescript
// Login workflow
const loginStagehand = new Stagehand({
  env: "BROWSERBASE",
  cacheDir: "cache/login-workflow"
});

// Checkout workflow
const checkoutStagehand = new Stagehand({
  env: "BROWSERBASE",
  cacheDir: "cache/checkout-workflow"
});

// Data extraction workflow
const extractStagehand = new Stagehand({
  env: "BROWSERBASE",
  cacheDir: "cache/extraction-workflow"
});
```

## Complete Example: First vs Subsequent Runs

### First Run (Exploration Mode)

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "BROWSERBASE",
  cacheDir: "cache/github-search" // Enable caching
});

await stagehand.init();
const page = stagehand.context.pages()[0];

await page.goto("https://github.com");

const agent = stagehand.agent({
  mode: "cua",
  model: {
    modelName: "google/gemini-2.5-computer-use-preview-10-2025",
    apiKey: process.env.GOOGLE_GENERATIVE_AI_API_KEY
  },
  systemPrompt: "You are a helpful assistant that can use a web browser.",
});

console.log("First run: Exploring with agent...");
const startTime = Date.now();

const result = await agent.execute({
  instruction: "Search for 'stagehand' and click the first repository result",
  maxSteps: 10
});

const duration = Date.now() - startTime;
console.log(`First run completed in ${duration}ms`);
console.log(`Actions: ${result.actions.length}`);
console.log(`Status: ${result.success}`);

await stagehand.close();

// Output (example):
// First run completed in 25000ms
// Actions: 8
// Status: true
```

### Subsequent Runs (Cached Mode)

Run the **exact same script** again:

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "BROWSERBASE",
  cacheDir: "cache/github-search" // Same cache directory
});

await stagehand.init();
const page = stagehand.context.pages()[0];

await page.goto("https://github.com");

const agent = stagehand.agent({
  mode: "cua",
  model: {
    modelName: "google/gemini-2.5-computer-use-preview-10-2025",
    apiKey: process.env.GOOGLE_GENERATIVE_AI_API_KEY
  },
  systemPrompt: "You are a helpful assistant that can use a web browser.",
});

console.log("Subsequent run: Using cached actions...");
const startTime = Date.now();

const result = await agent.execute({
  instruction: "Search for 'stagehand' and click the first repository result",
  maxSteps: 10
});

const duration = Date.now() - startTime;
console.log(`Subsequent run completed in ${duration}ms`);
console.log(`Actions: ${result.actions.length}`);
console.log(`Status: ${result.success}`);

await stagehand.close();

// Output (example):
// Subsequent run completed in 2500ms  ← 10x faster!
// Actions: 8
// Status: true
```

## Using History for Analysis

While caching handles execution automatically, you can still use `stagehand.history` to analyze what happened:

```typescript
import { Stagehand } from "@browserbasehq/stagehand";
import fs from "fs/promises";

const stagehand = new Stagehand({
  env: "BROWSERBASE",
  cacheDir: "cache/workflow"
});

await stagehand.init();
const page = stagehand.context.pages()[0];

await page.goto("https://example.com");

const agent = stagehand.agent({
  mode: "cua",
  model: {
    modelName: "google/gemini-2.5-computer-use-preview-10-2025",
    apiKey: process.env.GOOGLE_GENERATIVE_AI_API_KEY
  },
  systemPrompt: "You are a helpful assistant that can use a web browser.",
});

await agent.execute({
  instruction: "Complete the login process",
  maxSteps: 10
});

// Analyze what the agent did
const history = await stagehand.history;

console.log(`\nWorkflow Analysis:`);
console.log(`Total operations: ${history.length}`);

const agentOps = history.filter(e => e.method === 'agent');
const actOps = history.filter(e => e.method === 'act');
const navOps = history.filter(e => e.method === 'navigate');

console.log(`- Agent executions: ${agentOps.length}`);
console.log(`- Act operations: ${actOps.length}`);
console.log(`- Navigate operations: ${navOps.length}`);

// Save for documentation
await fs.writeFile(
  'workflow-analysis.json',
  JSON.stringify(history, null, 2)
);

await stagehand.close();
```

## Cache Management

### Clear Cache When Site Changes

If the website structure changes, clear the cache to force fresh exploration:

```typescript
import { rmSync } from 'fs';

// Clear specific workflow cache
rmSync('cache/login-workflow', { recursive: true, force: true });

// Then run with fresh exploration
const stagehand = new Stagehand({
  env: "BROWSERBASE",
  cacheDir: "cache/login-workflow" // Will rebuild cache
});
```

### Programmatic Cache Control

```typescript
import { rmSync, existsSync, statSync } from 'fs';

/**
 * Deletes `cacheDir` when the directory's modification time is older than
 * `maxAge`. Does nothing if the directory does not exist.
 *
 * @param cacheDir Path of the cache directory to check.
 * @param maxAge   Maximum allowed age in milliseconds; defaults to 7 days.
 */
function clearCacheIfNeeded(cacheDir: string, maxAge: number = 7 * 24 * 60 * 60 * 1000) {
  if (!existsSync(cacheDir)) {
    return; // No cache to clear
  }

  // NOTE(review): age is taken from the directory's own mtime, which may not
  // change when files inside it are rewritten — confirm this matches how the
  // cache is written.
  const stats = statSync(cacheDir);
  const age = Date.now() - stats.mtimeMs;

  if (age > maxAge) {
    console.log(`Cache older than ${maxAge}ms, clearing...`);
    rmSync(cacheDir, { recursive: true, force: true });
  }
}

// Clear cache if older than 7 days
clearCacheIfNeeded('cache/workflow');

const stagehand = new Stagehand({
  env: "BROWSERBASE",
  cacheDir: "cache/workflow"
});
```

## Advanced Patterns
 
### Fallback to Fresh Exploration

Combine caching with fallback for resilience:

```typescript
import { rmSync } from 'fs';

/**
 * Runs the checkout workflow with caching enabled and, if that attempt
 * throws, clears the cache directory and retries once.
 *
 * The Stagehand session is closed in `finally`, so it is released even when
 * the retry also throws.
 */
async function executeWithFallback() {
  const stagehand = new Stagehand({
    env: "BROWSERBASE",
    cacheDir: "cache/workflow",
    selfHeal: true // Enable self-healing
  });

  try {
    await stagehand.init();
    const page = stagehand.context.pages()[0];

    await page.goto("https://example.com");

    const agent = stagehand.agent({
      model: "anthropic/claude-sonnet-4-20250514"
    });

    try {
      // Try with cache
      const result = await agent.execute({
        instruction: "Complete the checkout process",
        maxSteps: 15
      });

      console.log("Execution successful:", result.success);
    } catch (error) {
      console.error("Cached workflow failed:", error);

      // Clear cache and retry with fresh exploration
      rmSync('cache/workflow', { recursive: true, force: true });

      console.log("Retrying with fresh exploration...");
      const retryResult = await agent.execute({
        instruction: "Complete the checkout process",
        maxSteps: 15
      });

      console.log("Retry successful:", retryResult.success);
    }
  } finally {
    // Runs on success, on a failed retry, and on init/navigation errors.
    await stagehand.close();
  }
}
```

### Version Control for Caches

Commit cache directories to ensure consistent behavior across environments:

```gitignore
# .gitignore

# Commit cache directories for deterministic CI/CD
!cache/
!cache/**/*.json
```

```typescript
// CI/CD pipeline will use pre-generated cache
const stagehand = new Stagehand({
  env: "BROWSERBASE",
  cacheDir: "cache/production-workflow" // Committed to repo
});
```

## Best Practices

<AccordionGroup>

<Accordion title="Use Descriptive Cache Names">
Organize caches by workflow or feature:

```typescript
// Good: descriptive cache names
cacheDir: "cache/user-registration"
cacheDir: "cache/product-search"
cacheDir: "cache/checkout-flow"

// Avoid: generic names
cacheDir: "cache"
cacheDir: "my-cache"
```
</Accordion>

<Accordion title="Cache Invalidation Strategy">
Implement a strategy for refreshing caches:

```typescript
// Option 1: Time-based invalidation
if (isCacheOlderThan('cache/workflow', 7)) {
  clearCache('cache/workflow');
}

// Option 2: Version-based invalidation
const CACHE_VERSION = 'v2';
const cacheDir = `cache/workflow-${CACHE_VERSION}`;

// Option 3: Manual invalidation flag
if (process.env.CLEAR_CACHE === 'true') {
  clearCache('cache/workflow');
}
```
</Accordion>

<Accordion title="Test in Staging First">
Always test cached workflows in staging before production:

```typescript
const env = process.env.NODE_ENV === 'production' ? 'production' : 'staging';

const stagehand = new Stagehand({
  env: "BROWSERBASE",
  cacheDir: `cache/${env}-workflow`
});
```
</Accordion>

<Accordion title="Monitor Cache Hit Rates">
Track cache usage for optimization:

```typescript
const cacheHit = existsSync('cache/workflow') &&
                statSync('cache/workflow').mtimeMs < Date.now();

if (cacheHit) {
  console.log("Cache hit - using cached workflow");
} else {
  console.log("Cache miss - exploring with agent");
}

// Log metrics
metrics.recordCacheHit(cacheHit);
```
</Accordion>

</AccordionGroup>

## Performance Comparison

**Without Caching (Every Run):**
```typescript
const stagehand = new Stagehand({ env: "BROWSERBASE" });
// No cacheDir specified

const result = await agent.execute({
  instruction: "Complete workflow",
  maxSteps: 10
});

// Every run: ~20-30 seconds, ~50,000 tokens
```

**With Auto-Caching (First Run):**
```typescript
const stagehand = new Stagehand({
  env: "BROWSERBASE",
  cacheDir: "cache/workflow"
});

const result = await agent.execute({
  instruction: "Complete workflow",
  maxSteps: 10
});

// First run: ~20-30 seconds, ~50,000 tokens (cached for next time)
```

**With Auto-Caching (Subsequent Runs):**
```typescript
const stagehand = new Stagehand({
  env: "BROWSERBASE",
  cacheDir: "cache/workflow" // Reuses cache
});

const result = await agent.execute({
  instruction: "Complete workflow",
  maxSteps: 10
});

// Subsequent runs: ~2-3 seconds, 0 tokens ← 10-100x faster!
```

<Note>
Cached agent workflows run **10-100x faster** and consume **zero LLM tokens** on subsequent runs. The first run pays the exploration cost, every run after is nearly instant.
</Note>

## Troubleshooting

<AccordionGroup>
<Accordion title="Cache not being used">
**Problem**: Workflow still slow on subsequent runs

**Solutions**:
- Verify `cacheDir` path is correct and consistent across runs
- Ensure instruction, URL, and agent config are identical
- Check file permissions on cache directory
- Look for cache hit/miss logs in verbose mode

```typescript
const stagehand = new Stagehand({
  env: "BROWSERBASE",
  cacheDir: "cache/workflow",
  verbose: 2 // Enable debug logs
});
```
</Accordion>

<Accordion title="Cached workflow fails">
**Problem**: Cached actions fail on subsequent runs

**Solutions**:
- Website may have changed—clear cache to re-explore
- Enable self-healing to adapt to minor changes
- Implement fallback logic to retry with fresh exploration

```typescript
const stagehand = new Stagehand({
  env: "BROWSERBASE",
  cacheDir: "cache/workflow",
  selfHeal: true // Adapt to changes
});
```
</Accordion>

<Accordion title="Too many cache directories">
**Problem**: Cache directories grow uncontrollably

**Solutions**:
- Use version prefixes for cache directories
- Implement automatic cleanup of old caches
- Share cache directories for similar workflows

```typescript
// Versioned caches
const CACHE_VERSION = '2024-01';
const cacheDir = `cache/workflow-${CACHE_VERSION}`;

// Cleanup old versions
rmSync('cache/workflow-2023-12', { recursive: true, force: true });
```
</Accordion>
</AccordionGroup>

## Next Steps

<CardGroup cols={2}>
  <Card title="Agent Guide" icon="robot" href="/v3/basics/agent">
    Learn more about agent capabilities and configuration
  </Card>

  <Card title="Caching Guide" icon="database" href="/v3/best-practices/caching">
    Complete guide to auto-caching with act() and agent()
  </Card>

  <Card title="Observability" icon="chart-line" href="/v3/configuration/observability">
    Monitor and track history and metrics
  </Card>

  <Card title="Speed Optimization" icon="bolt" href="/v3/best-practices/speed-optimization">
    Additional techniques for faster automation
  </Card>
</CardGroup>


================================================
FILE: packages/docs/v3/best-practices/history.mdx
================================================
---
title: History Tracking
sidebarTitle: History Tracking
description: Track and analyze Stagehand operations with the history API
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


The history API captures every Stagehand operation for debugging, auditing, and workflow analysis.

## Basic Usage

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({ env: "BROWSERBASE" });
await stagehand.init();
const page = stagehand.context.pages()[0];

await page.goto("https://example.com");
await stagehand.act("click login button");

// Get complete history
const history = await stagehand.history;

console.log(`Total operations: ${history.length}`);
history.forEach((entry, i) => {
  console.log(`${i + 1}. ${entry.method} at ${entry.timestamp}`);
});

await stagehand.close();
```

## History Entry Structure

```typescript
interface HistoryEntry {
  method: "act" | "extract" | "observe" | "navigate" | "agent";
  parameters: unknown;  // Input parameters
  result: unknown;      // Output/result
  timestamp: string;    // ISO 8601 timestamp
}
```

## Common Use Cases

### Debugging Failures

```typescript
try {
  await stagehand.act("click login button");
} catch (error) {
  const history = await stagehand.history;

  history.forEach((entry, i) => {
    const status = entry.result && 'error' in entry.result ? "FAILED" : "SUCCESS";
    console.log(`${i + 1}. ${status} - ${entry.method}`);
  });
}
```

### Analyzing Timing

```typescript
const history = await stagehand.history;

const timings = history.map((entry, i) => {
  if (i === 0) return null;
  const duration = new Date(entry.timestamp).getTime() -
                   new Date(history[i - 1].timestamp).getTime();
  return { operation: entry.method, duration };
}).filter(Boolean);

console.log("Slowest operations:",
  timings.sort((a, b) => b.duration - a.duration).slice(0, 3)
);
```

### Operation Statistics

```typescript
const history = await stagehand.history;

const stats = history.reduce((acc, entry) => {
  acc[entry.method] = (acc[entry.method] || 0) + 1;
  return acc;
}, {} as Record<string, number>);

console.log("Operations:", stats);
// { act: 5, extract: 2, observe: 3, navigate: 1 }
```

### Saving History

```typescript
import fs from "fs/promises";

const history = await stagehand.history;
const metrics = await stagehand.metrics;

await fs.writeFile(
  `workflow-report.json`,
  JSON.stringify({
    history,
    totalOps: history.length,
    totalTokens: metrics.totalPromptTokens + metrics.totalCompletionTokens
  }, null, 2)
);
```

## Filtering by Operation Type

```typescript
const history = await stagehand.history;

const actions = history.filter(e => e.method === 'act');
const extractions = history.filter(e => e.method === 'extract');
const agentOps = history.filter(e => e.method === 'agent');

console.log(`Actions: ${actions.length}`);
console.log(`Extractions: ${extractions.length}`);
console.log(`Agent executions: ${agentOps.length}`);
```

## Combining with Metrics

```typescript
const history = await stagehand.history;
const metrics = await stagehand.metrics;

const report = {
  totalOps: history.length,
  successful: history.filter(e => !e.result || !('error' in e.result)).length,
  failed: history.filter(e => e.result && 'error' in e.result).length,
  totalTokens: metrics.totalPromptTokens + metrics.totalCompletionTokens,
  avgTimePerOp: `${(metrics.totalInferenceTimeMs / history.length).toFixed(0)}ms`
};

console.log(report);
```

<Card title="Observability Guide" icon="chart-line" href="/v3/configuration/observability">
  Learn more about metrics, logging, and monitoring
</Card>

## What's Tracked?

Only Stagehand methods are tracked in history:

```typescript
// Tracked
await stagehand.act("click button");              // ✓
await stagehand.extract({ instruction: "..." }); // ✓
await stagehand.observe("find elements");         // ✓
await page.goto("https://example.com");      // ✓

// Not tracked
await page.locator("button").click();        // ✗ Native Playwright
await page.click("button");                  // ✗ Native Playwright
```

## Best Practices

- **Save history for critical workflows** - Maintain audit trails for production
- **Inspect history when debugging** - Check the last operations to identify failures
- **Analyze timing periodically** - Find slow operations and optimize
- **Combine with metrics** - Get complete visibility into performance and cost

## Next Steps

<CardGroup cols={2}>
  <Card title="Deterministic Agent" icon="robot" href="/best-practices/deterministic-agent">
    Build fast, cached agent workflows
  </Card>

  <Card title="Observability" icon="chart-line" href="/v3/configuration/observability">
    Combine history with metrics
  </Card>

  <Card title="Caching" icon="database" href="/v3/best-practices/caching">
    Speed up workflows with caching
  </Card>

  <Card title="Logging" icon="file-lines" href="/configuration/logging">
    Configure detailed execution traces
  </Card>
</CardGroup>


================================================
FILE: packages/docs/v3/best-practices/mcp-integrations.mdx
================================================
---
title: "MCP Integrations"
description: "Using Model Context Protocol (MCP) integrations to enhance agent capabilities"
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


## What are MCP Integrations?

MCP (Model Context Protocol) integrations allow you to connect your Stagehand agents to external tools, APIs, and services. This enables agents to perform actions beyond browser automation, such as web search, database operations, and API calls.

<Info>
MCP integrations make your agents more powerful by combining browser automation with external capabilities. The agent can intelligently decide when to use browser actions versus external tools.
</Info>

## Connection Options

There are two options for connecting to MCP servers:

1. **Pass a URL directly** - The simplest approach for quick setup
2. **Create a connection first** - Gives you more control over the connection

<Note>
MCP client support is currently only available in TypeScript.
</Note>

## Passing a URL

The simplest way to add MCP integrations is by providing server URLs directly in the agent configuration:

```typescript
const agent = stagehand.agent({
  provider: "openai",
  model: "computer-use-preview",
  integrations: [
    `https://mcp.exa.ai/mcp?exaApiKey=${process.env.EXA_API_KEY}`,
  ],
  systemPrompt: `You have access to web search through Exa. Use it to find current information before browsing.`,
  options: {
    apiKey: process.env.OPENAI_API_KEY,
  },
});

await agent.execute("Search for the best headphones of 2025 and go through checkout for the top recommendation");
```

## Creating a Connection First

Alternatively, you can establish MCP connections first and then pass the client objects:

```typescript
import { connectToMCPServer } from "@browserbasehq/stagehand";

// Connect to MCP server
const supabaseClient = await connectToMCPServer(
  `https://server.smithery.ai/@supabase-community/supabase-mcp/mcp?api_key=${process.env.SMITHERY_API_KEY}`
);

// You can also pass the config to start a local MCP server
const notionClient = await connectToMCPServer({
  command: "npx",
  args: ["-y", "@notionhq/notion-mcp-server"],
  env: {
    NOTION_TOKEN: process.env.NOTION_TOKEN,
  },
});

// Use the connected clients (example with Supabase + Notion)
const agent = stagehand.agent({
  provider: "openai", 
  model: "computer-use-preview",
  integrations: [supabaseClient, notionClient],
  systemPrompt: `You can interact with Supabase databases and Notion. Use these tools to store and retrieve data.`,
  options: {
    apiKey: process.env.OPENAI_API_KEY,
  },
});

await agent.execute("Search for restaurants in New Brunswick, NJ and save the first result to the database");
```

## Authenticated MCP Servers

Some MCP servers require authentication via HTTP request headers. You can pass request headers through `requestOptions`:

```typescript
const authenticatedClient = await connectToMCPServer({
  serverUrl: "https://mcp-server.example.com/mcp",
  requestOptions: {
    requestInit: {
      headers: {
        Authorization: `Bearer ${process.env.MCP_SERVER_API_KEY}`,
      },
    },
  },
});
```


## Multiple Integrations

You can combine multiple MCP integrations in a single agent:

```typescript
const databaseClient = await connectToMCPServer(/* database config */);

const agent = stagehand.agent({
  integrations: [
    `https://search-service.example.com/mcp?apiKey=${process.env.SEARCH_API_KEY}`,
    databaseClient
  ],
  systemPrompt: `You have access to external tools for search and data storage. Use these tools strategically to complete tasks efficiently.`
});
```

## Best Practices

### Choose the Right Connection Approach
<Tabs>
<Tab title="Passing a URL">
**When to use:**
- Simple setup requirements
- Standard API configurations
- Getting started quickly

**Benefits:**
- Minimal code required
- Automatic connection handling
- Easy to configure
</Tab>

<Tab title="Creating a Connection First">
**When to use:**
- Custom connection options
- Connection reuse across agents
- Advanced error handling

**Benefits:**
- Full control over connections
- Better error handling
- Connection pooling capabilities
</Tab>
</Tabs>

### Environment Variables

Always use environment variables for API keys and sensitive information:

```bash
# .env file
SEARCH_API_KEY=your_search_service_key
MCP_SERVICE_API_KEY=your_mcp_service_key
OPENAI_API_KEY=your_openai_key
DATABASE_URL=your_database_url
DATABASE_API_KEY=your_database_key
```

### Instructions Best Practices

Provide clear instructions about available tools:

<Tabs>
<Tab title="Good Instructions">
```typescript
systemPrompt: `You have access to:
1. Web search tools - Use to find current information
2. Database tools - Use to store/retrieve data
3. Browser automation - Use for web interactions

Always search for current information before making decisions.
Store important data for later reference.`
```
</Tab>

<Tab title="Poor Instructions">
```typescript
systemPrompt: "You can search and save data."
```
</Tab>
</Tabs>

### Error Handling

Implement proper error handling for MCP connections:

```typescript
try {
  const client = await connectToMCPServer(serverUrl);
  
  const agent = stagehand.agent({
    integrations: [client],
    // ... other config
  });
  
  const result = await agent.execute(instruction);
} catch (error) {
  console.error("MCP integration failed:", error);
  // Handle fallback behavior
}
```

## Troubleshooting

<AccordionGroup>
<Accordion title="Connection timeouts">
**Problem:** MCP server connections timing out

**Solutions:**
- Verify server URLs are correct and accessible
- Check network connectivity
- Ensure API keys are valid and have proper permissions
- Try connecting to servers individually to isolate issues
</Accordion>

<Accordion title="Tool not being used">
**Problem:** Agent not using available MCP tools

**Solutions:**
- Make instructions more specific about when to use tools
- Ensure API keys are properly configured
- Check that the MCP server supports the expected tools
- Verify tool descriptions are clear and actionable
</Accordion>

<Accordion title="Authentication errors">
**Problem:** API key or authentication failures

**Solutions:**
- Verify all required environment variables are set
- Check API key validity and permissions  
- Ensure URLs include necessary authentication parameters
- Test MCP connections independently before using in agents
</Accordion>
</AccordionGroup>

## Examples

### Web Search + Browser Automation
```typescript
const agent = stagehand.agent({
  integrations: [`https://mcp.exa.ai/mcp?exaApiKey=${process.env.EXA_API_KEY}`],
  systemPrompt: `First search for current information, then use the browser to complete tasks based on what you find.`
});

await agent.execute("Find the best laptop deals for 2025 and navigate to purchase the top recommendation");
```

### Data Extraction + Storage
```typescript
const supabaseClient = await connectToMCPServer(/* config */);

const agent = stagehand.agent({
  integrations: [supabaseClient],
  systemPrompt: `Extract data from websites and store it using available database tools.`
});

await agent.execute("Extract all restaurant information from this directory and save it to the database");
```

### Multi-tool Workflow
```typescript
const agent = stagehand.agent({
  integrations: [
    `https://mcp.exa.ai/mcp?exaApiKey=${process.env.EXA_API_KEY}`,
    supabaseClient
  ],
  systemPrompt: `Use all available tools strategically: search for current info, browse websites, and store important data.`
});

await agent.execute("Research competitor pricing, compare with our site, and store the analysis");
```

## Further Reading

<CardGroup cols={3}>
<Card title="Agent Basics" icon="robot" href="/v3/basics/agent">
  Learn the fundamentals of Stagehand agents
</Card>

<Card title="MCP Server Setup" icon="server" href="/v3/integrations/mcp/setup">  
  Set up your own MCP server
</Card>

<Card title="Custom Tools" icon="wrench" href="/v3/integrations/mcp/tools">
  Create custom MCP tools
</Card>
</CardGroup>


================================================
FILE: packages/docs/v3/best-practices/prompting-best-practices.mdx
================================================
---
title: Prompting Best Practices
description: "Write effective prompts for reliable Stagehand automation"
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


Good prompts make Stagehand reliable. Bad prompts cause failures. Here's how to write prompts that work consistently.

## Act Method

Use `act()` for single actions on web pages. Each action should be focused and clear.

```typescript
// Good - Single, specific actions
await stagehand.act("click the 'Add to Cart' button");
await stagehand.act("type 'user@example.com' into the email field");

// Bad - Multiple actions combined
await stagehand.act("fill out the form and submit it");
await stagehand.act("login with credentials and navigate to dashboard");
```

### Use Element Types, Not Colors

Describe elements by their type and function rather than visual attributes like color.

```typescript
// Good - Element types and descriptive text
await stagehand.act("click the 'Sign In' button");
await stagehand.act("type into the email input field");

// Bad - Color-based descriptions
await stagehand.act("click the blue button");
await stagehand.act("type into the white input");
```

### Use Descriptive Language

```typescript
// Good - Clear element identification
await stagehand.act("click the 'Next' button at the bottom of the form");
await stagehand.act("type into the search bar at the top of the page");

// Bad - Vague descriptions
await stagehand.act("click next");
await stagehand.act("type into search");
```

### Choose the Right Action Verbs

- **Click** for buttons, links, checkboxes
- **Type** for text inputs
- **Select** for dropdowns
- **Check/uncheck** for checkboxes
- **Upload** for file inputs

```typescript
// Good
await stagehand.act("click the submit button");
await stagehand.act("select 'Option 1' from dropdown");

// Bad
await stagehand.act("click submit");
await stagehand.act("choose option 1");
```

### Protect Sensitive Data

Variables keep sensitive information out of prompts and logs.

```typescript
// Use variables for sensitive data
await stagehand.act("type %username% into the email field", {
  variables: { username: "user@example.com" }
});

await stagehand.act("type %password% into the password field", {
  variables: { password: process.env.USER_PASSWORD }
});
```

<Warning>
Set `verbose: 0` in your Stagehand config to prevent secrets from appearing in logs.
</Warning>

## Extract Method

Use `extract()` to pull structured data from pages. Define clear schemas and provide context.

### Schema Best Practices

Use descriptive field names, correct types, and detailed descriptions. Field descriptions provide context that helps the model understand exactly what to extract.

```typescript
// Good - Descriptive names, correct types, and helpful descriptions
const productData = await stagehand.extract(
  "Extract product information",
  z.object({
    productTitle: z.string().describe("The main product name displayed on the page"),
    priceInDollars: z.number().describe("Current selling price as a number, without currency symbol"),
    isInStock: z.boolean().describe("Whether the product is available for purchase")
  })
);

// Bad - Generic names, wrong types, no descriptions
const data = await stagehand.extract(
  "Get product details",
  z.object({
    name: z.string(), // Too generic, no context
    price: z.string(), // Should be number
    stock: z.string() // Should be boolean, no context
  })
);
```

### Use Proper URL Types

Specify URL types with `z.string().url()` to tell Stagehand to extract URLs.

```typescript
// Good - Tells Stagehand to extract URLs
const links = await stagehand.extract(
  "Extract navigation links",
  z.array(z.object({
    text: z.string(),
    url: z.string().url() // Required for URL extraction
  }))
);

// Single URL extraction
const contactUrl = await stagehand.extract(
  "extract the contact page URL",
  z.string().url()
);
```

## Observe Method

Use `observe()` to discover actionable elements before acting on them.

### Check Elements First

Verify elements exist before taking action to avoid errors.

```typescript
// Check for elements first
const loginButtons = await stagehand.observe("Find the login button");

if (loginButtons.length > 0) {
  await stagehand.act(loginButtons[0]);
} else {
  console.log("No login button found");
}
```

### Be Specific About Element Types

```typescript
// Good - Specific element types
const submitButtons = await stagehand.observe("Find submit button in the form");
const dropdowns = await stagehand.observe("Find the state dropdown menu");

// Bad - Too vague
const elements = await stagehand.observe("Find submit stuff");
const things = await stagehand.observe("Find state selection");
```

## Agent Method

Use `agent()` for complex, multi-step workflows. Provide detailed instructions and set appropriate limits.

### Navigate First

Don't include navigation in agent tasks. Handle it separately.

```typescript
// Good - Navigate first
await page.goto('https://amazon.com');
await agent.execute('Search for wireless headphones under $100 and add the best rated one to cart');

// Bad - Navigation in task
await agent.execute('Go to Amazon, search for headphones, and add one to cart');
```

### Be Highly Specific

Detailed instructions lead to better results.

```typescript
// Good - Detailed instructions
await agent.execute({
  instruction: "Find Italian restaurants in Brooklyn that are open after 10pm, have outdoor seating, and are rated 4+ stars. Save the top 3 results.",
  maxSteps: 25
});

// Bad - Vague instructions
await agent.execute("Find some good restaurants");
```

### Set Appropriate Step Limits

Match step limits to task complexity.

```typescript
// Simple task - fewer steps
await agent.execute({
  instruction: "Subscribe to the newsletter with email 'user@example.com'",
  maxSteps: 10
});

// Complex task - more steps  
await agent.execute({
  instruction: "Research and compare 5 project management tools with pricing and features",
  maxSteps: 50
});
```

### Include Success Criteria

Tell the agent how to know when it's done.

```typescript
// Good - Clear success criteria
await agent.execute({
  instruction: "Add 3 smartphone cases to cart and confirm the cart shows exactly 3 items with total price",
  maxSteps: 20
});

// Bad - No validation
await agent.execute("Add some items to cart");
```

## Common Mistakes to Avoid

- **Combining multiple actions** - Keep each `act()` call to one action
- **Using vague descriptions** - Be specific about which elements to interact with  
- **Exposing sensitive data** - Always use variables for credentials
- **Skipping validation** - Check results before proceeding

## Testing Your Prompts

1. **Start simple** - Test basic functionality first
2. **Add complexity gradually** - Build up to complex workflows
3. **Monitor results** - Use logging to understand what's happening
4. **Iterate based on failures** - Refine prompts when they don't work

Remember: Good prompting is iterative. When in doubt, be more specific rather than less.

================================================
FILE: packages/docs/v3/best-practices/speed-optimization.mdx
================================================
---
title: Speed Optimization
sidebarTitle: Speed Optimization
description: Optimize Stagehand performance for faster automation and reduced latency
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


Stagehand performance depends on several factors: DOM processing speed, LLM inference time, browser operations, and network latency. This guide provides proven strategies to maximize automation speed.

## Quick Performance Wins

### 1. Plan Ahead with Observe


Use a single `observe()` call to plan multiple actions, then execute them efficiently:

```typescript
// Instead of sequential operations with multiple LLM calls
await stagehand.act("Fill name field");        // LLM call #1
await stagehand.act("Fill email field");       // LLM call #2
await stagehand.act("Select country dropdown"); // LLM call #3

// Use single observe to plan all form fields - one LLM call
const formFields = await stagehand.observe("Find all form fields to fill");

// Execute all actions without LLM inference
for (const field of formFields) {
  await stagehand.act(field); // No LLM calls!
}
```

<Note>
**Performance Tip**: Acting on `observe` results avoids LLM inference entirely. This approach is 2-3x faster than direct `act()` calls and is the recommended pattern for multi-step workflows.
</Note>

<Card title="Caching Guide" icon="database" href="/v3/best-practices/caching">
  Learn advanced caching patterns and cache invalidation strategies
</Card>

### 2. Optimize DOM Processing

Reduce DOM complexity before Stagehand processes the page:

```typescript
// Remove heavy elements that slow down processing
await page.evaluate(() => {
  // Remove video elements
  document.querySelectorAll('video, iframe').forEach(el => el.remove());
  
  // Hide complex animations
  document.querySelectorAll('[style*="animation"]').forEach(el => {
    (el as HTMLElement).style.animation = 'none';
  });
});

// Then perform Stagehand operations
await stagehand.act("Click the submit button");
```

### 3. Set Appropriate Timeouts

Use shorter timeouts for simple operations and longer ones for complex page loads:

```typescript
// Simple actions - reduce action timeout
await stagehand.act("Click the login button", {
  timeout: 5000  // Default is 30000ms, reduce for simple clicks
});

// Complex page loads - optimize navigation
const page = stagehand.context.pages()[0];
await page.goto("https://heavy-spa.com", {
  waitUntil: "domcontentloaded", // Don't wait for all resources
  timeout: 15000 // Shorter than default 30s
});
```

## Performance Monitoring and Benchmarking

Track performance metrics and measure optimization impact:

### Performance Tracking

```typescript
class PerformanceTracker {
  private speedMetrics: Map<string, number[]> = new Map();

  async timedAct(page: Page, prompt: string): Promise<ActResult> {
    const start = Date.now();
    const result = await stagehand.act(prompt);
    const duration = Date.now() - start;
    
    if (!this.speedMetrics.has(prompt)) {
      this.speedMetrics.set(prompt, []);
    }
    this.speedMetrics.get(prompt)!.push(duration);
    
    console.log(`Action "${prompt}" took ${duration}ms`);
    return result;
  }

  getAverageTime(prompt: string): number {
    const times = this.speedMetrics.get(prompt) || [];
    return times.reduce((a, b) => a + b, 0) / times.length;
  }
}
```

Example Output:
```
Action "Fill form" took 1000ms
Action "Click submit" took 2000ms
Action "Confirm submission" took 5000ms
```

### Before vs After Benchmarking

```typescript
// Before optimization
console.time("workflow");
await stagehand.act("Fill form");
await stagehand.act("Click submit");
await stagehand.act("Confirm submission");
console.timeEnd("workflow"); // 8000ms

// After optimization with observe planning
console.time("workflow-optimized");
const workflowActions = await stagehand.observe("Find form, submit, and confirm elements");

// Execute actions sequentially to avoid conflicts
for (const action of workflowActions) {
  await stagehand.act(action);
}
console.timeEnd("workflow-optimized"); // 500ms
```

Example Output:
```
workflow: 8.000s
workflow-optimized: 500.000ms
```

<CardGroup cols={1}>
<Card title="Observability & Metrics" icon="chart-line" href="/v3/configuration/observability">
  Set up comprehensive performance monitoring
</Card>
</CardGroup>


## Related Resources

<CardGroup cols={2}>
<Card title="Caching Strategies" icon="database" href="/v3/best-practices/caching">
  Advanced caching patterns for maximum performance
</Card>

<Card title="Cost Optimization" icon="dollar-sign" href="/best-practices/cost-optimization">
  Balance speed improvements with cost considerations
</Card>

<Card title="Browser Configuration" icon="window-maximize" href="/configuration/browser">
  Optimize Browserbase settings for speed
</Card>

<Card title="Model Selection" icon="brain" href="/configuration/models">
  Choose the right model for speed vs accuracy
</Card>
</CardGroup>

================================================
FILE: packages/docs/v3/best-practices/usecase-observe.mdx
================================================
---
sidebarTitle: Use Cases
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


## Real-World Use Cases

### E-commerce Product Discovery

```typescript
// Discover product interaction elements
const productActions = await stagehand.observe({
  instruction: "Find add to cart buttons, size selectors, and product images"
});

// Categorize actions by type
const cartButtons = productActions.filter(a => 
  a.description.toLowerCase().includes('cart')
);
const sizeOptions = productActions.filter(a => 
  a.description.toLowerCase().includes('size')
);

// Execute purchase workflow
if (sizeOptions.length > 0) {
  await stagehand.act(sizeOptions[0]); // Select size first
}
if (cartButtons.length > 0) {
  await stagehand.act(cartButtons[0]); // Then add to cart
}
```

### Form Handling & Validation

```typescript
// Analyze form structure before filling
const formElements = await stagehand.observe({
  instruction: "Find form fields, validation messages, and submit buttons"
});

// Check for required fields
const requiredFields = formElements.filter(e => 
  e.description.includes('required') || e.description.includes('*')
);

console.log(`Found ${requiredFields.length} required fields to complete`);

// Fill form systematically
for (const field of requiredFields) {
  await stagehand.act(field);
  // Add appropriate input based on field type
}
```

### Dynamic Content & SPA Navigation

```typescript
// Wait for and discover dynamically loaded content
await page.waitForLoadState('networkidle');

const dynamicElements = await stagehand.observe({
  instruction: "Find newly loaded content, infinite scroll triggers, or loading indicators",
  domSettleTimeoutMs: 15000 // Wait longer for dynamic content
});

// Handle infinite scroll
const scrollTriggers = dynamicElements.filter(e => 
  e.description.toLowerCase().includes('load more') ||
  e.description.toLowerCase().includes('scroll')
);

if (scrollTriggers.length > 0) {
  await stagehand.act(scrollTriggers[0]);
  // Recursively observe new content
  const newContent = await stagehand.observe("Find additional items");
}
```

### Multi-Step Workflow Planning

```typescript
// Plan entire checkout flow upfront
async function planCheckoutWorkflow() {
  // Step 1: Cart page analysis
  await page.goto('/cart');
  const cartActions = await stagehand.observe("Find checkout and cart modification options");
  
  // Step 2: Checkout page analysis  
  const checkoutButton = cartActions.find(a => a.description.includes('checkout'));
  if (checkoutButton) await stagehand.act(checkoutButton);
  
  const checkoutActions = await stagehand.observe("Find payment forms and shipping options");
  
  // Step 3: Plan execution order
  const shippingFields = checkoutActions.filter(a => a.description.includes('shipping'));
  const paymentFields = checkoutActions.filter(a => a.description.includes('payment'));
  const submitButton = checkoutActions.find(a => a.description.includes('complete order'));
  
  return { shippingFields, paymentFields, submitButton };
}

// Execute planned workflow
const workflow = await planCheckoutWorkflow();
// Fill shipping → payment → submit
```


================================================
FILE: packages/docs/v3/best-practices/user-data.mdx
================================================
---
title: User Data Directory
sidebarTitle: User Data
description: Persist browser data between sessions
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />

### User Data Directory

Persist browser data between sessions.

#### Local Sessions

For local sessions, use the `userDataDir` option:

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "LOCAL",
  localBrowserLaunchOptions: {
    userDataDir: "./browser-data",
  },
});

await stagehand.init();
```

#### Browserbase Sessions

For Browserbase sessions, use [contexts](https://docs.browserbase.com/features/contexts) to persist browser data:

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "BROWSERBASE",
  browserbaseSessionCreateParams: {
    browserSettings: {
      context: {
        id: "my-context-id",
        persist: true,
      },
    },
  },
});

await stagehand.init();
console.log("Session ID:", stagehand.sessionId);
```

================================================
FILE: packages/docs/v3/best-practices/using-multiple-tabs.mdx
================================================
---
title: 'Using Multiple Tabs'
description: 'Act on multiple tabs with Stagehand'
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


Many modern web applications open new tabs when users click certain buttons or links. Without proper multitab support, automation scripts break when expected content appears in a new tab rather than the current one. Stagehand's multitab capabilities ensure your automations work seamlessly across multitab workflows.

## The Stagehand Page

Stagehand automatically adapts to multitab workflows. The active page (accessed via `context.activePage()`) always points to the most recently opened or active tab, ensuring your automations continue working even when new tabs are created.

This means you can continue using familiar patterns:

```typescript
const page = stagehand.context.pages()[0];
await page.goto("https://example.com");
await stagehand.act("click the button that opens a new tab");
// Stagehand now automatically targets the new tab, because it has become the active page
await stagehand.extract("get data from new tab");
```

<Warning>
**Important**: [Stagehand Agent](/v3/basics/agent) will always operate on the active page. If you need an agent to work across specific tabs, you'll need to manage page switching manually.
</Warning>

## Manual Page Management

For more control or multitab workflows, you can manage multiple tabs explicitly:

```typescript
// Create a second page
await stagehand.context.newPage();
const pages = stagehand.context.pages();

const githubPage = pages[0];
const pythonPage = pages[1];

// Navigate each page to different repositories
await githubPage.goto("https://github.com/browserbase/stagehand");
await pythonPage.goto("https://github.com/browserbase/stagehand-python");

// Extract data from both pages simultaneously
const [stagehandStars, stagehandPythonStars] = await Promise.all([
  stagehand.extract("extract the repository stars", { page: githubPage }),
  stagehand.extract("extract the repository stars", { page: pythonPage })
]);

console.log(`Stagehand stars: ${stagehandStars}`);
console.log(`Stagehand-Python stars: ${stagehandPythonStars}`);
```

## Next Steps

<CardGroup cols={2}>
  <Card title="Orchestrate complex workflows with Agent" icon="robot" iconType="sharp-solid" href="/v3/basics/agent">
    Use `Agent` to autonomously execute multi-step tasks and complex workflows.
  </Card>

  <Card title="Working with iframes" icon="frame" iconType="sharp-solid" href="/v3/best-practices/working-with-iframes">
    Learn best practices for interacting with elements inside iframes.
  </Card>

  <Card title="Browser Configuration" icon="browser" iconType="sharp-solid" href="/v3/configuration/browser">
    Manage browser contexts and sessions for complex automation scenarios.
  </Card>

  <Card title="Logging & Debugging" icon="bug" iconType="sharp-solid" href="/v3/configuration/logging">
    Handle errors gracefully and debug automation issues effectively.
  </Card>
</CardGroup>

================================================
FILE: packages/docs/v3/configuration/browser.mdx
================================================
---
title: Browser
sidebarTitle: Browser
description: Configure Stagehand on Browserbase or locally
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


Stagehand supports two primary environments:

- **Browserbase** - Cloud-managed browser infrastructure optimized for production web automation at scale
- **Local** - Run browsers directly on your machine for development and debugging

## Browserbase Environment

Browserbase provides managed cloud browser infrastructure optimized for web automation at scale. It offers advanced features like stealth mode, proxy support, and persistent contexts.

<Card icon="cloud" title="Browserbase" href="https://docs.browserbase.com" description="Explore the features and benefits of using Browserbase for scalable web automation.">
  Discover the power of cloud-managed browser infrastructure with Browserbase.
</Card>

### Multi-Region Support

The Stagehand API is available in multiple regions to optimize latency and support data residency requirements. The SDK automatically routes requests to the correct regional API endpoint based on your browser session's region.

| Region | API Endpoint |
| --- | --- |
| **us-west-2** (Default) | https://api.stagehand.browserbase.com |
| **us-east-1** | https://api.use1.stagehand.browserbase.com |
| **eu-central-1** | https://api.euc1.stagehand.browserbase.com |
| **ap-southeast-1** | https://api.apse1.stagehand.browserbase.com |

Configure your browser session region in `browserbaseSessionCreateParams`:

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "BROWSERBASE",
  browserbaseSessionCreateParams: {
    region: "eu-central-1", // Browser runs in Frankfurt
  },
});

await stagehand.init();
```

<Warning>
The API endpoint must match your browser session region. If there's a mismatch, you'll receive an error:
`Session is in region 'X' but this API instance serves 'Y'. Please route your request to the X Stagehand API endpoint.`
</Warning>

### Disabling Stagehand API

If you want to use Stagehand purely as a local library without routing through the Stagehand API, you can disable API mode:

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "BROWSERBASE",
  disableAPI: true, // Disable Stagehand API - runs locally with Browserbase
});

await stagehand.init();
```

<Tip>
Disabling the API is useful when you want to manage browser sessions directly while still using Stagehand's automation features locally.
</Tip>

### Environment Variables

Before getting started, set up the required environment variables:

<CodeGroup>
```bash .env
BROWSERBASE_API_KEY=your_api_key_here
BROWSERBASE_PROJECT_ID=your_project_id_here
```
</CodeGroup>

<Tip>
Get your API key and Project ID from the [Browserbase Dashboard](https://browserbase.com/overview)
</Tip>

### Using Stagehand with Browserbase

#### Basic Setup

The simplest way to get started is with default settings:

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "BROWSERBASE",
});

await stagehand.init();
```

#### Advanced Configuration

Configure browser settings, proxy support, and other session parameters:
```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "BROWSERBASE",
  // Optional: API Key and Project ID will be pulled directly from your environment
  apiKey: process.env.BROWSERBASE_API_KEY,
  projectId: process.env.BROWSERBASE_PROJECT_ID,
  browserbaseSessionCreateParams: {
    proxies: true,
    region: "us-west-2",
    browserSettings: {
      viewport: { width: 1920, height: 1080 },
      blockAds: true,
    },
  },
});

await stagehand.init();
console.log("Session ID:", stagehand.sessionId);
```

<Accordion title="Advanced Browserbase Configuration Example">
    ```typescript
    const stagehand = new Stagehand({
      env: "BROWSERBASE",
      apiKey: process.env.BROWSERBASE_API_KEY,
      projectId: process.env.BROWSERBASE_PROJECT_ID,
      browserbaseSessionCreateParams: {
        projectId: process.env.BROWSERBASE_PROJECT_ID!,
        proxies: true,
        region: "us-west-2",
        timeout: 3600, // 1 hour session timeout
        keepAlive: true, // Available on Startup plan
        browserSettings: {
          advancedStealth: false, // this is a Scale Plan feature - reach out to support@browserbase.com to enable
          blockAds: true,
          solveCaptchas: true,
          recordSession: false,
          viewport: {
            width: 1920,
            height: 1080,
          },
        },
        userMetadata: {
          userId: "automation-user-123",
          environment: "production",
        },
      },
    });
    ```
</Accordion>

### Alternative: Browserbase SDK

If you prefer to manage sessions directly, you can use the Browserbase SDK:

```typescript
import { Browserbase } from "@browserbasehq/sdk";

const bb = new Browserbase({ 
  apiKey: process.env.BROWSERBASE_API_KEY! 
});

const session = await bb.sessions.create({
  projectId: process.env.BROWSERBASE_PROJECT_ID!,
  // Add configuration options here
});
```

#### Connecting to an Existing Session

Connect to a previously created Browserbase session using its session ID:

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "BROWSERBASE",
  browserbaseSessionID: "existing-session-uuid-here",
});

await stagehand.init();
console.log("Resumed Session ID:", stagehand.sessionId);
```

## Local Environment

The local environment runs browsers directly on your machine, providing full control over browser instances and configurations. Ideal for development, debugging, and scenarios requiring custom browser setups.

### Environment Comparison

| Feature | Browserbase | Local |
| --- | --- | --- |
| **Scalability** | High (cloud-managed) | Limited (local resources) |
| **Stealth Features** | Advanced fingerprinting | Basic stealth |
| **Proxy Support** | Built-in residential proxies | Manual configuration |
| **Session Persistence** | Cloud context storage | File-based user data |
| **Geographic Distribution** | Multi-region deployment | Single machine |
| **Debugging** | Session recordings & logs | Direct DevTools access |
| **Setup Complexity** | Environment variables only | Browser installation required |
| **Cost** | Usage-based pricing | Infrastructure & maintenance |
| **Best For** | Production, scale, compliance | Development, debugging |

### Basic Local Setup

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "LOCAL"
});
  
await stagehand.init();
console.log("Session ID:", stagehand.sessionId);
```

### Advanced Local Configuration

Customize browser launch options for local development:

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "LOCAL",
  localBrowserLaunchOptions: {
    headless: false, // Show browser window
    devtools: true, // Open developer tools
    viewport: { width: 1280, height: 720 },
    executablePath: '/opt/google/chrome/chrome', // Custom Chrome path
    port: 9222, // Fixed CDP debugging port
    args: [
      '--no-sandbox',
      '--disable-setuid-sandbox',
      '--disable-web-security',
      '--allow-running-insecure-content',
    ],
    userDataDir: './chrome-user-data', // Persist browser data
    preserveUserDataDir: true, // Keep data after closing
    chromiumSandbox: false, // Disable sandbox (adds --no-sandbox)
    ignoreHTTPSErrors: true, // Ignore certificate errors
    locale: 'en-US', // Set browser language
    deviceScaleFactor: 1.0, // Display scaling
    proxy: {
      server: 'http://proxy.example.com:8080',
      username: 'user',
      password: 'pass'
    },
    downloadsPath: './downloads', // Download directory
    acceptDownloads: true, // Allow downloads
    connectTimeoutMs: 30000, // Connection timeout
  },
});

await stagehand.init();
```

## Advanced Configuration

### Keep Alive

The `keepAlive` option controls whether the browser remains running after `stagehand.close()` is called or when the parent process exits unexpectedly (e.g., crash, `SIGTERM`, `SIGINT`).

By default, Stagehand terminates the browser and cleans up all resources when it shuts down. Setting `keepAlive: true` keeps the browser running independently so you can reconnect to it later.

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "BROWSERBASE",
  keepAlive: true,
});

await stagehand.init();

// The browser session continues running after close()
await stagehand.close();

// Later, reconnect to the same session
const stagehand2 = new Stagehand({
  env: "BROWSERBASE",
  browserbaseSessionID: stagehand.browserbaseSessionID,
});
await stagehand2.init();
```

#### Behavior by Environment

| Behavior | `keepAlive: true` | `keepAlive: false` (default) |
| --- | --- | --- |
| **Browserbase** | Session stays active after `close()` | Session is terminated via API |
| **Local** | Chrome process continues running | Chrome process is killed and temp profile is removed |
| **On crash/signal** | Browser is left running | Browser is automatically cleaned up |

#### Local Environment

When running locally with `keepAlive: true`, the Chrome process is detached from the Node.js event loop, allowing your script to exit while the browser stays open. This is useful for debugging or for handing off a browser session to another process.

```typescript
const stagehand = new Stagehand({
  env: "LOCAL",
  keepAlive: true,
  localBrowserLaunchOptions: {
    headless: false,
  },
});

await stagehand.init();
const page = stagehand.context.pages()[0];
await page.goto("https://example.com");

// Browser window stays open after the script exits
await stagehand.close();
```

#### Browserbase Environment

On Browserbase, `keepAlive: true` keeps the cloud session active so you can reconnect later using `browserbaseSessionID`. This is useful for long-running workflows that span multiple script executions.

<Note>
The top-level `keepAlive` option overrides `browserbaseSessionCreateParams.keepAlive` when both are provided.
</Note>

### Fixed CDP Debugging Port

Specify a fixed Chrome DevTools Protocol (CDP) debugging port instead of using a randomly assigned one.

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "LOCAL",
  localBrowserLaunchOptions: {
    port: 9222,
  },
});

await stagehand.init();
```

<Tip>
If no `port` is specified, a random port will be assigned.
</Tip>

### DOM Settle Timeout

Configure how long Stagehand waits for the DOM to stabilize before taking actions.

```typescript
const stagehand = new Stagehand({
  env: "BROWSERBASE",
  domSettleTimeout: 3000 // Wait up to 3 seconds for DOM to settle
});
```

#### What is DOM Settling?

DOM settling ensures that:
- **Animations complete** before interacting with elements
- **Lazy-loaded content** has time to appear
- **JavaScript updates** finish before actions are taken
- **Dynamic content** is fully rendered

#### When to Adjust

Increase `domSettleTimeout` for pages with:
- Heavy animations or transitions
- Lazy-loading or infinite scroll
- Dynamic JavaScript frameworks (React, Vue, Angular)
- Complex single-page applications

```typescript
// For fast, static pages
const stagehand = new Stagehand({
  env: "BROWSERBASE",
  domSettleTimeout: 500 // Minimal wait
});

// For dynamic, animated pages
const stagehand = new Stagehand({
  env: "BROWSERBASE",
  domSettleTimeout: 5000 // Longer wait for stability
});
```

<Warning>
Setting `domSettleTimeout` too low may cause actions to fail on elements that aren't ready. Setting it too high increases execution time unnecessarily.
</Warning>

## Troubleshooting

<AccordionGroup>
<Accordion title="Browserbase Authentication Errors">
- Verify your `BROWSERBASE_API_KEY` and `BROWSERBASE_PROJECT_ID` are set correctly
- Check that your API key has the necessary permissions
- Ensure your Browserbase account has sufficient credits
</Accordion>

<Accordion title="Local Browser Launch Failures">
- Install Chrome or Chromium on your system
- Set the correct `executablePath` for your Chrome installation
- Check that required dependencies are installed (Linux: `libnss3-dev libatk-bridge2.0-dev libgtk-3-dev libxss1 libasound2`)
</Accordion>

<Accordion title="Session Timeout Issues">
- Increase session timeout in `browserbaseSessionCreateParams.timeout`
- Use `keepAlive: true` for long-running sessions
- Monitor session usage to avoid unexpected terminations
</Accordion>
</AccordionGroup>

================================================
FILE: packages/docs/v3/configuration/logging.mdx
================================================
---
title: Logging
sidebarTitle: Logging
description: Set up logging, debugging, and error tracking for Stagehand workflows
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


Stagehand provides comprehensive logging capabilities to help you debug automation workflows, track execution, and diagnose issues. Configure logging levels, structured output, and debugging tools for both development and production environments.

## Quick Start

Choose your logging setup based on your environment:

<CodeGroup>
```typescript Development
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "LOCAL",
  verbose: 2,  // Full debug output
  // restOfYourConfiguration...
});
```

```typescript Production
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "BROWSERBASE",
  verbose: 1,  // Standard logging - less noise
  disablePino: true,  // Disable default console logging - no console spam
  // logger: yourProductionLogger,  // Send to observability platform like Sentry or DataDog
  // restOfYourConfiguration...
});
```

```typescript Testing
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "LOCAL",
  verbose: 1,
  // Pino automatically disabled in test environments - no worker thread issues
  // logger: yourTestLogger,  // Send to test logging framework like Jest
  // restOfYourConfiguration...
});
```
</CodeGroup>

---

## Operational Logging

Real-time event logging during automation execution.

### Verbosity Level

Control how much detail you see in logs:

<Tabs>
<Tab title="Level 2: Debug">
**Use for:** Development, debugging specific issues

```typescript
const stagehand = new Stagehand({
  verbose: 2,  // Maximum detail
  // restOfYourConfiguration...
});
```

<Accordion title="Example Output">

```
[12:34:56] DEBUG: Capturing DOM snapshot
[12:34:57] DEBUG: DOM contains 847 elements
[12:34:58] DEBUG: LLM inference started
[12:34:59] DEBUG: LLM response: {"selector": "#btn-submit", "method": "click"}
[12:35:00] INFO: act completed successfully
```

</Accordion>
</Tab>

<Tab title="Level 1: Info (Default)">
**Use for:** Standard operations, staging, production

```typescript
const stagehand = new Stagehand({
  verbose: 1,  // Default level
  // restOfYourConfiguration...
});
```


<Accordion title="Example Output">

```
[12:34:56] INFO: act started
[12:35:00] INFO: act completed successfully
[12:35:01] INFO: extract started
[12:35:03] INFO: extract completed
```

</Accordion>
</Tab>

<Tab title="Level 0: Errors Only">
**Use for:** Production with external monitoring, minimal noise

```typescript
const stagehand = new Stagehand({
  verbose: 0,  // Errors only
  // restOfYourConfiguration...
});
```

<Accordion title="Example Output">

```
[12:35:05] ERROR: act failed: element not found
[12:35:10] ERROR: navigation timeout exceeded
```

</Accordion>
</Tab>
</Tabs>

---

### Log Destinations

Logs can be sent to different destinations, including your console and external observability platforms:

<Tabs>
<Tab title="Pino (Default)">
Fast, structured, colorized JSON logger with console output.

**When to use:** Development, staging, or production without external observability; can manage multiple Stagehand instances

```typescript
// Enabled by default - Pino handles console output automatically
const stagehand = new Stagehand({
  verbose: 1,
  // restOfYourConfiguration...
});
```

<Accordion title="Auto-disabled when">
- `process.env.NODE_ENV === "test"`
- `process.env.JEST_WORKER_ID !== undefined` (Jest tests)
- `process.env.PLAYWRIGHT_TEST_BASE_DIR !== undefined` (Playwright tests)
- `process.env.CI === "true"` (CI/CD environments)

**Why auto-disable?** Pino uses worker threads for pretty-printing, which can cause issues in test runners.
</Accordion>
</Tab>

<Tab title="Console Fallback">
Simple console.log/error output.

**When to use:** Automatically activated in tests, or when `disablePino: true` without setting an external logger

```typescript
const stagehand = new Stagehand({
  verbose: 1,
  disablePino: true, // Set to true automatically when a test is detected
  // restOfYourConfiguration...
});
```

<Accordion title="Auto-enabled when">
- `process.env.NODE_ENV === "test"`
- `process.env.JEST_WORKER_ID !== undefined` (Jest tests)
- `process.env.PLAYWRIGHT_TEST_BASE_DIR !== undefined` (Playwright tests)
- `process.env.CI === "true"` (CI/CD environments)

**Why is Pino auto-disabled here?** Pino uses worker threads for pretty-printing, which can cause issues in test runners, so Stagehand falls back to plain console output.
</Accordion>
</Tab>
<Tab title="Custom Logger">
Your custom logging function to receive all logs. Works independently of Pino - receives logs regardless of Pino setting.

**When to use:** Development, debugging, or when you don't need querying
capabilities.

<Steps>

<Step title="Create a simple logger">
```typescript
// Simple logger without parsing (for basic console output)
const simpleLogger = (logLine: LogLine) => {
  console.log(`[${logLine.level}] ${logLine.message}`);

  // Optional: log raw auxiliary data
  if (logLine.auxiliary) {
    console.log('  Context:', logLine.auxiliary);
  }
};
```
</Step>

<Step title="Pass the logger in your Stagehand instance">
Then pass the logger in your Stagehand instance:

```typescript
const stagehand = new Stagehand({
  env: "BROWSERBASE",
  verbose: 1,
  logger: simpleLogger,
  disablePino: true,  // Avoid duplicate processing
  // restOfYourConfiguration...
})
```

</Step>
</Steps>
</Tab>

<Tab title="External Logger (Production)">
Your custom logging function to receive all logs. Works independently of Pino - receives logs regardless of Pino setting.

**When to use:** Production with DataDog, Sentry, CloudWatch, or custom observability platforms, for centralized monitoring and error alerting. Here are examples using Sentry and DataDog:

<Steps>

<Step title="Create a production logger">

<Tabs>

<Tab title="Sentry">

```typescript
import * as Sentry from "@sentry/node";

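const productionLogger = (logLine: LogLine) => {
  // Send errors to Sentry
  if (logLine.level === 0) {
    // Flatten the auxiliary metadata with the helper defined below
    const aux = parseAuxiliary(logLine.auxiliary);
    Sentry.captureMessage(logLine.message, {
      level: 'error',
      extra: aux,
    });
  }
}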

// Helper to parse auxiliary data to be flat, numeric, and filterable
function parseAuxiliary(aux?: LogLine['auxiliary']): Record<string, any> {
  if (!aux) return {};
  const parsed: Record<string, any> = {};
  for (const [key, entry] of Object.entries(aux)) {
    parsed[key] = entry.type === 'object'
      ? JSON.parse(entry.value)
      : entry.value;
  }
  return parsed;
}
```

</Tab>
<Tab title="DataDog">

```typescript
import { datadogLogs } from "@datadog/browser-logs";

const productionLogger = (logLine: LogLine) => {
  // Flatten the auxiliary metadata with the helper defined below
  const aux = parseAuxiliary(logLine.auxiliary);

  // Send all logs to DataDog
  datadogLogs.logger.log(logLine.message, {
    status: logLine.level === 0 ? 'error' : 'info',
    service: 'stagehand-automation',
    category: logLine.category,
    ...aux,
  });
}

// Helper to parse auxiliary data to be flat, numeric, and filterable
function parseAuxiliary(aux?: LogLine['auxiliary']): Record<string, any> {
  if (!aux) return {};
  const parsed: Record<string, any> = {};
  for (const [key, entry] of Object.entries(aux)) {
    parsed[key] = entry.type === 'object'
      ? JSON.parse(entry.value)
      : entry.value;
  }
  return parsed;
}
```
</Tab>
</Tabs>

</Step>

<Step title="Pass the logger in your Stagehand instance">

```typescript
const stagehand = new Stagehand({
  env: "BROWSERBASE",
  verbose: 1,
  logger: productionLogger,
  disablePino: true,  // Avoid duplicate processing
  // restOfYourConfiguration...
})
```

</Step>
</Steps>

</Tab>
</Tabs>

---

## File-Based Session Logging

Enable detailed file-based logging for all Stagehand operations by setting a config directory. This creates comprehensive logs for `agent.execute`, `act`, `observe`, `extract`, CDP events, and LLM requests/responses.

### Setup

Add to your shell configuration (`~/.zshrc`, `~/.bashrc`, etc.):

```bash
export BROWSERBASE_CONFIG_DIR=~/.config/browserbase
```

Then reload your shell or run `source ~/.zshrc`.

### Usage

Run your Stagehand script as normal:

```bash
tsx run_some_script_that_imports_stagehand.ts
```

Logs are written to `~/.config/browserbase/sessions/<session-id>/` with a `latest` symlink pointing to the most recent session.

### Viewing Logs

<Tabs>
<Tab title="Real-time Monitoring">
Follow all logs as they happen:

```bash
tail -f ~/.config/browserbase/sessions/latest/*.log
```

Or watch specific log types:

```bash
# LLM requests and responses only
tail -f ~/.config/browserbase/sessions/latest/llm_events.log

# CDP (Chrome DevTools Protocol) events only
tail -f ~/.config/browserbase/sessions/latest/cdp_events.log
```
</Tab>

<Tab title="Chronological Review">
View unified output sorted by timestamp:

```bash
cat ~/.config/browserbase/sessions/latest/*.log | sort
```
</Tab>

<Tab title="Historical Sessions">
Browse previous session logs:

```bash
ls ~/.config/browserbase/sessions/
# Output: 2025-01-06_14-30-45_abc123  2025-01-06_15-45-12_def456  latest

cat ~/.config/browserbase/sessions/2025-01-06_14-30-45_abc123/*.log | sort
```
</Tab>
</Tabs>

### Log Files

Each session directory contains:

| File | Contents |
|------|----------|
| `llm_events.log` | LLM requests and responses for act, extract, observe, and agent operations |
| `cdp_events.log` | Chrome DevTools Protocol calls and events |
| `stagehand.log` | General Stagehand operations and state changes |

<Note>
This is especially useful for debugging agent workflows where you need to trace the full sequence of LLM decisions, browser actions, and CDP interactions.
</Note>

---

## LLM Inference Debugging

<Warning>
**Development only** - Creates large files and contains page content. Do not use in production.
</Warning>

Save complete LLM request/response dumps to disk for offline analysis. See exactly what DOM was sent to the LLM and why it chose the wrong element.

```typescript
const stagehand = new Stagehand({
  env: "LOCAL",
  verbose: 2,
  logInferenceToFile: true,  // Writes files to ./inference_summary/
});
```

Creates timestamped files for each LLM call:

```
./inference_summary/
├── act_summary/
│   ├── act_summary.json                      # Aggregate metrics
│   ├── 20250127_123456_act_call.txt          # LLM request
│   ├── 20250127_123456_act_response.txt      # LLM response
│   ├── 20250127_123501_act_call.txt
│   └── 20250127_123501_act_response.txt
├── extract_summary/
│   ├── extract_summary.json
│   ├── 20250127_123510_extract_call.txt
│   ├── 20250127_123510_extract_response.txt
│   ├── 20250127_123511_metadata_call.txt
│   └── 20250127_123511_metadata_response.txt
└── observe_summary/
    ├── observe_summary.json
    └── ...
```

**File Types:**

<AccordionGroup>
<Accordion title="Call File">
Contains the complete LLM request:

```json
{
  "modelCall": "act",
  "messages": [
    {
      "role": "system",
      "content": "You are a browser automation assistant. You have access to these actions:\n- click\n- type\n- scroll\n..."
    },
    {
      "role": "user",
      "content": "Click the sign in button\n\nDOM:\n<html>\n  <body>\n    <button id=\"btn-1\">Sign In</button>\n    <button id=\"btn-2\">Sign Up</button>\n  </body>\n</html>"
    }
  ]
}
```
</Accordion>

<Accordion title="Response File">
Contains the LLM output:

```json
{
  "modelResponse": "act",
  "rawResponse": {
    "selector": "#btn-1",
    "method": "click",
    "reasoning": "Found sign in button with ID btn-1"
  }
}
```
</Accordion>

<Accordion title="Summary File">
Aggregates all calls with metrics:

```json
{
  "act_summary": [
    {
      "act_inference_type": "act",
      "timestamp": "20250127_123456",
      "LLM_input_file": "20250127_123456_act_call.txt",
      "LLM_output_file": "20250127_123456_act_response.txt",
      "prompt_tokens": 3451,
      "completion_tokens": 45,
      "inference_time_ms": 951
    },
    {
      "act_inference_type": "act",
      "timestamp": "20250127_123501",
      "LLM_input_file": "20250127_123501_act_call.txt",
      "LLM_output_file": "20250127_123501_act_response.txt",
      "prompt_tokens": 2890,
      "completion_tokens": 38,
      "inference_time_ms": 823
    }
  ]
}
```
</Accordion>
</AccordionGroup>

---

## Reference

### Logging Configuration

All logging options are passed to the Stagehand constructor:

```typescript
const stagehand = new Stagehand({
  // ... your other configurations (env, model, etc.)

  // Logging options:
  verbose?: 0 | 1 | 2;                   // Log level (default: 1)
  logger?: (line: LogLine) => void;      // External logger function
  disablePino?: boolean;                 // Disable Pino backend (default: false)
  logInferenceToFile?: boolean;          // Save LLM requests to disk (default: false)
});
```

| Option | Default | Description |
|--------|---------|-------------|
| `verbose` | `1` | Log level: `0` = errors only, `1` = info, `2` = debug |
| `logger` | `undefined` | Custom logger function for external platforms |
| `disablePino` | `false` | Disable Pino (auto `true` in tests) |
| `logInferenceToFile` | `false` | Save LLM requests and responses to disk (development only) |

### Log Structure

Each log entry follows a structured format:

```typescript
interface LogLine {
  message: string;              // "act completed successfully"
  level?: 0 | 1 | 2;            // error | info | debug
  category?: string;            // "action", "llm", "browser", "cache"
  timestamp?: string;           // ISO 8601 timestamp
  auxiliary?: {                 // Additional structured metadata
    [key: string]: {
      value: string;             // Serialized value
      type: "object" | "string" | "integer" | "float" | "boolean";
    };
  };
}
```

<Accordion title="Log Examples">

<Tabs>
<Tab title="Successful Action">
```json
{
  "category": "action",
  "message": "act completed successfully",
  "level": 1,
  "timestamp": "2025-01-27T12:35:00.123Z",
  "auxiliary": {
    "selector": {
      "value": "#btn-submit",
      "type": "string"
    },
    "executionTime": {
      "value": "1250",
      "type": "integer"
    }
  }
}
```
</Tab>

<Tab title="LLM Inference">
```json
{
  "category": "llm",
  "message": "inference completed",
  "level": 1,
  "timestamp": "2025-01-27T12:34:58.456Z",
  "auxiliary": {
    "model": {
      "value": "gpt-4o",
      "type": "string"
    },
    "promptTokens": {
      "value": "3451",
      "type": "integer"
    },
    "completionTokens": {
      "value": "45",
      "type": "integer"
    }
  }
}
```
</Tab>

<Tab title="Error">
```json
{
  "category": "action",
  "message": "action failed: element not found",
  "level": 0,
  "timestamp": "2025-01-27T12:35:05.789Z",
  "auxiliary": {
    "selector": {
      "value": "#missing-btn",
      "type": "string"
    },
    "url": {
      "value": "https://example.com/form",
      "type": "string"
    }
  }
}
```
</Tab>
</Tabs>

</Accordion>

---

## Next Steps

Now that you have logging configured, explore additional debugging and monitoring tools in [the Observability guide](/v3/configuration/observability):

<CardGroup cols={2}>
<Card title="History API" icon="clock-rotate-left" href="/v3/best-practices/history">
Track all LLM operations (act, extract, observe, agent) with parameters, results, and timestamps. Perfect for debugging sequences and replaying workflows.
</Card>

<Card title="Metrics API" icon="chart-line" href="/v3/configuration/observability#real-time-metrics-%26-monitoring">
Monitor token usage and performance in real-time. Track costs per operation, identify expensive calls, and optimize resource usage.
</Card>

<Card title="LLM Inference Debugging" icon="microscope" href="/v3/configuration/logging#llm-inference-debugging">
Save complete LLM request/response dumps to disk. See exactly what DOM was sent to the LLM and why it made specific decisions.
</Card>

<Card title="Browserbase Session Monitoring" icon="video" href="/v3/configuration/observability#browserbase-session-monitoring">
Watch your automation visually with session recordings, network monitoring, and real-time browser inspection (Browserbase only).
</Card>
</CardGroup>


================================================
FILE: packages/docs/v3/configuration/models.mdx
================================================
---
title: Models
sidebarTitle: Models
description: Use any LLM model with Stagehand for optimal performance
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


Understand web pages, plan actions, and interact with complex interfaces with Google, OpenAI, Anthropic, xAI, DeepSeek, Perplexity, Azure, Ollama, the [Vercel AI Gateway](https://vercel.com/docs/ai-gateway), or any other LLM model from [the Vercel AI SDK](https://sdk.vercel.ai/providers).

---

## Configuration Setup

### Quick Start

<Tip>
  Set your API key in `.env` and Stagehand handles the rest. No explicit
  configuration needed!
</Tip>

Get started with Google Gemini (recommended for speed and cost):

<CodeGroup>
```typescript TypeScript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "BROWSERBASE",
  model: "google/gemini-2.5-flash"
  // API key auto-loads from GOOGLE_GENERATIVE_AI_API_KEY - set in your .env
});

await stagehand.init();

```
</CodeGroup>


---

### First Class Models

Use any model from the following supported providers.

<Tabs>
<Tab title="Google">
<CodeGroup>
```typescript TypeScript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "BROWSERBASE",
  model: "google/gemini-2.5-flash"
  // API key auto-loads from GOOGLE_GENERATIVE_AI_API_KEY - set in your .env
});

await stagehand.init();
```

</CodeGroup>
[View all supported Google models →](https://ai.google.dev/gemini-api/docs/models)
</Tab>

<Tab title="Google Vertex">

<Warning>
Google Vertex requires `experimental: true` in the Stagehand constructor.
</Warning>

<CodeGroup>
```typescript TypeScript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "BROWSERBASE",
  experimental: true, // required for Vertex
  model: {
    modelName: "vertex/gemini-3-flash-preview",
    project: "your-gcp-project-id",
    location: "us-central1",
    googleAuthOptions: {
      credentials: {
        client_email: "your-sa@project.iam.gserviceaccount.com",
        private_key: process.env.GOOGLE_SERVICE_ACCOUNT_PRIVATE_KEY,
      },
    },
  },
});

await stagehand.init();
```

</CodeGroup>

The `model` object accepts:
- `modelName` — The Vertex model, prefixed with `vertex/` (e.g. `vertex/gemini-3-flash-preview`)
- `project` — Your GCP project ID
- `location` — Your Vertex AI region (e.g. `us-central1`)
- `googleAuthOptions.credentials` — Service account credentials with `client_email` and `private_key`

[View all supported Vertex AI models →](https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models)
</Tab>

<Tab title="Anthropic">

<CodeGroup>
```typescript TypeScript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "BROWSERBASE",
  model: "anthropic/claude-haiku-4-5"
  // API key auto-loads from ANTHROPIC_API_KEY - set in your .env
});

await stagehand.init();

```
</CodeGroup>
[View all supported Anthropic models →](https://docs.anthropic.com/en/docs/models-overview)
</Tab>

<Tab title="OpenAI">


<CodeGroup>
```typescript TypeScript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "BROWSERBASE",
  model: "openai/gpt-5"
  // API key auto-loads from OPENAI_API_KEY - set in your .env
});

await stagehand.init();
```

</CodeGroup>
[View all supported OpenAI models →](https://platform.openai.com/docs/models)
</Tab>
<Tab title="Azure">

<CodeGroup>
```typescript TypeScript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "BROWSERBASE",
  model: "azure/gpt-5"
  // API key auto-loads from AZURE_API_KEY - set in your .env
});

await stagehand.init();

```
</CodeGroup>
[View all supported Azure models →](https://ai.azure.com/catalog)
</Tab>

<Tab title="Cerebras">
<CodeGroup>
```typescript TypeScript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "BROWSERBASE",
  model: "cerebras/llama-4-scout"
  // API key auto-loads from CEREBRAS_API_KEY - set in your .env
});

await stagehand.init();
```

</CodeGroup>
[View all supported Cerebras models →](https://inference-docs.cerebras.ai/models/overview)
</Tab>

<Tab title="DeepSeek">

<CodeGroup>
```typescript TypeScript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "BROWSERBASE",
  model: "deepseek/deepseek-chat"
  // API key auto-loads from DEEPSEEK_API_KEY - set in your .env
});

await stagehand.init();

```
</CodeGroup>
[View all supported DeepSeek models →](https://api-docs.deepseek.com/quick_start/pricing)
</Tab>

<Tab title="Groq">


<CodeGroup>
```typescript TypeScript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "BROWSERBASE",
  model: "groq/llama-3.1-8b-instant"
  // API key auto-loads from GROQ_API_KEY - set in your .env
});

await stagehand.init();
```

</CodeGroup>
[View all supported Groq models →](https://console.groq.com/docs/models)
</Tab>

<Tab title="Mistral">

<CodeGroup>
```typescript TypeScript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "BROWSERBASE",
  model: "mistral/codestral-2508"
  // API key auto-loads from MISTRAL_API_KEY - set in your .env
});

await stagehand.init();

```
</CodeGroup>
[View all supported Mistral models →](https://docs.mistral.ai/getting-started/models)
</Tab>

<Tab title="Ollama">


<CodeGroup>
```typescript TypeScript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "BROWSERBASE",
  model: "ollama/llama3.2"
  // No API key required
});

await stagehand.init();
```

</CodeGroup>
[View all supported Ollama models →](https://ollama.com/library)
</Tab>

<Tab title="Perplexity">
<CodeGroup>
```typescript TypeScript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "BROWSERBASE",
  model: "perplexity/sonar-reasoning"
  // API key auto-loads from PERPLEXITY_API_KEY - set in your .env
});

await stagehand.init();

```
</CodeGroup>
[View all supported Perplexity models →](https://docs.perplexity.ai/getting-started/models)
</Tab>
<Tab title="TogetherAI">
<CodeGroup>
```typescript TypeScript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "BROWSERBASE",
  model: "togetherai/Qwen/Qwen3-235B-A22B-Instruct-2507-tput"
  // API key auto-loads from TOGETHER_AI_API_KEY - set in your .env
});

await stagehand.init();
```

</CodeGroup>
[View all supported TogetherAI models →](https://www.together.ai/models)

</Tab>
<Tab title="xAI">

<CodeGroup>
```typescript TypeScript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "BROWSERBASE",
  model: "xai/grok-4-fast-reasoning"
  // API key auto-loads from XAI_API_KEY - set in your .env
});

await stagehand.init();

```
</CodeGroup>

[View all xAI models →](https://docs.x.ai/docs/models)
</Tab>

</Tabs>

---

### Custom Models

Amazon Bedrock, Cohere, all [first class models](/v3/configuration/models#first-class-models), and any model from [the Vercel AI SDK](https://sdk.vercel.ai/providers) are supported.

Use this configuration for custom endpoints and custom retry or caching logic.

We'll use Amazon Bedrock and Google as examples below.

<AccordionGroup>
<Accordion title="Amazon Bedrock">

<Steps>
<Step title="Install dependencies">
Install the Vercel AI SDK for your provider.

<Tabs>
<Tab title="npm">
```bash
npm install @ai-sdk/amazon-bedrock
```

</Tab>
<Tab title="pnpm">
```bash
pnpm add @ai-sdk/amazon-bedrock
```
</Tab>
<Tab title="yarn">
```bash
yarn add @ai-sdk/amazon-bedrock
```
</Tab>
<Tab title="bun">
```bash
bun add @ai-sdk/amazon-bedrock
```
</Tab>
</Tabs>
</Step>

<Step title="Import, create provider, and create client">
```typescript
import { createAmazonBedrock } from '@ai-sdk/amazon-bedrock';
import { AISdkClient } from '@browserbasehq/stagehand';

const bedrockProvider = createAmazonBedrock({
  region: 'us-east-1',
  accessKeyId: 'xxxxxxxxx',
  secretAccessKey: 'xxxxxxxxx',
  sessionToken: 'xxxxxxxxx',
});

const bedrockClient = new AISdkClient({
  model: bedrockProvider("amazon/nova-pro-latest"),
});

```
</Step>

<Step title="Pass client to Stagehand">
```typescript
const stagehand = new Stagehand({
  env: "BROWSERBASE",
  llmClient: bedrockClient
});

await stagehand.init();
```

</Step>
</Steps>
</Accordion>
<Accordion title="Google">

<Steps>
<Step title="Install dependencies">
Install the Vercel AI SDK for your provider.

<Tabs>
<Tab title="npm">
```bash
npm install @ai-sdk/google
```
</Tab>
<Tab title="pnpm">
```bash
pnpm add @ai-sdk/google
```
</Tab>
<Tab title="yarn">
```bash
yarn add @ai-sdk/google
```
</Tab>
<Tab title="bun">
```bash
bun add @ai-sdk/google
```
</Tab>
</Tabs>
</Step>

<Step title="Import, create provider, and create client">
```typescript
import { createGoogle } from '@ai-sdk/google';
import { AISdkClient } from '@browserbasehq/stagehand';

const googleProvider = createGoogle({
  apiKey: process.env.GEMINI_API_KEY,
});

const googleClient = new AISdkClient({
  model: googleProvider("google/gemini-2.5-flash"),
});

```
</Step>

<Step title="Pass client to Stagehand">
```typescript
const stagehand = new Stagehand({
  env: "BROWSERBASE",
  llmClient: googleClient
});

await stagehand.init();
```

</Step>
</Steps>
</Accordion>
<Accordion title="All Providers">

To implement a custom model, follow the steps for the provider you are using. See the Amazon Bedrock and Google examples above. All supported providers and models are in [the Vercel AI SDK](https://sdk.vercel.ai/providers).

<Steps>
<Step title="Install dependencies">
Install the Vercel AI SDK for your provider.
</Step>
<Step title="Import, create provider, and create client">
```typescript
import { createProvider } from '@ai-sdk/provider';
import { AISdkClient } from '@browserbasehq/stagehand';

const provider = createProvider({
  apiKey: 'xxxxxxxxx',
});

const providerClient = new AISdkClient({
  model: provider("model/name"),
});

```
</Step>
<Step title="Pass client to Stagehand">
```typescript
const stagehand = new Stagehand({
  env: "BROWSERBASE",
  llmClient: providerClient
});

await stagehand.init();
```

</Step>
</Steps>
</Accordion>
</AccordionGroup>


---

## Choose a Model

Different models excel at different tasks. Consider speed, accuracy, and cost for your use case.

<Card title="Model Selection Guide" href="https://www.stagehand.dev/evals" icon="scale-balanced">
  Find detailed model comparisons and recommendations on our Model Evaluation page.
</Card>

**Quick Recommendations**

| Use Case                  | Recommended Model                    | Why                            |
| ------------------------- | ------------------------------------ | ------------------------------ |
| **Production** | `google/gemini-2.5-flash`            | Fast, accurate, cost-effective |
| **Intelligence**     | `google/gemini-3-pro-preview` | Best accuracy on hard tasks    |
| **Speed**        | `google/gemini-2.5-flash`                 | Fastest response times         |
| **Cost**     | `google/gemini-2.5-flash`            | Best value per token           |
| **Local/offline**         | `ollama/qwen3`                    | No API costs, full control     |


---

## Advanced Options

### Agent Models (with CUA Support)

**Default**

The Stagehand agent by default uses the same model passed to Stagehand. All models ([first class](/v3/configuration/models#first-class-models) and [custom](/v3/configuration/models#custom-models)) are supported. Here's an example with Gemini:

```typescript
const stagehand = new Stagehand({
  env: "BROWSERBASE",
  model: "google/gemini-2.5-flash",
  // GOOGLE_GENERATIVE_AI_API_KEY is auto-loaded from .env
  // ... other stagehand options
});

// Agent will use google/gemini-2.5-flash
const agent = stagehand.agent();
```

**Override (with CUA support)**

However, the Stagehand agent also accepts a `model` parameter, which can be any [first class](/v3/configuration/models#first-class-models) model, including [computer use agents (CUA)](/v3/configuration/models#agent-models-with-cua-support). This is useful when you'd like the agent to use a different model than the one passed to Stagehand.

<Tip>
  To use a CUA model, you must pass the `mode: "cua"` parameter to the `agent()` method. If `mode: "cua"` is set and the model is not a CUA model, whether that model is specified in Stagehand or overridden in the `agent()` method, an error will be thrown.
</Tip>

<Warning>
**Deprecation Notice:** The `cua: true` option is deprecated and will be removed in a future version. Use `mode: "cua"` instead.
</Warning>

<Tabs>
<Tab title="Google CUA">
```typescript
const agent = stagehand.agent({
  mode: "cua",
  model: "google/gemini-2.5-computer-use-preview-10-2025",
  // GOOGLE_GENERATIVE_AI_API_KEY is auto-loaded from .env
  // ... other agent options
});
```
</Tab>
<Tab title="Anthropic CUA">
```typescript
const agent = stagehand.agent({
  mode: "cua",
  model: "anthropic/claude-sonnet-4-6",
  // ANTHROPIC_API_KEY is auto-loaded from .env
  // ... other agent options
});
```
</Tab>
<Tab title="OpenAI CUA">
```typescript
const agent = stagehand.agent({
  mode: "cua",
  model: "openai/computer-use-preview",
  // OPENAI_API_KEY is auto-loaded from .env
  // ... other agent options
});
```
</Tab>
<Tab title="Example First Class Model">
All [first class models](/v3/configuration/models#first-class-models) are supported. Here's an example with Gemini:

```typescript
const agent = stagehand.agent({
  model: "google/gemini-2.5-pro",
  // GOOGLE_GENERATIVE_AI_API_KEY is auto-loaded from .env
  // ... other agent options
});
```
</Tab>
</Tabs>

<Accordion title="All Supported CUA Models">
| Provider | Model |
| -------- | ----- |
| Anthropic | `anthropic/claude-haiku-4-5-20251001` |
| Anthropic | `anthropic/claude-sonnet-4-6` |
| Anthropic | `anthropic/claude-sonnet-4-5-20250929` |
| Anthropic | `anthropic/claude-opus-4-5-20251101` |
| Anthropic | `anthropic/claude-opus-4-6` |
| Google   | `google/gemini-2.5-computer-use-preview-10-2025` |
| Google   | `google/gemini-3-flash-preview` |
| Google   | `google/gemini-3-pro-preview` |
| Microsoft | `microsoft/fara-7b` |
| OpenAI   | `openai/computer-use-preview` |
| OpenAI   | `openai/computer-use-preview-2025-03-11` |
</Accordion>

<Note>
  For overriding the agent API key, using a corporate proxy, adding provider-specific options, or other advanced use cases, the agent model can also take the form of an object. To learn more, see the [Agent Reference](/v3/references/agent).
</Note>

---

### Custom Endpoints

Use a custom endpoint if you need Azure OpenAI deployments or enterprise deployments.

<Tabs>
<Tab title="OpenAI">

For OpenAI, you can pass the configuration directly through the `model` parameter, without using `llmClient`:

```typescript
const stagehand = new Stagehand({
  env: "BROWSERBASE",
  model: {
    modelName: "openai/gpt-5",
    apiKey: process.env.OPENAI_API_KEY,
    baseURL: "https://custom-openai-endpoint.com/v1"
  }
});
```

</Tab>

<Tab title="Anthropic">

For Anthropic, you can pass the configuration directly through the `model` parameter, without using `llmClient`:

```typescript
const stagehand = new Stagehand({
  env: "BROWSERBASE",
  model: {
    modelName: "anthropic/claude-haiku-4-5",
    apiKey: process.env.ANTHROPIC_API_KEY,
    baseURL: "https://custom-anthropic-endpoint.com",
  },
});
```

  </Tab>
<Tab title="All Other Providers">
For all other providers, use `llmClient`. Here's an example with Hugging Face:

```typescript
// pnpm add @ai-sdk/huggingface

import { createHuggingFace } from "@ai-sdk/huggingface";
import { AISdkClient } from "@browserbasehq/stagehand";

const huggingFaceProvider = createHuggingFace({
  apiKey: process.env.HUGGINGFACE_API_KEY,
  baseURL: "https://custom-huggingface-endpoint.com",
});

const huggingFaceClient = new AISdkClient({
  model: huggingFaceProvider("meta-llama/Llama-3.1-8B-Instruct"),
});

const stagehand = new Stagehand({
  env: "BROWSERBASE",
  llmClient: huggingFaceClient,
});
```

</Tab>
</Tabs>

---

### AI Gateway

The [Vercel AI Gateway](https://vercel.com/docs/ai-gateway) lets you access models from multiple providers (OpenAI, Anthropic, Google, and more) through a single API key and interface. No extra provider SDKs or per-provider API keys needed.

<Tip>
  The AI Gateway is built into the `ai` package that Stagehand already uses -- no additional dependencies required.
</Tip>

**Key benefits:**
- Access models from all major providers with a single `AI_GATEWAY_API_KEY`
- Automatic provider fallback and dynamic routing based on uptime and latency
- Usage tracking and observability through the Vercel dashboard
- Bring Your Own Key (BYOK) support for existing provider credentials

<Tabs>
<Tab title="Simple">

Use the `gateway/` prefix followed by the provider and model name:

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "BROWSERBASE",
  model: "gateway/openai/gpt-5"
  // API key auto-loads from AI_GATEWAY_API_KEY - set in your .env
});

await stagehand.init();
```

Works with any model available on the gateway:

```typescript
// Anthropic via gateway
model: "gateway/anthropic/claude-sonnet-4.5"

// Google via gateway
model: "gateway/google/gemini-3-flash-preview"
```

</Tab>
<Tab title="Custom Config">

Pass the API key and optional base URL explicitly using the model object format:

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "BROWSERBASE",
  model: {
    modelName: "gateway/openai/gpt-5",
    apiKey: process.env.AI_GATEWAY_API_KEY,
    baseURL: "https://ai-gateway.vercel.sh/v3/ai" // optional custom endpoint
  }
});

await stagehand.init();
```

</Tab>
</Tabs>

[View all available AI Gateway models →](https://vercel.com/docs/ai-gateway/models-and-providers)

---

### Extending the AI SDK Client

For advanced use cases like custom retries or caching logic, you can extend the `AISdkClient`:

```typescript
import { LLMClient } from "@browserbasehq/stagehand";

class CustomRetryClient extends LLMClient {
  async createChatCompletion(options) {
    let retries = 3;
    while (retries > 0) {
      try {
        return await super.createChatCompletion(options);
      } catch (error) {
        retries--;
        if (retries === 0) throw error;
        await new Promise((r) => setTimeout(r, 1000 * (4 - retries)));
      }
    }
  }
}
```

<Tip>
  Need custom caching? Consider using the built-in [caching
  feature](/v3/best-practices/caching).
</Tip>

---

### Legacy Model Format

<Tip>
**Recommendation:** Use `provider/model` format. Example:
- `model: "openai/gpt-4o"` (recommended)
- `model: "gpt-4o"` (legacy)

</Tip>

The following models work without the `provider/` prefix in the model parameter as part of legacy support:

<AccordionGroup title="Legacy Model Format">
<Accordion title="Google">

- `gemini-2.5-flash-preview-04-17`
- `gemini-2.5-pro-preview-03-25`
- `gemini-2.0-flash`
- `gemini-2.0-flash-lite`
- `gemini-1.5-flash`
- `gemini-1.5-flash-8b`
- `gemini-1.5-pro`

</Accordion>
<Accordion title="Anthropic">

- `claude-sonnet-4-6`
- `claude-sonnet-4-5-20250929`
- `claude-haiku-4-5-20251001`

</Accordion>
<Accordion title="OpenAI">
- `gpt-4o`
- `gpt-4o-mini`
- `o1`
- `o1-mini`
- `o3`
- `o3-mini`
- `gpt-4.1`
- `gpt-4.1-mini`
- `gpt-4.1-nano`
- `o4-mini`
- `gpt-4.5-preview`
- `gpt-4o-2024-08-06`
- `o1-preview`

</Accordion>
<Accordion title="Cerebras">

- `cerebras-llama-3.3-70b`
- `cerebras-llama-3.1-8b`

</Accordion>
<Accordion title="Groq">

- `groq-llama-3.3-70b-versatile`
- `groq-llama-3.3-70b-specdec`
- `moonshotai/kimi-k2-instruct`

</Accordion>
</AccordionGroup>

---

## Troubleshooting

<AccordionGroup>
<Accordion title="Error: API key not found">
**Error:** `API key not found`

**Solutions:**

- Check `.env` file has the correct variable name for the provider you are using
- Ensure environment variables are loaded (use `dotenv`)
- Restart your application after updating `.env` file

| Provider   | Environment Variable           |
| ---------- | ------------------------------ |
| Google     | `GOOGLE_GENERATIVE_AI_API_KEY` or `GEMINI_API_KEY` |
| Vertex | Service account credentials (see [setup](#first-class-models)) |
| Anthropic  | `ANTHROPIC_API_KEY`            |
| OpenAI     | `OPENAI_API_KEY`               |
| Azure      | `AZURE_API_KEY`                |
| Cerebras   | `CEREBRAS_API_KEY`             |
| DeepSeek   | `DEEPSEEK_API_KEY`             |
| Groq       | `GROQ_API_KEY`                 |
| Mistral    | `MISTRAL_API_KEY`              |
| Ollama     | None (local)                   |
| Perplexity | `PERPLEXITY_API_KEY`           |
| TogetherAI | `TOGETHER_AI_API_KEY`          |
| xAI        | `XAI_API_KEY`                  |
| AI Gateway | `AI_GATEWAY_API_KEY`           |

</Accordion>

<Accordion title="Error: Model not supported">
**Error:** `Unsupported model`

**Solutions:**

- Use the `provider/model` format: `openai/gpt-5`
- Verify the model name exists in the provider's documentation
- Check that the model name is spelled correctly
- Ensure your model provider API key has access to the model
</Accordion>

<Accordion title="Model doesn't support structured outputs">
**Error:** `Model does not support structured outputs`

**Solutions:**

- Check our [Model Evaluation page](https://www.stagehand.dev/evals) for recommended models
</Accordion>

<Accordion title="High costs or slow performance">
**Symptoms:** Automation is expensive or slow

**Solutions:**

- Switch to cost-effective models (check [evals](https://www.stagehand.dev/evals) for comparisons)
- Use faster models for simple tasks, powerful ones for complex tasks
- Implement [caching](/v3/best-practices/caching) for repeated patterns
</Accordion>
<Accordion title="Python SDK or custom models">
Python is now supported in Stagehand v3! The Python SDK uses a BYOB (Bring Your Own Browser) architecture.

**Solutions:**

- See the [Python SDK documentation](/v3/sdk/python) for installation and usage
- Check the [Python migration guide](/v3/migrations/python) if upgrading from v2
</Accordion>
</AccordionGroup>

### Need Help? Contact Support

Can't find a solution? Have a question? Reach out to our support team:

<Card
  title="Contact Support"
  icon="envelope"
  href="mailto:support@browserbase.com"
>
  Email us at support@browserbase.com
</Card>

---

## Next Steps

<CardGroup cols={2}>
<Card title="Prompting Guide" href="/v3/best-practices/prompting-best-practices" icon="brain">
  Learn how to prompt LLMs for optimal results
</Card>
<Card title="Run Evals" href="/v3/basics/evals" icon="flask-vial">
  Test which models work best for your specific use case
</Card>

<Card title="Caching Guide" href="/v3/best-practices/caching" icon="database">
  Cache responses to reduce costs and improve speed
</Card>
<Card
  title="Optimize Costs"
  href="/v3/best-practices/cost-optimization"
  icon="dollar-sign"
>
  Reduce LLM spending with caching and smart model selection
</Card>
</CardGroup>


================================================
FILE: packages/docs/v3/configuration/observability.mdx
================================================
---
title: Observability
sidebarTitle: Observability
description: Track Stagehand automation with session visibility and analytics
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


Stagehand provides powerful observability features to help you monitor, track performance, and analyze your browser automation workflows. Focus on session monitoring, resource usage, and operational insights for both Browserbase and local environments.

## Browserbase Session Monitoring

When running on Browserbase, you gain access to comprehensive cloud-based monitoring and session management through the Browserbase API and dashboard.

<div style={{ textAlign: "center" }}>
  <img src="/media/observability.gif" alt="Browserbase Session Observability" width="400" />
</div>

### Live Session Visibility

Browserbase provides real-time visibility into your automation sessions:

**Session Dashboard Features**
- Real-time browser screen recording and replay
- Network request monitoring with detailed timing
- JavaScript console logs and error tracking
- CPU and memory usage metrics
- Session status and duration tracking

**Session Management & API Access**
```typescript
import { Stagehand } from "@browserbasehq/stagehand";
import { Browserbase } from "@browserbasehq/sdk";

const browserbase = new Browserbase({
  apiKey: process.env.BROWSERBASE_API_KEY,
});

const stagehand = new Stagehand({
  env: "BROWSERBASE"
});

await stagehand.init();

const sessionInfo = await browserbase.sessions.retrieve(stagehand.sessionId);

console.log("Session status:", sessionInfo.status);
console.log("Session region:", sessionInfo.region);
console.log("CPU usage:", sessionInfo.avgCpuUsage);
console.log("Memory usage:", sessionInfo.memoryUsage);
console.log("Proxy bytes:", sessionInfo.proxyBytes);
```

### Session Analytics & Insights

<CardGroup>
  <Card title="Real-Time Monitoring" icon="chart-line">
    Monitor live session status, resource usage, and geographic distribution. Scale and manage concurrent sessions with real-time insights.
  </Card>

  <Card title="Session Recordings" icon="video">
    Review complete session recordings with frame-by-frame playback. Analyze network requests and debug browser interactions visually.
  </Card>

  <Card title="API Management" icon="code">
    Programmatically access session data, automate lifecycle management, and integrate with monitoring systems through our API.
  </Card>

  <Card title="Usage Monitoring" icon="chart-bar">
    Track resource consumption, session duration, and API usage. Get detailed breakdowns of costs and utilization across your automation.
  </Card>
</CardGroup>

### Session Monitoring & Filtering

Query and monitor sessions by status and metadata:

```typescript
import { Browserbase } from "@browserbasehq/sdk";

const browserbase = new Browserbase({
  apiKey: process.env.BROWSERBASE_API_KEY,
});

// List sessions with filtering
async function getFilteredSessions() {
  const sessions = await browserbase.sessions.list({
    status: 'RUNNING'
  });
  
  return sessions.map(session => ({
    id: session.id,
    status: session.status, // RUNNING, COMPLETED, ERROR, TIMED_OUT
    startedAt: session.startedAt,
    endedAt: session.endedAt,
    region: session.region,
    avgCpuUsage: session.avgCpuUsage,
    memoryUsage: session.memoryUsage,
    proxyBytes: session.proxyBytes,
    userMetadata: session.userMetadata
  }));
}

// Query sessions by metadata
async function querySessionsByMetadata(query: string) {
  const sessions = await browserbase.sessions.list({
    q: query
  });
  
  return sessions;
}
```

## Local Environment Monitoring

For local development, Stagehand provides performance monitoring and resource tracking capabilities directly on your machine.

### Performance Tracking

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "LOCAL",
  verbose: 1, // Monitor performance without debug noise
});

await stagehand.init();

// Track local automation metrics
const startTime = Date.now();
const initialMetrics = await stagehand.metrics;

// ... perform automation tasks
const page = stagehand.context.pages()[0];
await page.goto("https://example.com");
await stagehand.act("click button");
await stagehand.extract({ instruction: "get data", schema: DataSchema });

const finalMetrics = await stagehand.metrics;
const executionTime = Date.now() - startTime;

console.log('Local Performance Summary:', {
  executionTime: `${executionTime}ms`,
  totalTokens: finalMetrics.totalPromptTokens + finalMetrics.totalCompletionTokens,
  totalInferenceTime: `${finalMetrics.totalInferenceTimeMs}ms`,
  tokensPerSecond: ((finalMetrics.totalPromptTokens + finalMetrics.totalCompletionTokens) / (executionTime / 1000)).toFixed(2)
});
```

## Resource Usage Monitoring

When running locally, monitor system resource usage and browser performance:

```typescript
import { Stagehand } from "@browserbasehq/stagehand";
import * as os from 'os';
import { performance } from 'perf_hooks';

class LocalResourceMonitor {
  private cpuUsage: number[] = [];
  private memoryUsage: number[] = [];
  
  startMonitoring() {
    const interval = setInterval(() => {
      // Track system resources
      const memUsage = process.memoryUsage();
      this.memoryUsage.push(memUsage.heapUsed / 1024 / 1024); // MB
      
      // Track CPU (simplified)
      const loadAvg = os.loadavg()[0];
      this.cpuUsage.push(loadAvg);
    }, 1000);
    
    return interval;
  }
  
  getResourceSummary() {
    return {
      avgMemoryUsage: this.memoryUsage.reduce((a, b) => a + b, 0) / this.memoryUsage.length,
      peakMemoryUsage: Math.max(...this.memoryUsage),
      avgCpuLoad: this.cpuUsage.reduce((a, b) => a + b, 0) / this.cpuUsage.length,
      totalDataPoints: this.cpuUsage.length
    };
  }
}

const monitor = new LocalResourceMonitor();
const interval = monitor.startMonitoring();

const stagehand = new Stagehand({ env: "LOCAL" });

// ... run automation

clearInterval(interval);
console.log('Resource Usage:', monitor.getResourceSummary());
```


  <Card title="LLM Usage" icon="chart-line" href="/v3/basics/evals">
    Monitor token usage, costs, and speed. Set up automated alerting for critical failures. Implement cost tracking across different environments. Use session analytics to optimize automation workflows.
  </Card>


## Real-Time Metrics & Monitoring

### Basic Usage Tracking

Monitor your automation's resource usage in real-time with `stagehand.metrics`:

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({ env: "BROWSERBASE" });
await stagehand.init();

// Metrics are async in V3
const metrics = await stagehand.metrics;
console.log(metrics);

// Monitor during automation
const startTime = Date.now();
const initialMetrics = await stagehand.metrics;

// ... perform automation tasks
const page = stagehand.context.pages()[0];
await page.goto("https://example.com");
await stagehand.act("click the login button");
const data = await stagehand.extract({
  instruction: "extract user info",
  schema: UserSchema
});

const finalMetrics = await stagehand.metrics;
const executionTime = Date.now() - startTime;

console.log('Automation Summary:', {
  totalTokens: finalMetrics.totalPromptTokens + finalMetrics.totalCompletionTokens,
  executionTime: `${executionTime}ms`,
  avgInferenceTime: `${finalMetrics.totalInferenceTimeMs / 3}ms`,
});
```

### Understanding Metrics Data

The metrics object provides detailed breakdown by Stagehand operation:

```typescript
interface StagehandMetrics {
  // Act operation metrics
  actPromptTokens: number;
  actCompletionTokens: number;
  actReasoningTokens: number;
  actCachedInputTokens: number;
  actInferenceTimeMs: number;

  // Extract operation metrics
  extractPromptTokens: number;
  extractCompletionTokens: number;
  extractReasoningTokens: number;
  extractCachedInputTokens: number;
  extractInferenceTimeMs: number;

  // Observe operation metrics
  observePromptTokens: number;
  observeCompletionTokens: number;
  observeReasoningTokens: number;
  observeCachedInputTokens: number;
  observeInferenceTimeMs: number;

  // Agent operation metrics
  agentPromptTokens: number;
  agentCompletionTokens: number;
  agentReasoningTokens: number;
  agentCachedInputTokens: number;
  agentInferenceTimeMs: number;

  // Cumulative totals
  totalPromptTokens: number;
  totalCompletionTokens: number;
  totalReasoningTokens: number;
  totalCachedInputTokens: number;
  totalInferenceTimeMs: number;
}
```

**Example metrics output:**

```typescript
const metrics = await stagehand.metrics;
console.log(metrics);

// {
//   actPromptTokens: 4011,
//   actCompletionTokens: 51,
//   actReasoningTokens: 12,
//   actCachedInputTokens: 0,
//   actInferenceTimeMs: 1688,
//   extractPromptTokens: 4200,
//   extractCompletionTokens: 243,
//   extractReasoningTokens: 18,
//   extractCachedInputTokens: 0,
//   extractInferenceTimeMs: 4297,
//   observePromptTokens: 347,
//   observeCompletionTokens: 43,
//   observeReasoningTokens: 5,
//   observeCachedInputTokens: 0,
//   observeInferenceTimeMs: 903,
//   agentPromptTokens: 0,
//   agentCompletionTokens: 0,
//   agentReasoningTokens: 0,
//   agentCachedInputTokens: 0,
//   agentInferenceTimeMs: 0,
//   totalPromptTokens: 8558,
//   totalCompletionTokens: 337,
//   totalReasoningTokens: 35,
//   totalCachedInputTokens: 0,
//   totalInferenceTimeMs: 6888
// }
```

## Best Practices

<AccordionGroup>
<Accordion title="Production Monitoring">
- Track session success rates and failure patterns
- Monitor resource usage and scaling requirements
- Set up automated alerting for critical failures
- Implement cost tracking across different environments
- Use session analytics to optimize automation workflows
</Accordion>

<Accordion title="Performance Optimization">
- Compare Browserbase vs local execution times
- Monitor token usage and inference costs across models
- Track geographic performance differences
- Identify bottlenecks in automation workflows
- Optimize for cost-effectiveness and speed
</Accordion>

<Accordion title="Operational Insights">
- Track session distribution across regions
- Monitor concurrent session limits and scaling
- Analyze failure patterns and common error scenarios
- Use session recordings for root cause analysis
- Implement custom metadata for workflow categorization
</Accordion>

<Accordion title="Integration & Alerting">
- Integrate session APIs with monitoring dashboards
- Set up automated notifications for session failures  
- Track SLA compliance and performance benchmarks
- Monitor resource costs and usage patterns
- Use analytics data for capacity planning and optimization
</Accordion>
</AccordionGroup>

## Next Steps

<CardGroup cols={2}>
<Card title="History Tracking" icon="clock-rotate-left" href="/v3/best-practices/history">
  Track all LLM operations with parameters, results, and timestamps for debugging.
</Card>
<Card title="Logging" icon="file-lines" href="/v3/configuration/logging">
  Configure logging levels, custom loggers, and file-based session logging.
</Card>
</CardGroup>


================================================
FILE: packages/docs/v3/first-steps/ai-rules.mdx
================================================
---
title: AI Rules
description: Using AI to write Stagehand code faster and better.
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


You're likely using AI to write code, and there's a **right and wrong way to do it.** This page is a collection of rules, configs, and copy‑paste snippets that help your AI agents/assistants write performant Stagehand code as fast as possible.

## Quickstart

<CardGroup cols={2}>
  <Card title="Add MCP servers" icon="screwdriver-wrench">
    Configure Browserbase (Stagehand), Context7, DeepWiki, and Stagehand Docs in your MCP client. 
  </Card>
  <Card title="Pin editor rules" icon="memo">
    Drop in `.cursorrules` and `claude.md` so AI agents/assistants always emit Stagehand patterns. 
  </Card>
</CardGroup>

## Using MCP Servers

MCP (Model Context Protocol) servers act as intermediaries that connect AI systems to external data sources and tools. These servers enable your coding assistant to access real-time information, execute tasks, and retrieve structured data to enhance code generation accuracy.

The following **MCP servers** provide specialized access to Stagehand documentation and related resources:

<Accordion title="Context7 by Upstash" icon="database">
Provides semantic search across documentation and codebase context. Context7 enables AI assistants to find relevant code patterns, examples, and implementation details from your project history. It maintains contextual understanding of your development workflow and can surface related solutions from previous work.

**Installation:**
```json
{
  "mcpServers": {
    "context7": {
      "command": "npx",
      "args": ["-y", "@upstash/context7-mcp"]
    }
  }
}
```
</Accordion>

<Accordion title="DeepWiki by Cognition" icon="book-open">
Offers deep indexing of GitHub repositories and documentation. DeepWiki allows AI agents to understand project architecture, API references, and best practices from the entire Stagehand ecosystem. It provides comprehensive knowledge about repository structure, code relationships, and development patterns.

**Installation:**
```json
{
  "mcpServers": {
    "deepwiki": {
      "url": "https://mcp.deepwiki.com/mcp"
    }
  }
}
```
</Accordion>

<Accordion title="Stagehand Docs by Mintlify" icon="mintbit">
Direct access to official Stagehand documentation. This MCP server provides AI assistants with up-to-date API references, configuration options, and usage examples for accurate code generation. Mintlify auto-generates this server from the official docs, ensuring your AI assistant always has the latest information.

**Installation:**
```json
{
  "mcpServers": {
    "stagehand-docs": {
      "url": "https://docs.stagehand.dev/mcp"
    }
  }
}
```
</Accordion>

**How MCP Servers Enhance Your Development:**
- **Real-time Documentation Access**: AI assistants can query the latest Stagehand docs, examples, and best practices
- **Context-Aware Code Generation**: Servers provide relevant code patterns and configurations based on your specific use case
- **Reduced Integration Overhead**: Standardized protocol eliminates the need for custom integrations with each documentation source
- **Enhanced Accuracy**: AI agents receive structured, up-to-date information rather than relying on potentially outdated training data

<Tip>
**Prompting tip:** 
Explicitly ask your coding agent/assistant to use these MCP servers to fetch relevant information from the docs so they have better context and know how to write proper Stagehand code. 

For example: **"Use the stagehand-docs MCP to fetch the act/observe guidelines, then generate code that follows them. Prefer cached observe results."**
</Tip>

## Editor rule files (copy‑paste)

Drop these in `.cursorrules`, `.windsurfrules`, `claude.md`, or any agent rule framework:

<Accordion title="TypeScript">

``````md
# Stagehand Project

This is a project that uses Stagehand V3, a browser automation framework with AI-powered `act`, `extract`, `observe`, and `agent` methods.

The main class can be imported as `Stagehand` from `@browserbasehq/stagehand`.

**Key Classes:**

- `Stagehand`: Main orchestrator class providing `act`, `extract`, `observe`, and `agent` methods
- `context`: A `V3Context` object that manages browser contexts and pages
- `page`: Individual page objects accessed via `stagehand.context.pages()[i]` or created with `stagehand.context.newPage()`

## Initialize

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "LOCAL", // or "BROWSERBASE"
  verbose: 2, // 0, 1, or 2
  model: "openai/gpt-4.1-mini", // or any supported model
});

await stagehand.init();

// Access the browser context and pages
const page = stagehand.context.pages()[0];
const context = stagehand.context;

// Create new pages if needed
const page2 = await stagehand.context.newPage();
```

## Act

Actions are called on the `stagehand` instance (not the page). Use atomic, specific instructions:

```typescript
// Act on the current active page
await stagehand.act("click the sign in button");

// Act on a specific page (when you need to target a page that isn't currently active)
await stagehand.act("click the sign in button", { page: page2 });
```

**Important:** Act instructions should be atomic and specific:

- ✅ Good: "Click the sign in button" or "Type 'hello' into the search input"
- ❌ Bad: "Order me pizza" or "Type in the search bar and hit enter" (multi-step)

### Observe + Act Pattern (Recommended)

Cache the results of `observe` to avoid unexpected DOM changes:

```typescript
const instruction = "Click the sign in button";

// Get candidate actions
const actions = await stagehand.observe(instruction);

// Execute the first action
await stagehand.act(actions[0]);
```

To target a specific page:

```typescript
const actions = await stagehand.observe("select blue as the favorite color", {
  page: page2,
});
await stagehand.act(actions[0], { page: page2 });
```

## Extract

Extract data from pages using natural language instructions. The `extract` method is called on the `stagehand` instance.

### Basic Extraction (with schema)

```typescript
import { z } from "zod";

// Extract with explicit schema
const data = await stagehand.extract(
  "extract all apartment listings with prices and addresses",
  z.object({
    listings: z.array(
      z.object({
        price: z.string(),
        address: z.string(),
      }),
    ),
  }),
);

console.log(data.listings);
```

### Simple Extraction (without schema)

```typescript
// Extract returns a default object with 'extraction' field
const result = await stagehand.extract("extract the sign in button text");

console.log(result);
// Output: { extraction: "Sign in" }

// Or destructure directly
const { extraction } = await stagehand.extract(
  "extract the sign in button text",
);
console.log(extraction); // "Sign in"
```

### Targeted Extraction

Extract data from a specific element using a selector:

```typescript
const reason = await stagehand.extract(
  "extract the reason why script injection fails",
  z.string(),
  { selector: "/html/body/div[2]/div[3]/iframe/html/body/p[2]" },
);
```

### URL Extraction

When extracting links or URLs, use `z.string().url()`:

```typescript
const { links } = await stagehand.extract(
  "extract all navigation links",
  z.object({
    links: z.array(z.string().url()),
  }),
);
```

### Extracting from a Specific Page

```typescript
// Extract from a specific page (when you need to target a page that isn't currently active)
const data = await stagehand.extract(
  "extract the placeholder text on the name field",
  { page: page2 },
);
```

## Observe

Plan actions before executing them. Returns an array of candidate actions:

```typescript
// Get candidate actions on the current active page
const [action] = await stagehand.observe("Click the sign in button");

// Execute the action
await stagehand.act(action);
```

Observing on a specific page:

```typescript
// Target a specific page (when you need to target a page that isn't currently active)
const actions = await stagehand.observe("find the next page button", {
  page: page2,
});
await stagehand.act(actions[0], { page: page2 });
```

## Agent

Use the `agent` method to autonomously execute complex, multi-step tasks.

### Basic Agent Usage

```typescript
const page = stagehand.context.pages()[0];
await page.goto("https://www.google.com");

const agent = stagehand.agent({
  model: "google/gemini-2.0-flash",
  executionModel: "google/gemini-2.0-flash",
});

const result = await agent.execute({
  instruction: "Search for the stock price of NVDA",
  maxSteps: 20,
});

console.log(result.message);
```

### Computer Use Agent (CUA)

For more advanced scenarios using computer-use models:

```typescript
const agent = stagehand.agent({
  mode: "cua", // Enable Computer Use Agent mode
  model: "anthropic/claude-sonnet-4-20250514",
  // or "google/gemini-2.5-computer-use-preview-10-2025"
  systemPrompt: `You are a helpful assistant that can use a web browser.
    Do not ask follow up questions, the user will trust your judgement.`,
});

await agent.execute({
  instruction: "Apply for a library card at the San Francisco Public Library",
  maxSteps: 30,
});
```

### Agent with Custom Model Configuration

```typescript
const agent = stagehand.agent({
  mode: "cua",
  model: {
    modelName: "google/gemini-2.5-computer-use-preview-10-2025",
    apiKey: process.env.GEMINI_API_KEY,
  },
  systemPrompt: `You are a helpful assistant.`,
});
```

### Agent with Integrations (MCP/External Tools)

```typescript
const agent = stagehand.agent({
  integrations: [`https://mcp.exa.ai/mcp?exaApiKey=${process.env.EXA_API_KEY}`],
  systemPrompt: `You have access to the Exa search tool.`,
});
```

## Advanced Features

### DeepLocator (XPath Targeting)

Target specific elements across shadow DOM and iframes:

```typescript
await page
  .deepLocator("/html/body/div[2]/div[3]/iframe/html/body/p")
  .highlight({
    durationMs: 5000,
    contentColor: { r: 255, g: 0, b: 0 },
  });
```

### Multi-Page Workflows

```typescript
const page1 = stagehand.context.pages()[0];
await page1.goto("https://example.com");

const page2 = await stagehand.context.newPage();
await page2.goto("https://example2.com");

// Act/extract/observe operate on the current active page by default
// Pass { page } option to target a specific page
await stagehand.act("click button", { page: page1 });
await stagehand.extract("get title", { page: page2 });
```
``````

</Accordion>

<Accordion title="Python">

``````md
# Stagehand Python Project

This is a project that uses [Stagehand Python](https://github.com/browserbase/stagehand-python), which provides AI-powered browser automation with `act`, `extract`, and `observe` methods.

`Stagehand` is a class that provides configuration and browser automation capabilities with:
- Pages accessed via `stagehand.context.pages()` or `stagehand.context.activePage()`
- `stagehand.context`: A StagehandContext object (extends Playwright BrowserContext)
- `stagehand.agent()`: Create AI-powered agents for autonomous multi-step workflows
- `stagehand.init()`: Initialize the browser session
- `stagehand.close()`: Clean up resources

`Page` extends Playwright's Page class with AI-powered methods:
- `act()`: Perform actions on web elements using natural language
- `extract()`: Extract structured data from pages using schemas
- `observe()`: Plan actions and get selectors before executing

`Agent` provides autonomous Computer Use Agent capabilities:
- `execute()`: Perform complex multi-step tasks using natural language instructions

Use the following rules to write code for this project.

- To plan an instruction like "click the sign in button", use Stagehand `observe` to get the action to execute.

You can also pass in the following params:

- The result of `observe` is a list of `ObserveResult` objects that can directly be used as params for `act` like this:
  
- When writing code that needs to extract data from the page, use Stagehand `extract`. Use Pydantic models for schemas:

## Initialize

### Configuration Options

Key configuration options in `StagehandConfig`:

## Act

You can act directly with string instructions:

Use variables for dynamic form filling:

**Best Practices:**
- Cache the results of `observe` to avoid unexpected DOM changes
- Keep actions atomic and specific (e.g., "Click the sign in button" not "Sign in to the website")
- Use specific, descriptive instructions

Act `action` should be as atomic and specific as possible, e.g. "Click the sign in button" or "Type 'hello' into the search input".
AVOID actions that are more than one step, e.g. "Order me pizza" or "Send an email to Paul asking him to call me".

## Extract

### Simple String Extraction

### Structured Extraction with Schema (Recommended)
Always use Pydantic models for structured data extraction:

### Array Extraction
For arrays, use List types:

### Complex Object Extraction
For more complex data structures:

## Agent System

Stagehand provides an Agent System for autonomous web browsing using Computer Use Agents (CUA).

### Creating Agents

### Agent Execution

**Best Practices:**
- Be specific with instructions: `"Fill out the contact form with name 'John Doe' and submit it"`
- Break down complex tasks into smaller steps
- Use error handling with try/except blocks
- Combine agents for navigation with traditional methods for precise data extraction

## Project Structure Best Practices

- Store configurations in environment variables or config files
- Use async/await patterns consistently
- Implement main automation logic in async functions
- Use async context managers for resource management
- Use type hints and Pydantic models for data validation
- Handle exceptions appropriately with try/except blocks
``````

</Accordion>

## Security notes

- Do not embed secrets in docs or rule files; use env vars in MCP configs.
- Avoid broad actions that may trigger unintended navigation; prefer `observe` first.

## Resources/references

- Context7 MCP (Upstash)
  - https://github.com/upstash/context7
- DeepWiki MCP
  - https://mcp.deepwiki.com/
- Stagehand Docs MCP (Mintlify)
  - https://docs.stagehand.dev/mcp


================================================
FILE: packages/docs/v3/first-steps/installation.mdx
================================================
---
title: Installation
description: Integrate Stagehand into an existing project.
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


Install Stagehand in your current app with the TypeScript SDK.

<Tip>
We recommend using the Node.js runtime environment to run Stagehand scripts.

**Bun is now supported** as long as you do not integrate Stagehand with Playwright. Playwright is not compatible with Bun.
</Tip>

<Tabs>
<Tab title="TypeScript">

### Install dependencies

<CodeGroup>
```bash npm
npm install @browserbasehq/stagehand
```

```bash pnpm
pnpm add @browserbasehq/stagehand
```

```bash yarn
yarn add @browserbasehq/stagehand
```
```bash bun icon="sparkles"
bun add @browserbasehq/stagehand
```
</CodeGroup>

<Tip>
If you plan to run locally, you need to have [Chrome](https://www.google.com/chrome/) installed on your machine. For cloud browser sessions, skip this.
</Tip>

### Configure environment

Set environment variables (or a `.env` via your framework):

<CodeGroup>
```bash Bash
OPENAI_API_KEY=your_api_key
BROWSERBASE_API_KEY=your_api_key
BROWSERBASE_PROJECT_ID=your_project_id
```
</CodeGroup>

<Note>
Stagehand does not auto-load `.env` files.

If you use a `.env` file, install and initialize `dotenv` in your own app code:

```bash
npm install dotenv
```

```typescript
import dotenv from "dotenv";
dotenv.config({ path: ".env" });
```
</Note>

### Use in your codebase

Add Stagehand where you need browser automation.

```typescript
import dotenv from "dotenv";
import { Stagehand } from "@browserbasehq/stagehand";
import { z } from "zod";

dotenv.config({ path: ".env" });  // if needed

async function main() {
  const stagehand = new Stagehand({
    env: "BROWSERBASE"
  });

  await stagehand.init();
  const page = stagehand.context.pages()[0];

  await page.goto("https://example.com");

  // Act on the page
  await stagehand.act("Click the learn more button");

  // Extract structured data
  const description = await stagehand.extract("extract the description", z.string());

  console.log(description);
  await stagehand.close();
}

main().catch((err) => {
  console.error(err);
  process.exit(1);
});
```

</Tab>

<Tab title="Other Languages">

<Note>
For Python and other language SDKs, use the **language selector** in the top left corner of the sidebar to view the SDK documentation for your language.
</Note>

</Tab>

</Tabs>

## Next steps

<CardGroup cols={2}>
  <Card 
    title="Configuration"
    icon="gear"
    href="/v3/configuration/browser"
  >
    Environment, Browserbase vs Local, logging, timeouts, LLM customization
  </Card>
  <Card 
    title="Act"
    icon="arrow-pointer"
    href="/v3/basics/act"
  >
    Perform precise actions with natural language
  </Card>
  <Card 
    title="Extract"
    icon="download"
    href="/v3/basics/extract"
  >
    Typed data extraction with Zod schemas
  </Card>
  <Card 
    title="Observe"
    icon="eye"
    href="/v3/basics/observe"
  >
    Discover elements and suggested actions
  </Card>
</CardGroup>


================================================
FILE: packages/docs/v3/first-steps/introduction.mdx
================================================
---
title: Introducing Stagehand
sidebarTitle: Introduction
description: Developers use Stagehand to reliably automate the web.
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


Stagehand is a browser automation framework used to control web browsers with natural language and code. By combining the power of AI with the precision of code, Stagehand makes web automation flexible, maintainable, and actually reliable.

## The Problem with Browser Automation

Traditional frameworks like Playwright and Puppeteer force you to write brittle scripts that break with every UI change. Web agents promise to solve this with AI, but leave you at the mercy of unpredictable behavior.

**You're stuck between two bad options:**
- **Too brittle**: Traditional selectors break when websites change
- **Too agentic**: AI agents are unpredictable and impossible to debug

## Enter Stagehand

Stagehand gives you the best of both worlds through four powerful primitives that let you choose exactly how much AI to use:

<CardGroup cols={2}>
  <Card title="Act" icon="play" href="/v3/basics/act">
    Execute actions using natural language
  </Card>
  <Card title="Extract" icon="database" href="/v3/basics/extract">
    Pull structured data with schemas
  </Card>
  <Card title="Observe" icon="eye" href="/v3/basics/observe">
    Discover available actions on any page
  </Card>
  <Card title="Agent" icon="robot" href="/v3/basics/agent">
    Automate entire workflows autonomously
  </Card>
</CardGroup>

```typescript
// Act - Execute natural language actions
await stagehand.act("click the login button");

// Extract - Pull structured data
const price = await stagehand.extract(
  "extract the price",
  z.number()
);

// Observe - Discover available actions
const actions = await stagehand.observe("find submit buttons");

// Agent - Automate entire workflows
const agent = stagehand.agent({
  mode: "cua",
  model: "google/gemini-2.5-computer-use-preview-10-2025",
});
await agent.execute("apply for this job");
```


## Why Developers Choose Stagehand

- **Precise Control**: Mix AI-powered actions with deterministic code. You decide exactly how much AI to use.

- **Actually Repeatable**: Save and replay actions exactly. No more "it worked on my machine" with browser automations.

- **Maintainable at Scale**: One script can automate multiple websites. When sites change, your automations adapt.

- **Composable Tools**: Choose your level of automation with Act, Extract, Observe, and Agent.

## Built for Modern Development
Stagehand is designed for developers building production browser automations and AI agents that need reliable web access.

<AccordionGroup>
  <Accordion title="Works Everywhere">
    Compatible with all Chromium-based browsers: Chrome, Edge, Arc, Brave, and more.
  </Accordion>
  <Accordion title="Built by Browserbase">
    Created and maintained by the team behind enterprise browser infrastructure.
  </Accordion>
</AccordionGroup>

## Get Started in 60 Seconds
<Info>
  **Pro tip**: For best results, we recommend using Stagehand with [Browserbase](https://www.browserbase.com) for reliable cloud browser infrastructure.
</Info>
<CardGroup cols={2}>
  <Card
    title="Quickstart"
    icon="rocket"
    href="/v3/first-steps/quickstart"
  >
    Build your first automation in under a minute
  </Card>
  <Card
    title="Try Director"
    icon="wand-magic-sparkles"
    href="https://www.director.ai"
  >
    Generate Stagehand scripts with AI
  </Card>
  <Card
    title="View Templates"
    icon="code"
    href="https://www.browserbase.com/templates"
  >
    See real-world automation examples
  </Card>
  <Card
    title="Join Discord"
    icon="discord"
    href="https://stagehand.dev/discord"
  >
    Get help from the community
  </Card>
</CardGroup>


================================================
FILE: packages/docs/v3/first-steps/quickstart.mdx
================================================
---
title: Quickstart
description: 'Stagehand allows you to build web automations with natural language and code.'
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


If this is your **first time using Stagehand**, you should try [Director](https://director.ai) first. It's an agent that allows you to build Stagehand workflows using natural language. You can also try Stagehand using our [MCP server](/v3/integrations/mcp/introduction).

Otherwise, the quickest way to start with Stagehand is with our CLI. It scaffolds a ready‑to‑run Stagehand app with sensible defaults and an example script.

<Note>
This quickstart is for **TypeScript**. For other languages, change the language selector in the top left corner.
</Note>

## 1) Create a sample project

<CodeGroup>
```bash Bash
npx create-browser-app
```
</CodeGroup>

## 2) Run it

Follow the CLI prompts to enter the project directory and add your API keys. Then run the example script.

<CodeGroup>
```bash Bash
cd my-stagehand-app # Enter the project directory
cp .env.example .env  # Add your API keys
npm start # Run the example script
```
</CodeGroup>

## 3) Use Stagehand (act, extract, observe)

The scaffold includes an `index.ts` file that contains the example script. Here's what it looks like:

<CodeGroup>
```typescript TypeScript
import "dotenv/config";
import { Stagehand } from "@browserbasehq/stagehand";

async function main() {
  const stagehand = new Stagehand({
    env: "BROWSERBASE"
  });

  await stagehand.init();

  console.log(`Stagehand Session Started`);
  console.log(`Watch live: https://browserbase.com/sessions/${stagehand.browserbaseSessionID}`);

  const page = stagehand.context.pages()[0];

  await page.goto("https://stagehand.dev");

  const extractResult = await stagehand.extract("Extract the value proposition from the page.");
  console.log(`Extract result:\n`, extractResult);

  await stagehand.act("Click the 'Evals' button.");

  const observeResult = await stagehand.observe("What can I click on this page?");
  console.log(`Observe result:\n`, observeResult);

  const agent = stagehand.agent({
    mode: "cua",
    model: "google/gemini-2.5-computer-use-preview-10-2025",
    systemPrompt: "You're a helpful assistant that can control a web browser.",
  });

  const agentResult = await agent.execute("What is the most accurate model to use in Stagehand?");
  console.log(`Agent result:\n`, agentResult);

  await stagehand.close();
}

main().catch((err) => {
  console.error(err);
  process.exit(1);
});

```
</CodeGroup>

<Tip>
To use, set provider keys in `.env` (e.g., `OPENAI_API_KEY`). For cloud browsers, add `BROWSERBASE_API_KEY` and `BROWSERBASE_PROJECT_ID`.
</Tip>

## Next steps

Learn about the Stagehand primitives: act, extract, observe, and agent.

<CardGroup cols={2}>
  <Card 
    title="Act" 
    icon="arrow-pointer" 
    href="/v3/basics/act"
  >
    Perform actions on web pages with natural language
  </Card>
  
  <Card 
    title="Extract" 
    icon="download" 
    href="/v3/basics/extract"
  >
    Get structured data with Zod schemas
  </Card>
  
  <Card 
    title="Observe" 
    icon="eye" 
    href="/v3/basics/observe"
  >
    Discover available elements and actions
  </Card>
  
  <Card 
    title="Agent" 
    icon="robot" 
    href="/v3/basics/agent"
  >
    Autonomous multi-step browser workflows
  </Card>
</CardGroup>


================================================
FILE: packages/docs/v3/integrations/convex/configuration.mdx
================================================
---
title: "Use Stagehand in Convex"
sidebarTitle: Configuration
description: "Set up AI-powered browser automation in your Convex application"
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


<Card
  title="Check out the convex-stagehand repo"
  icon="github"
  href="https://github.com/browserbase/convex-stagehand"
>
  Clone the [GitHub repo](https://github.com/browserbase/convex-stagehand) to get started with Stagehand in Convex.
</Card>

## Installation

Install the convex-stagehand component and Zod for schema validation:

```bash
npm install @browserbasehq/convex-stagehand zod
```

## Configuration

Add the Stagehand component to your `convex/convex.config.ts`:

```typescript convex/convex.config.ts
import { defineApp } from "convex/server";
import stagehand from "@browserbasehq/convex-stagehand/convex.config";

const app = defineApp();
app.use(stagehand, { name: "stagehand" });
export default app;
```

## Environment Variables

Set the following environment variables in your [Convex Dashboard](https://dashboard.convex.dev):

| Variable | Description |
|----------|-------------|
| `BROWSERBASE_API_KEY` | Your Browserbase API key |
| `BROWSERBASE_PROJECT_ID` | Your Browserbase project ID |
| `MODEL_API_KEY` | API key for your LLM provider (OpenAI, Anthropic, etc.) |

## Basic Usage

### Initialize the Client

Create a Stagehand instance in your Convex action:

```typescript convex/actions.ts
"use node";

import { Stagehand } from "@browserbasehq/convex-stagehand";
import { components } from "./_generated/api";
import { action } from "./_generated/server";
import { z } from "zod";

const stagehand = new Stagehand(components.stagehand, {
  browserbaseApiKey: process.env.BROWSERBASE_API_KEY!,
  browserbaseProjectId: process.env.BROWSERBASE_PROJECT_ID!,
  modelApiKey: process.env.MODEL_API_KEY!,
});
```

### Extract Data

Extract structured data from a web page using natural language instructions and Zod schemas:

```typescript
export const extractProducts = action({
  handler: async (ctx) => {
    const data = await stagehand.extract(ctx, {
      url: "https://example.com/products",
      instruction: "Extract all product names and prices",
      schema: z.object({
        products: z.array(z.object({
          name: z.string(),
          price: z.string(),
        }))
      })
    });

    return data.products;
  }
});
```

### Perform Actions

Execute browser interactions using plain English:

```typescript
export const loginToSite = action({
  handler: async (ctx) => {
    const result = await stagehand.act(ctx, {
      url: "https://example.com/login",
      action: "Click the login button and wait for the page to load"
    });

    return result;
  }
});
```

### Observe Elements

Identify interactive elements on a page:

```typescript
export const findNavLinks = action({
  handler: async (ctx) => {
    const actions = await stagehand.observe(ctx, {
      url: "https://example.com",
      instruction: "Find all clickable navigation links"
    });

    return actions;
  }
});
```

### Run Autonomous Tasks

Use the agent API for complex multi-step workflows:

```typescript
export const searchAndExtract = action({
  handler: async (ctx) => {
    const result = await stagehand.agent(ctx, {
      url: "https://google.com",
      instruction: "Search for 'convex database' and extract the top 3 results",
      options: { maxSteps: 10 }
    });

    return result;
  }
});
```

## Session Management

For workflows that span multiple operations, you can reuse browser sessions:

```typescript
export const multiStepWorkflow = action({
  handler: async (ctx) => {
    // Start a session
    const session = await stagehand.startSession(ctx, {
      url: "https://example.com",
      options: { timeout: 30000, waitUntil: "networkidle" }
    });

    // Perform multiple operations with the same session
    await stagehand.act(ctx, {
      sessionId: session.sessionId,
      action: "Click the login button"
    });

    const data = await stagehand.extract(ctx, {
      sessionId: session.sessionId,
      instruction: "Extract the user profile information",
      schema: z.object({
        name: z.string(),
        email: z.string(),
      })
    });

    // End the session
    await stagehand.endSession(ctx, { sessionId: session.sessionId });

    return data;
  }
});
```

Session persistence allows you to preserve authentication state and cookies between operations.

## Model Configuration

The default model is `openai/gpt-4o`. You can configure alternative providers:

```typescript
const stagehand = new Stagehand(components.stagehand, {
  browserbaseApiKey: process.env.BROWSERBASE_API_KEY!,
  browserbaseProjectId: process.env.BROWSERBASE_PROJECT_ID!,
  modelApiKey: process.env.ANTHROPIC_API_KEY!,
  modelName: "anthropic/claude-sonnet-4-5-20250929",
});
```

## Requirements

- Convex 1.29.3 or later
- A [Browserbase](https://browserbase.com) account with API credentials
- An API key from a supported LLM provider (OpenAI, Anthropic, etc.)

## References

<CardGroup cols={2}>
  <Card title="Source Code" icon="github" href="https://github.com/browserbase/convex-stagehand">
    Browse the complete repository on GitHub
  </Card>
  <Card title="Convex Docs" icon="book" href="https://docs.convex.dev">
    Learn more about Convex
  </Card>
</CardGroup>


================================================
FILE: packages/docs/v3/integrations/convex/introduction.mdx
================================================
---
title: "Convex"
sidebarTitle: Introduction
description: "AI-powered browser automation for Convex applications"
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


## Overview

This guide shows you how to use Stagehand with Convex to create AI-powered browser automation within your Convex applications. By the end of this guide, you'll know how to:

- Set up the convex-stagehand component in your Convex app
- Extract structured data from web pages using natural language
- Execute browser actions via plain English instructions
- Build autonomous multi-step workflows with the agent API

## When You'd Use This

The Convex integration is perfect for scenarios where you need browser automation in serverless Convex functions:

- **Data extraction pipelines**: Extract structured data from websites and store it directly in your Convex database
- **Automated workflows**: Build background jobs that interact with web pages on behalf of users
- **Form automation**: Automatically fill out and submit forms based on data from your Convex app
- **Multi-step web processes**: Execute complex browser workflows that require decision-making and adaptation

The integration wraps the Stagehand REST API to provide Convex actions with the ability to control cloud browsers via Browserbase:

1. **Act**: Perform actions like clicking, typing, or navigating using natural language
2. **Extract**: Extract structured data from web pages with Zod schemas
3. **Observe**: Identify and analyze interactive elements on the page
4. **Agent**: Run autonomous multi-step tasks with AI decision-making

<CardGroup cols={2}>
  <Card title="Source Code" icon="github" href="https://github.com/browserbase/convex-stagehand">
    Browse the repository on GitHub
  </Card>
  <Card title="Convex Configuration" icon="gear" href="/v3/integrations/convex/configuration">
    Learn how to set up and configure convex-stagehand
  </Card>
</CardGroup>


================================================
FILE: packages/docs/v3/integrations/crew-ai/configuration.mdx
================================================
---
title: "Use CrewAI to Automate Browser Tasks"
sidebarTitle: Configuration
description: "Create intelligent agents that can interact with websites and automate browser tasks using natural language instructions"
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


This guide walks you through setting up CrewAI with Browserbase to create agents that can perform web automation tasks using natural language instructions.

## Step 1: Install Dependencies

Install the required packages for CrewAI and Stagehand integration:

```bash
pip install stagehand crewai crewai-tools
```

## Step 2: Configure Environment Variables

You'll need credentials from two services:

1. **Browserbase API Key and Project ID**: Get these from your [Browserbase dashboard](https://www.browserbase.com/)
2. **LLM API Key**: Get an API key from [OpenAI](https://platform.openai.com/api-keys) or [Anthropic](https://console.anthropic.com/)

Store your API keys securely as environment variables:

```bash
BROWSERBASE_API_KEY="your-browserbase-api-key"
BROWSERBASE_PROJECT_ID="your-browserbase-project-id"
OPENAI_API_KEY="your-openai-api-key"
ANTHROPIC_API_KEY="your-anthropic-api-key"
```

## Step 3: Create Your First Agent

Create a Python script with a basic CrewAI agent:

```python
import os
from crewai import Agent, Task, Crew
from crewai_tools import StagehandTool
from stagehand.schemas import AvailableModel

# Get API keys from environment
browserbase_api_key = os.environ.get("BROWSERBASE_API_KEY")
browserbase_project_id = os.environ.get("BROWSERBASE_PROJECT_ID")
model_api_key = os.environ.get("OPENAI_API_KEY")  # or ANTHROPIC_API_KEY

# Initialize the StagehandTool
stagehand_tool = StagehandTool(
    api_key=browserbase_api_key,
    project_id=browserbase_project_id,
    model_api_key=model_api_key,
    model_name=AvailableModel.GPT_4O,  # or AvailableModel.CLAUDE_3_7_SONNET_LATEST
)

# Create an agent with the tool
researcher = Agent(
    role="Web Researcher",
    goal="Find and summarize information from websites",
    backstory="I'm an expert at finding information online.",
    verbose=True,
    tools=[stagehand_tool],
)
```

## Step 4: Create and Run a Task

Define a task for your agent and execute it:

```python
# Create a task that uses the tool
research_task = Task(
    description="Go to https://www.example.com and tell me what you see on the homepage.",
    agent=researcher,
)

# Run the crew
crew = Crew(
    agents=[researcher],
    tasks=[research_task],
    verbose=True,
)

try:
    result = crew.kickoff()
    print(result)
finally:
    # Clean up resources
    stagehand_tool.close()
```

## Step 5: Run Your Script

Execute your Python script:

```bash
python your_crew_script.py
```

## Advanced Configuration

Customize the StagehandTool behavior with additional parameters:

```python
stagehand_tool = StagehandTool(
    api_key=browserbase_api_key,
    project_id=browserbase_project_id,
    model_api_key=model_api_key,
    model_name=AvailableModel.CLAUDE_3_7_SONNET_LATEST,
    dom_settle_timeout_ms=5000,  # Wait longer for DOM to settle
    headless=True,  # Run browser in headless mode
    self_heal=True,  # Attempt to recover from errors
    wait_for_captcha_solves=True,  # Wait for CAPTCHA solving
    verbose=1,  # Control logging verbosity (0-3)
)
```

## Example Tasks

<Tabs>
  <Tab title="Form Submission" value="form-submission" label="Python">
    ```python
    form_task = Task(
        description="""
        Submit a contact form:
        1. Go to https://example.com/contact
        2. Fill out the form with name 'John Doe', email 'john@example.com'
        3. Submit and confirm success
        """,
        agent=researcher,
    )
    ```
  </Tab>
  <Tab title="Data Extraction" value="data-extraction" label="Python">
    ```python
    extraction_task = Task(
        description="""
        Extract product information:
        1. Go to the products page
        2. Extract all product names, prices, and descriptions
        3. Format as structured data
        """,
        agent=researcher,
    )
    ```
  </Tab>
  <Tab title="Multi-step Navigation" value="multi-step-navigation" label="Python">
    ```python
    navigation_task = Task(
        description="""
        Navigate and analyze:
        1. Start at homepage
        2. Navigate to products section
        3. Filter by 'Electronics' category
        4. Find and extract details of highest-rated product
        """,
        agent=researcher,
    )
    ```
  </Tab>
</Tabs>

<CardGroup cols={2}>
  <Card title="CrewAI Documentation" icon="book" href="https://docs.crewai.com/">
    Dive into the CrewAI documentation to learn more about its capabilities and integrations.
  </Card>
  <Card title="Browserbase Documentation" icon="book" href="https://docs.browserbase.com/">
    Access the Browserbase documentation for comprehensive guides and resources.
  </Card>
</CardGroup>

================================================
FILE: packages/docs/v3/integrations/crew-ai/introduction.mdx
================================================
---
title: "CrewAI Introduction"
sidebarTitle: Introduction
description: "Automate browser tasks using natural language instructions with CrewAI"
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


## Overview

This guide shows you how to use CrewAI with Browserbase to create intelligent agents that can automate web interactions. By the end of this guide, you'll know how to:

- Set up CrewAI with the StagehandTool
- Create agents that can interact with websites
- Automate browser tasks using natural language instructions
- Extract structured data from web pages

## When You'd Use This

The CrewAI integration is perfect for scenarios where you need intelligent web automation:

- **Research automation**: Have agents research information across multiple websites
- **Data collection**: Extract structured data from e-commerce sites, job boards, or news sites
- **Form automation**: Automatically fill out and submit forms based on specific criteria
- **Multi-step workflows**: Execute complex browser workflows that require decision-making

The StagehandTool wraps the Stagehand Python SDK to provide CrewAI agents with the ability to control a real web browser and interact with websites using three core primitives:

1. **Act**: Perform actions like clicking, typing, or navigating
2. **Extract**: Extract structured data from web pages
3. **Observe**: Identify and analyze elements on the page

<CardGroup cols={1}>
<Card title="CrewAI Configuration" icon="gear" href="/v3/integrations/crew-ai/configuration">
  Learn how to configure and use the StagehandTool with CrewAI agents for web automation tasks
</Card>
</CardGroup>

================================================
FILE: packages/docs/v3/integrations/langchain/configuration.mdx
================================================
---
title: "LangChain JS Configuration"
sidebarTitle: Configuration
description: "Set up Stagehand with LangChain JS to create intelligent web automation agents"
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


This guide walks you through integrating Stagehand with LangChain JS to build powerful web automation workflows using natural language instructions.

## Step 1: Install Dependencies

Install the required packages for LangChain JS and Stagehand integration:

```bash
npm install @langchain/langgraph @langchain/community @langchain/core @langchain/openai @browserbasehq/stagehand
```

## Step 2: Configure Environment Variables

For remote browser automation, set up your Browserbase credentials:

```bash
BROWSERBASE_API_KEY="your-browserbase-api-key"
BROWSERBASE_PROJECT_ID="your-browserbase-project-id"
```

## Step 3: Create a Stagehand Instance

Initialize Stagehand with your preferred configuration:

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

// For local development
const stagehand = new Stagehand({
    env: "LOCAL",
    verbose: 2,
    enableCaching: false,
});

// For production with Browserbase
const stagehand = new Stagehand({
    env: "BROWSERBASE",
    verbose: 1,
    enableCaching: true,
});
```

## Step 4: Generate the StagehandToolkit

Create the toolkit that provides LangChain-compatible tools:

```typescript
import { StagehandToolkit } from '@langchain/community/agents/toolkits/stagehand';

const stagehandToolkit = await StagehandToolkit.fromStagehand(stagehand);
```

## Step 5: Use Individual Tools

The toolkit provides four specialized tools for web automation:

### Available Tools

- **stagehand_navigate**: Navigate to specific URLs
- **stagehand_act**: Perform browser actions (clicking, typing, etc.)
- **stagehand_extract**: Extract structured data using schemas  
- **stagehand_observe**: Analyze page elements and possible actions

### Basic Tool Usage

```typescript
import { z } from "zod";

// Navigate to a website
const navigateTool = stagehandToolkit.tools.find(
    (t) => t.name === "stagehand_navigate"
);
await navigateTool.invoke("https://www.google.com");

// Perform an action
const actionTool = stagehandToolkit.tools.find(
    (t) => t.name === "stagehand_act"
);
await actionTool.invoke('Search for "OpenAI"');

// Observe the page
const observeTool = stagehandToolkit.tools.find(
    (t) => t.name === "stagehand_observe"
);
const result = await observeTool.invoke(
    "What actions can be performed on the current page?"
);
console.log(JSON.parse(result));

// Extract structured data
const extractTool = stagehandToolkit.tools.find(
    (t) => t.name === "stagehand_extract"
);
const extractResult = await extractTool.invoke({
    instruction: "Extract the main heading and description",
    schema: z.object({
        heading: z.string(),
        description: z.string(),
    }),
});
console.log(extractResult);
```

## Step 6: Build LangGraph Agents

Integrate with LangGraph for complex automation workflows:

```typescript
import { createReactAgent } from "@langchain/langgraph/prebuilt";
import { ChatOpenAI } from "@langchain/openai";

// Create an LLM
const llm = new ChatOpenAI({
    model: "gpt-4",
    temperature: 0,
});

// Create an agent with Stagehand tools
const agent = createReactAgent({
    llm,
    tools: stagehandToolkit.tools,
});

// Execute a complex workflow
const result = await agent.invoke({
    messages: [
        {
            role: "user", 
            content: "Go to example.com, find the contact form, and extract all the form fields"
        }
    ]
});
```

## Advanced Configuration

### Custom Stagehand Configuration

```typescript
const stagehand = new Stagehand({
    env: "BROWSERBASE",
    verbose: 2,
    enableCaching: true,
    headless: true,
    domSettleTimeoutMs: 5000,
});
```

### Error Handling

```typescript
try {
    const result = await agent.invoke({
        messages: [{ role: "user", content: "Navigate to invalid-url.com" }]
    });
} catch (error) {
    console.error("Automation failed:", error);
} finally {
    // Clean up resources
    await stagehand.close();
}
```

## Example Workflows

<Tabs>
  <Tab title="Data Extraction" value="data-extraction" label="TypeScript">
    ```typescript
    const extractionAgent = createReactAgent({
        llm,
        tools: stagehandToolkit.tools,
    });

    const result = await extractionAgent.invoke({
        messages: [{
            role: "user",
            content: `
                Go to news-website.com and extract:
                1. All article headlines
                2. Publication dates  
                3. Author names
                Format as structured JSON
            `
        }]
    });
    ```
  </Tab>
  <Tab title="Form Automation" value="form-automation" label="TypeScript">
    ```typescript
    const formAgent = createReactAgent({
        llm,
        tools: stagehandToolkit.tools,
    });

    const result = await formAgent.invoke({
        messages: [{
            role: "user", 
            content: `
                Navigate to contact-form.com and:
                1. Fill out the contact form with:
                   - Name: John Doe
                   - Email: john@example.com
                   - Message: Inquiry about services
                2. Submit the form
                3. Confirm submission success
            `
        }]
    });
    ```
  </Tab>
  <Tab title="Multi-site Research" value="multi-site-research" label="TypeScript">
    ```typescript
    const researchAgent = createReactAgent({
        llm,
        tools: stagehandToolkit.tools,
    });

    const result = await researchAgent.invoke({
        messages: [{
            role: "user",
            content: `
                Research product pricing by:
                1. Visit competitor1.com and extract pricing info
                2. Visit competitor2.com and extract pricing info  
                3. Compare features and prices
                4. Provide summary analysis
            `
        }]
    });
    ```
  </Tab>
</Tabs>

<CardGroup cols={1}>
  <Card title="LangChain JS Documentation" icon="book" href="https://js.langchain.com/docs/integrations/tools/stagehand/">
    Official LangChain JS documentation for the Stagehand integration
  </Card>
</CardGroup>

================================================
FILE: packages/docs/v3/integrations/langchain/introduction.mdx
================================================
---
title: "LangChain JS Introduction"
sidebarTitle: Introduction
description: "Integrate Stagehand with LangChain JS for intelligent web automation"
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


## Overview

This guide shows you how to use Stagehand with LangChain JS to create intelligent agents that can automate web interactions. By the end of this guide, you'll know how to:

- Set up the StagehandToolkit with LangChain JS
- Create agents that can navigate and interact with websites
- Extract structured data using natural language instructions
- Build complex automation workflows with LangGraph

## When You'd Use This

The LangChain JS integration is perfect for scenarios where you need intelligent web automation with advanced reasoning:

- **AI-driven research**: Create agents that can research information across multiple websites and synthesize findings
- **Dynamic form filling**: Automatically fill out complex forms based on contextual requirements
- **Data extraction workflows**: Extract and transform data from multiple sources with intelligent navigation
- **Multi-step web processes**: Execute complex browser workflows that require decision-making and adaptation

<CardGroup cols={1}>
<Card title="LangChain JS Configuration" icon="gear" href="/v3/integrations/langchain/configuration">
  Learn how to set up and configure the StagehandToolkit with LangChain JS agents
</Card>
</CardGroup>

================================================
FILE: packages/docs/v3/integrations/mcp/configuration.mdx
================================================
---
title: "Browserbase MCP Server Configuration"
sidebarTitle: "Configuration"
description: "Configure your browser automation with command-line flags, environment variables, and advanced options"
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


## Configuration Overview

The Browserbase MCP server supports extensive configuration options through command-line flags and environment variables. Configure browser behavior, proxy settings, stealth modes, model selection, and more to customize your browser automation workflows.

<Note>
Command-line flags are only available when running the server locally (`npx @browserbasehq/mcp-server-browserbase` with flags or local development setup).
</Note>

## Environment Variables

Configure the essential Browserbase credentials (the examples below also pass a `GEMINI_API_KEY` when using the default Gemini model):

<CardGroup cols={2}>
<Card title="BROWSERBASE_API_KEY" icon="key">
Your Browserbase API key for authentication
</Card>

<Card title="BROWSERBASE_PROJECT_ID" icon="key">
Your Browserbase project ID
</Card>

</CardGroup>

## Command-Line Flags

### Available Flags

| Flag | Description |
|------|-------------|
| `--proxies` | Enable Browserbase proxies for the session |
| `--advancedStealth` | Enable Browserbase Advanced Stealth (Scale Plan only) |
| `--keepAlive` | Enable Browserbase Keep Alive Session |
| `--contextId <contextId>` | Specify a Browserbase Context ID to use |
| `--persist [boolean]` | Whether to persist the Browserbase context (default: true) |
| `--port <port>` | Port to listen on for HTTP/SHTTP transport |
| `--host <host>` | Host to bind server to (default: localhost, use 0.0.0.0 for all interfaces) |
| `--browserWidth <width>` | Browser viewport width (default: 1024) |
| `--browserHeight <height>` | Browser viewport height (default: 768) |
| `--modelName <model>` | The model to use for Stagehand (default: google/gemini-2.5-flash-lite) |
| `--modelApiKey <key>` | API key for the custom model provider (required when using custom models) |
| `--experimental` | Enable experimental features (default: false) |

## Configuration Examples

### Basic Configuration

<Tabs>
<Tab title="Remote URL (SHTTP)">


<CodeGroup>
```json Direct SHTTP
{
  "mcpServers": {
    "browserbase": {
      "url": "your-smithery-url.com"
    }
  }
}
```
</CodeGroup>

When using our remote hosted server, we cover the LLM costs for Gemini, the [best performing model](https://www.stagehand.dev/evals) in [Stagehand](https://www.stagehand.dev).
</Tab>

<Tab title="NPM Package">

```json
{
  "mcpServers": {
    "browserbase": {
      "command": "npx",
      "args": ["@browserbasehq/mcp-server-browserbase"],
      "env": {
        "BROWSERBASE_API_KEY": "your_api_key",
        "BROWSERBASE_PROJECT_ID": "your_project_id",
        "GEMINI_API_KEY": "your_gemini_api_key"
      }
    }
  }
}
```
</Tab>

<Tab title="Local STDIO">
```json
{
  "mcpServers": {
    "browserbase": {
      "command": "node",
      "args": ["/path/to/mcp-server-browserbase/cli.js"],
      "env": {
        "BROWSERBASE_API_KEY": "your_api_key",
        "BROWSERBASE_PROJECT_ID": "your_project_id",
        "GEMINI_API_KEY": "your_gemini_api_key"
      }
    }
  }
}
```
</Tab>

<Tab title="Local SHTTP">
```bash
# Start server
node cli.js --port 8931
```

```json
{
  "mcpServers": {
    "browserbase": {
      "url": "http://localhost:8931/mcp",
      "env": {
        "BROWSERBASE_API_KEY": "your_api_key",
        "BROWSERBASE_PROJECT_ID": "your_project_id",
        "GEMINI_API_KEY": "your_gemini_api_key"
      }
    }
  }
}
```
</Tab>
</Tabs>

### Advanced Features

<Tabs>
<Tab title="Proxies">
Enable Browserbase proxies for IP rotation and geo-location testing.

<Panel>
[Learn more about Browserbase Proxies](https://docs.browserbase.com/features/proxies)
</Panel>

```json
{
  "mcpServers": {
    "browserbase": {
      "command": "npx",
      "args": ["@browserbasehq/mcp-server-browserbase", "--proxies"],
      "env": {
        "BROWSERBASE_API_KEY": "your_api_key",
        "BROWSERBASE_PROJECT_ID": "your_project_id",
        "GEMINI_API_KEY": "your_gemini_api_key"
      }
    }
  }
}
```
</Tab>

<Tab title="Advanced Stealth">
Enable advanced anti-detection features for enhanced stealth browsing.

<Panel>
[Learn more about Advanced Stealth](https://docs.browserbase.com/features/stealth-mode#advanced-stealth-mode)

**Note:** Advanced Stealth is only available for Scale Plan users.
</Panel>

```json
{
  "mcpServers": {
    "browserbase": {
      "command": "npx",
      "args": ["@browserbasehq/mcp-server-browserbase", "--advancedStealth"],
      "env": {
        "BROWSERBASE_API_KEY": "your_api_key",
        "BROWSERBASE_PROJECT_ID": "your_project_id",
        "GEMINI_API_KEY": "your_gemini_api_key"
      }
    }
  }
}
```
</Tab>

<Tab title="Contexts">
Use persistent browser contexts to maintain authentication and state across sessions.

<Panel>
[Learn more about Browserbase Contexts](https://docs.browserbase.com/features/contexts)
</Panel>

```json
{
  "mcpServers": {
    "browserbase": {
      "command": "npx",
      "args": ["@browserbasehq/mcp-server-browserbase", "--contextId", "your_context_id"],
      "env": {
        "BROWSERBASE_API_KEY": "your_api_key",
        "BROWSERBASE_PROJECT_ID": "your_project_id"
      }
    }
  }
}
```
</Tab>
</Tabs>

### Browser Customization

<Tabs>
<Tab title="Viewport Sizing">
Customize the browser viewport dimensions. The default is 1024x768 (see the `--browserWidth` and `--browserHeight` flags above). Recommended aspect ratio: 16:9.

```json
{
  "mcpServers": {
    "browserbase": {
      "command": "npx",
      "args": [
        "@browserbasehq/mcp-server-browserbase",
        "--browserWidth", "1920",
        "--browserHeight", "1080"
      ],
      "env": {
        "BROWSERBASE_API_KEY": "your_api_key",
        "BROWSERBASE_PROJECT_ID": "your_project_id",
        "GEMINI_API_KEY": "your_gemini_api_key"
      }
    }
  }
}
```

**Common Resolutions:**
- Desktop: 1920x1080, 1280x720, 1024x768
- Mobile: 375x667 (iPhone), 360x640 (Android)
- Tablet: 768x1024 (iPad)
</Tab>

</Tabs>

## Model Configuration

Configure AI models for enhanced browser automation. Stagehand defaults to Google's Gemini 2.5 Flash Lite but supports multiple providers.

<Warning>
When using any custom model (non-default), you must provide your own API key for that model provider using the `--modelApiKey` flag.
</Warning>

<Tabs>
<Tab title="Available Models">
**Google Gemini** (Default)
- `google/gemini-2.5-flash-lite` (default)
- `google/gemini-2.5-pro`
- `google/gemini-2.5-flash`

**OpenAI**
- `gpt-5-2025-08-07`
- `gpt-4.1-2025-04-14`
- `gpt-4o`
- `gpt-4o-mini`

**Anthropic Claude**
- `claude-sonnet-4-5`
- `claude-haiku-4-5`

[View full list of supported models](https://docs.stagehand.dev/v3/configuration/models#models)
</Tab>

<Tab title="Configuration Examples">
<CodeGroup>
```json OpenAI GPT-4o
{
  "mcpServers": {
    "browserbase": {
      "command": "npx",
      "args": [
        "@browserbasehq/mcp-server-browserbase",
        "--modelName", "gpt-4o",
        "--modelApiKey", "your_openai_api_key"
      ],
      "env": {
        "BROWSERBASE_API_KEY": "your_api_key",
        "BROWSERBASE_PROJECT_ID": "your_project_id"
      }
    }
  }
}
```

```json Claude Sonnet
{
  "mcpServers": {
    "browserbase": {
      "command": "npx",
      "args": [
        "@browserbasehq/mcp-server-browserbase",
        "--modelName", "claude-sonnet-4-6",
        "--modelApiKey", "your_anthropic_api_key"
      ],
      "env": {
        "BROWSERBASE_API_KEY": "your_api_key",
        "BROWSERBASE_PROJECT_ID": "your_project_id"
      }
    }
  }
}
```
</CodeGroup>
</Tab>
</Tabs>

## Development Configuration

<Tabs>
<Tab title="Custom Host/Port">
Configure custom host and port for SHTTP transport.

```json
{
  "mcpServers": {
    "browserbase": {
      "command": "npx",
      "args": [
        "@browserbasehq/mcp-server-browserbase",
        "--host", "0.0.0.0",
        "--port", "8080"
      ],
      "env": {
        "BROWSERBASE_API_KEY": "your_api_key",
        "BROWSERBASE_PROJECT_ID": "your_project_id",
        "GEMINI_API_KEY": "your_gemini_api_key"
      }
    }
  }
}
```
</Tab>
</Tabs>

## Best Practices

<Accordion title="Performance - How can I optimize browser automation performance?">
- Use appropriate viewport sizes for your use case
- Enable proxies only when needed for geo-location
- Choose efficient models (Gemini Flash for speed, GPT-4o for accuracy)
- Reuse contexts for authentication persistence
</Accordion>

<Accordion title="Security - What security measures should I implement?">
- Store API keys securely in environment variables
- Use Advanced Stealth for sensitive operations
- Implement proper session management
- Rotate cookies and contexts regularly
</Accordion>

<Accordion title="Development - What are the recommended development practices?">
- Enable debug mode during development
- Use context persistence for faster iteration
- Test with different viewport sizes
- Monitor session usage and quotas
</Accordion>

<Accordion title="Production - How should I configure for production environments?">
- Use NPM installation for reliability
- Configure appropriate timeouts
- Implement error handling and retries
- Monitor performance and resource usage
</Accordion>

## Further Reading

<CardGroup cols={3}>
<Card title="Browserbase Documentation" icon="globe" href="https://docs.browserbase.com">
Complete platform documentation
</Card>

<Card title="Stagehand Docs" icon="robot" href="https://docs.stagehand.dev/">
AI-powered browser automation
</Card>

<Card title="Support" icon="headset" href="mailto:support@browserbase.com">
Get help from our team
</Card>
</CardGroup>


================================================
FILE: packages/docs/v3/integrations/mcp/introduction.mdx
================================================
---
title: "Browserbase MCP Server"
sidebarTitle: "Introduction"
description: "AI-powered browser automation through Model Context Protocol integration with Stagehand"
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />

## Overview

The Browserbase MCP Server brings powerful browser automation capabilities to MCP clients through the Model Context Protocol (MCP). Built on top of [Stagehand](https://docs.stagehand.dev/), this integration provides AI-powered web automation using natural language commands.

<Info>
  The hosted [Streamable HTTP](https://modelcontextprotocol.io/specification/2025-03-26/basic/transports#streamable-http)
  endpoint is served on Browserbase infrastructure.
  You can also run the MCP server locally with STDIO, but we recommend the
  hosted [Streamable HTTP](https://modelcontextprotocol.io/specification/2025-03-26/basic/transports#streamable-http)
  endpoint for most users.
</Info>

## Key Features

<CardGroup cols={2}>
<Card title="Natural Language Automation" icon="wand-magic-sparkles">
Control browsers using plain English commands like "click the login button" or "fill out the contact form"
</Card>

<Card title="Web Interaction" icon="browser">
  Navigate, click, and fill forms with ease
</Card>

<Card title="Data Extraction" icon="download">
  Extract structured data from any website automatically
</Card>

<Card title="Session Lifecycle" icon="route">
  Create, reuse, and close browser sessions with explicit MCP tools
</Card>

</CardGroup>

## Core Benefits

<Tabs>
<Tab title="Ease of Use">
<CardGroup cols={2}>
<Card title="Intuitive Commands" icon="wand-magic-sparkles">
No need to learn complex selectors or automation syntax. Simply describe what you want to do in natural language.
</Card>

<Card title="Quick Setup" icon="rocket">
  Get started in minutes with either hosted [Streamable HTTP](https://modelcontextprotocol.io/specification/2025-03-26/basic/transports#streamable-http) or local STDIO.
</Card>

<Card title="Smart Automation" icon="brain">
Stagehand's AI understands web page context and can adapt to different layouts and designs.
</Card>
</CardGroup>
</Tab>

<Tab title="Powerful Capabilities">
<CardGroup cols={2}>
<Card title="Full Browser Control" icon="browser">
Navigate, click, type, scroll, and interact with any web element.
</Card>

<Card title="Data Intelligence" icon="chart-line">
  Extract structured information from complex web pages automatically.
</Card>

<Card title="Session Persistence" icon="cookie-bite">
Maintain authentication states and cookies across multiple interactions.
</Card>
</CardGroup>
</Tab>

<Tab title="Enterprise Ready">
<CardGroup cols={2}>
<Card title="Reliable Infrastructure" icon="server">
Hosted [Streamable HTTP](https://modelcontextprotocol.io/specification/2025-03-26/basic/transports#streamable-http) runs on Browserbase infrastructure for consistent performance.
</Card>

<Card title="Scalable Architecture" icon="arrows-up-to-line">
  Handle multiple concurrent sessions and high-volume automation tasks.
</Card>

<Card title="Security Features" icon="shield-check">
  Stealth mode, proxy support, and advanced anti-detection capabilities.
</Card>

<Card title="Comprehensive Logging" icon="file-lines">
Detailed session recordings and debugging information.
</Card>
</CardGroup>
</Tab>
</Tabs>

## Use Cases

<Tabs>
<Tab title="Web Scraping & Data Collection">
<CardGroup cols={2}>
<Card title="E-commerce Monitoring" icon="store">
Track product prices, availability, and competitor information
</Card>

<Card title="Market Research" icon="chart-bar">
  Gather data from multiple sources for analysis and reporting
</Card>

<Card title="Content Aggregation" icon="newspaper">
  Collect articles, posts, and media from various websites
</Card>

<Card title="Lead Generation" icon="users">
Extract contact information and business data from directories
</Card>
</CardGroup>
</Tab>

<Tab title="Testing">
<CardGroup cols={2}>
<Card title="Automated Testing" icon="flask">
Create comprehensive test suites for web applications
</Card>

<Card title="Cross-Browser Validation" icon="browsers">
  Test functionality across different browser environments
</Card>

<Card title="User Journey Testing" icon="route">
  Simulate real user interactions and workflows
</Card>

<Card title="Performance Monitoring" icon="gauge">
Track page load times and user experience metrics
</Card>
</CardGroup>
</Tab>

<Tab title="Workflow Automation">
<CardGroup cols={2}>
<Card title="Form Automation" icon="file-contract">
Automatically fill and submit complex web forms
</Card>

<Card title="Report Generation" icon="chart-line">
  Extract data and generate automated reports
</Card>

<Card title="Social Media Management" icon="share-nodes">
  Schedule posts and monitor engagement across platforms
</Card>

<Card title="Administrative Tasks" icon="clipboard-check">
Automate repetitive web-based business processes
</Card>
</CardGroup>
</Tab>
</Tabs>

## Getting Started

<Steps>
<Step title="Install the MCP Server">
Choose hosted [Streamable HTTP](https://modelcontextprotocol.io/specification/2025-03-26/basic/transports#streamable-http) (recommended) or local STDIO based on your needs.
</Step>

<Step title="Configure Authentication">
  Set up your Browserbase API credentials in MCP configuration. Get API keys
  from the [Browserbase Dashboard](https://www.browserbase.com/overview).
</Step>

<Step title="Start Automating">
Begin using natural language commands to control browsers through your MCP client.
</Step>
</Steps>

<Tip>
  Ready to get started? Check out the [Setup Guide](/v3/integrations/mcp/setup).
</Tip>

## Further Reading

<CardGroup cols={3}>
<Card title="Setup Guide" icon="rocket" href="/v3/integrations/mcp/setup">
Get started with installation and configuration
</Card>

<Card title="MCP Docs" icon="book" href="https://modelcontextprotocol.io/introduction">
Learn more about the MCP protocol
</Card>

<Card title="Browserbase Docs" icon="globe" href="https://docs.browserbase.com">
Explore Browserbase features and capabilities
</Card>
</CardGroup>


================================================
FILE: packages/docs/v3/integrations/mcp/setup.mdx
================================================
---
title: "Browserbase MCP Server Setup"
sidebarTitle: "Setup"
description: "Add the Browserbase MCP Server to your MCP client"
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />

## Quick Installation

<Card title="Install with Cursor" icon="arrow-pointer" href="cursor://anysphere.cursor-deeplink/mcp/install?name=browserbase&config=eyJ1cmwiOiJodHRwczovL21jcC5icm93c2VyYmFzZS5jb20vbWNwP2Jyb3dzZXJiYXNlQXBpS2V5PVlPVVJfQlJPV1NFUkJBU0VfQVBJX0tFWSJ9">
  One-click installation directly in Cursor
</Card>

You can also add Browserbase MCP to Claude Code with a single command:

```bash
claude mcp add --transport http browserbase "https://mcp.browserbase.com/mcp?browserbaseApiKey=YOUR_BROWSERBASE_API_KEY"
```

We support both local STDIO and hosted [Streamable HTTP](https://modelcontextprotocol.io/specification/2025-03-26/basic/transports#streamable-http) (SHTTP). We recommend hosted [Streamable HTTP](https://modelcontextprotocol.io/specification/2025-03-26/basic/transports#streamable-http) for most users.

## Endpoint

Hosted [Streamable HTTP](https://modelcontextprotocol.io/specification/2025-03-26/basic/transports#streamable-http) endpoint (served on Browserbase infrastructure):

```text
https://mcp.browserbase.com/mcp
```

## Prerequisites

<Steps>
<Step title="Get your Browserbase credentials">
Get your Browserbase API key from the [Browserbase Dashboard](https://www.browserbase.com/overview).

<Frame>
<img src="/images/quickstart/api-key.png" alt="Browserbase API Key settings" />
</Frame>

Then copy your API Key directly from the input.
</Step>
</Steps>

## Query Parameters (Hosted [Streamable HTTP](https://modelcontextprotocol.io/specification/2025-03-26/basic/transports#streamable-http))

### Required for tool calls

<CardGroup cols={1}>
<Card title="browserbaseApiKey" icon="key">
Browserbase API key.
</Card>
</CardGroup>

### Optional

| Query Param       | Type           | Behavior                                   |
| ----------------- | -------------- | ------------------------------------------ |
| `modelName`       | string         | Defaults to `google/gemini-2.5-flash-lite` |
| `modelApiKey`     | string         | Required when `modelName` is non-default   |
| `keepAlive`       | boolean string | `"true"` or `"false"`                      |
| `proxies`         | boolean string | `"true"` or `"false"`                      |
| `advancedStealth` | boolean string | `"true"` or `"false"`                      |

<Warning>
  Boolean query values must be exact strings: `"true"` or `"false"`.
</Warning>

## Available Tools

<Accordion title="navigate">
Navigate to any URL in the browser

<ParamField path="url" type="string" required>
  The URL to navigate to
</ParamField>
</Accordion>

<Accordion title="act">
Perform an action on the web page using natural language

<ParamField path="action" type="string" required>
  The action to perform (e.g., "click the login button", "fill form field")
</ParamField>
</Accordion>

<Accordion title="observe">
Observe and find actionable elements on the page.

<ParamField path="instruction" type="string" required>
  Specific instruction for observation (e.g., "find the login button", "locate search form")
</ParamField>
</Accordion>

<Accordion title="extract">
Extract data from the current page.

<ParamField path="instruction" type="string">
Optional extraction instruction.
</ParamField>
</Accordion>

<Accordion title="start">
Create or reuse a Browserbase session and set it as active for the current MCP transport session.

<Info>No input parameters required.</Info>

<ResponseField name="sessionId" type="string">
Browserbase session ID.
</ResponseField>
</Accordion>

<Accordion title="end">
Close the active Browserbase session for the current MCP transport session.

<Info>No input parameters required.</Info>
</Accordion>

## Local Command-Line Flags

<Note>
Command-line flags are only available when running the server locally (`npx @browserbasehq/mcp-server-browserbase` with flags or local development setup).
</Note>

| Flag | Description |
|------|-------------|
| `--proxies` | Enable Browserbase proxies for the session |
| `--advancedStealth` | Enable Browserbase Advanced Stealth (Scale Plan only) |
| `--keepAlive` | Enable Browserbase Keep Alive Session |
| `--contextId <contextId>` | Specify a Browserbase Context ID to use |
| `--persist [boolean]` | Whether to persist the Browserbase context (default: true) |
| `--port <port>` | Port to listen on for HTTP or [Streamable HTTP](https://modelcontextprotocol.io/specification/2025-03-26/basic/transports#streamable-http) transport |
| `--host <host>` | Host to bind server to (default: localhost, use 0.0.0.0 for all interfaces) |
| `--browserWidth <width>` | Browser viewport width (default: 1024) |
| `--browserHeight <height>` | Browser viewport height (default: 768) |
| `--modelName <model>` | The model to use for Stagehand (default: google/gemini-2.5-flash-lite) |
| `--modelApiKey <key>` | API key for the custom model provider (required when using custom models) |
| `--experimental` | Enable experimental features (default: false) |

## Installation Methods

<Tabs>
<Tab title="Hosted (recommended)">

Use your MCP client config:

```json
{
  "mcpServers": {
    "browserbase": {
      "url": "https://mcp.browserbase.com/mcp?browserbaseApiKey=YOUR_BROWSERBASE_API_KEY"
    }
  }
}
```

For custom models, include `modelName` and `modelApiKey`:

```json
{
  "mcpServers": {
    "browserbase": {
      "url": "https://mcp.browserbase.com/mcp?browserbaseApiKey=YOUR_BROWSERBASE_API_KEY&modelName=openai/gpt-4.1&modelApiKey=YOUR_MODEL_API_KEY"
    }
  }
}
```

</Tab>

<Tab title="NPM Package (STDIO)">
The easiest way to get started locally is using our NPM package.

<Note>
If you would like to use a different model, you have to pass the model name and keys in the args. More info in the [Local Command-Line Flags](#local-command-line-flags) section.
</Note>

<Steps>
<Step title="Add to MCP Config">
Go into your MCP Config JSON and add the Browserbase Server:

<CodeGroup>
```json Claude Desktop
{
  "mcpServers": {
    "browserbase": {
      "command": "npx",
      "args": ["@browserbasehq/mcp-server-browserbase"],
      "env": {
        "BROWSERBASE_API_KEY": "your_api_key",
        "GEMINI_API_KEY": "your_gemini_api_key"
      }
    }
  }
}
```
</CodeGroup>
</Step>

<Step title="Restart your MCP client">
<Check>
That's it! Reload your MCP client and you will be able to use Browserbase.
</Check>
</Step>
</Steps>

</Tab>

<Tab title="Local Development">
For local development or customization, you can run the server locally.

<Steps>
<Step title="Clone and build">
```bash
# Clone the Repo
git clone https://github.com/browserbase/mcp-server-browserbase.git
cd mcp-server-browserbase

# Install the dependencies and build the project
npm install && npm run build
```
</Step>

<Step title="Choose your transport method">
You can run locally using either STDIO or [Streamable HTTP](https://modelcontextprotocol.io/specification/2025-03-26/basic/transports#streamable-http).

<Tabs>
<Tab title="STDIO">
Add the following to your MCP Config JSON file:

```json
{
  "mcpServers": {
    "browserbase": {
      "command": "node",
      "args": ["/path/to/mcp-server-browserbase/cli.js"],
      "env": {
        "BROWSERBASE_API_KEY": "your_api_key",
        "GEMINI_API_KEY": "your_gemini_api_key"
      }
    }
  }
}
```
</Tab>

<Tab title="Self-hosted Streamable HTTP">
First, run the server:

```bash
node cli.js --port 8931
```

Then add this to your MCP Config JSON file:

```json
{
  "mcpServers": {
    "browserbase": {
      "url": "http://localhost:8931/mcp",
      "env": {
        "BROWSERBASE_API_KEY": "your_api_key",
        "GEMINI_API_KEY": "your_gemini_api_key"
      }
    }
  }
}
```
</Tab>
</Tabs>
</Step>

<Step title="Restart your client">
<Check>
Reload your MCP client and you should be good to go!
</Check>
</Step>
</Steps>
</Tab>
</Tabs>

## Verify Installation

<Steps>
<Step title="Restart your MCP client">
Restart/refresh your MCP client app and verify tools are available.
</Step>

<Step title="Test the integration">
Ask your MCP client to navigate to any page, then watch your Browserbase browser in action on the [dashboard](https://www.browserbase.com/sessions).

<Tip>
Try: "Navigate to example.com and extract the main heading"
</Tip>
</Step>
</Steps>

## Further Reading

<CardGroup cols={3}>
<Card title="Model Context Protocol (MCP) Docs" icon="book" href="https://modelcontextprotocol.io/introduction">
Learn more about the MCP protocol
</Card>

<Card title="Browserbase Documentation" icon="globe" href="https://docs.browserbase.com">
Explore Browserbase features and capabilities
</Card>

<Card title="Support" icon="headset" href="mailto:support@browserbase.com">
Get help from our support team
</Card>
</CardGroup>


================================================
FILE: packages/docs/v3/integrations/mcp/tools.mdx
================================================
---
title: "Browserbase MCP Server Tools"
sidebarTitle: "Tools"
description: "This guide covers the specialized tools available in the Browserbase MCP server for browser automation and interaction."
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


## Overview

The Browserbase MCP server provides tools for browser automation and session management through a transport-scoped active session.

## Core Browser Automation Tools

These are the primary tools for modern web automation using natural language commands.

<Accordion title="navigate">
Navigate to any URL in the browser

<ParamField path="url" type="string" required>
  The URL to navigate to
</ParamField>
</Accordion>

<Accordion title="act">
Perform an action on the web page using natural language

<ParamField path="action" type="string" required>
  The action to perform (e.g., "click the login button", "fill form field")
</ParamField>

</Accordion>

<Accordion title="observe">
Observe and find actionable elements on the page.

<ParamField path="instruction" type="string" required>
  Specific instruction for observation (e.g., "find the login button", "locate search form")
</ParamField>
</Accordion>

<Accordion title="extract">
Extract data from the current page.

<ParamField path="instruction" type="string">
  Optional extraction instruction.
</ParamField>
</Accordion>

## Session Management

<Accordion title="start">
Create or reuse a Browserbase session and set it as active for the current MCP transport session.

<Info>No input parameters required.</Info>

<ResponseField name="sessionId" type="string">
  Browserbase session ID.
</ResponseField>
</Accordion>

<Accordion title="end">
Close the active Browserbase session for the current MCP transport session.

<Info>No input parameters required.</Info>
</Accordion>

## Further Reading

<CardGroup cols={3}>
<Card title="Model Context Protocol (MCP) Docs" icon="book" href="https://modelcontextprotocol.io/introduction">
Learn more about the MCP protocol
</Card>

<Card title="Stagehand Documentation" icon="robot" href="https://docs.stagehand.dev/">
Explore Stagehand's AI-powered browser automation
</Card>

<Card title="Support" icon="headset" href="mailto:support@browserbase.com">
Get help from our support team
</Card>
</CardGroup>


================================================
FILE: packages/docs/v3/integrations/playwright.mdx
================================================
---
title: Playwright
description: Use Stagehand with Playwright for browser automation
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


## Overview

Stagehand v3 can work seamlessly with Playwright, allowing you to use Playwright's `Page` objects directly with Stagehand's AI-powered methods like `act()`, `extract()`, and `observe()`.

## Installation

First, install both Stagehand and Playwright:

```bash
npm install @browserbasehq/stagehand playwright-core
```

## Quickstart

### Basic Setup

Connect Playwright to Stagehand's browser instance using Chrome DevTools Protocol (CDP):

```typescript
import { Stagehand } from "@browserbasehq/stagehand";
import { chromium } from "playwright-core";

const stagehand = new Stagehand({
  env: "BROWSERBASE", // or "LOCAL"
  model: "openai/gpt-5",
});

await stagehand.init();

// Connect Playwright to Stagehand's browser
const browser = await chromium.connectOverCDP({
  wsEndpoint: stagehand.connectURL(),
});

const pwContext = browser.contexts()[0];
const pwPage = pwContext.pages()[0];
```

### Using Playwright Pages with Stagehand

Once connected, you can use Playwright's `Page` objects with Stagehand's AI-powered methods:

```typescript
import { z } from "zod";

// Navigate using Playwright
await pwPage.goto("https://example.com");

// Use Stagehand's AI methods with the Playwright page
await stagehand.act("click the login button", { page: pwPage });

const data = await stagehand.extract(
  "extract the article title",
  z.object({ title: z.string() }),
  { page: pwPage }
);
```

## Multi-Page Example

Stagehand works great with multiple Playwright pages:

```typescript
import { Stagehand } from "@browserbasehq/stagehand";
import { chromium } from "playwright-core";
import { z } from "zod";

// Initialize Stagehand
const stagehand = new Stagehand({
  env: "BROWSERBASE",
  model: "openai/gpt-5",
});

await stagehand.init();

// Connect Playwright
const browser = await chromium.connectOverCDP({
  wsEndpoint: stagehand.connectURL(),
});

const pwContext = browser.contexts()[0];
const pwPage1 = pwContext.pages()[0];

// Create a second page
const pwPage2 = await pwContext.newPage();

// Navigate both pages
await pwPage1.goto("https://docs.stagehand.dev/first-steps/introduction");
await pwPage2.goto("https://docs.stagehand.dev/configuration/observability");

// Extract data from both pages concurrently
const [page1Data, page2Data] = await Promise.all([
  stagehand.extract(
    "extract the names of the four stagehand primitives",
    z.array(z.string()),
    { page: pwPage1 }
  ),
  stagehand.extract(
    "extract the list of session dashboard features",
    z.array(z.string()),
    { page: pwPage2 }
  ),
]);

console.log("Page 1 primitives:", page1Data);
console.log("Page 2 features:", page2Data);
```

## Complete Example

Here's a full working example:

```typescript
import { Stagehand } from "@browserbasehq/stagehand";
import { chromium } from "playwright-core";
import { z } from "zod";

async function main() {
  // Initialize Stagehand
  const stagehand = new Stagehand({
    env: "BROWSERBASE",
    model: "openai/gpt-5",
    verbose: 1,
  });

  await stagehand.init();
  console.log("Stagehand initialized");

  // Connect Playwright to Stagehand's browser
  const browser = await chromium.connectOverCDP({
    wsEndpoint: stagehand.connectURL(),
  });

  const pwContext = browser.contexts()[0];
  const pwPage = pwContext.pages()[0];

  // Navigate and interact
  await pwPage.goto("https://example.com");

  // Use Stagehand's AI methods
  const actions = await stagehand.observe("find the main heading", {
    page: pwPage,
  });

  console.log("Found actions:", actions);

  // Extract data
  const heading = await stagehand.extract(
    "extract the main heading text",
    z.object({ heading: z.string() }),
    { page: pwPage }
  );

  console.log("Heading:", heading);

  // Cleanup
  await stagehand.close();
}

main();
```

## Key Points

- **Connect via CDP**: Use `chromium.connectOverCDP()` with `stagehand.connectURL()` as the WebSocket endpoint
- **Pass the page**: Always pass the Playwright `page` object to Stagehand methods using the `{ page }` option
- **Multi-page support**: Create multiple pages with `pwContext.newPage()` and pass them to Stagehand methods
- **Concurrent operations**: Use `Promise.all()` to run multiple Stagehand operations in parallel across different pages

## Environment Variables

When using Browserbase, set your credentials:

```bash
BROWSERBASE_API_KEY=your_api_key
BROWSERBASE_PROJECT_ID=your_project_id
```

For OpenAI (or other providers):

```bash
OPENAI_API_KEY=your_api_key
```

## Next Steps

<CardGroup cols={2}>
  <Card title="Agent" icon="robot" href="/v3/references/agent">
    Automate entire workflows
  </Card>
  <Card title="Act" icon="play" href="/v3/references/act">
    Execute actions on web pages
  </Card>
  <Card title="Extract" icon="ufo-beam" href="/v3/references/extract">
    Extract structured data from pages
  </Card>
  <Card title="Observe" icon="eye" href="/v3/references/observe">
    Observe and find elements on pages
  </Card>
</CardGroup>


================================================
FILE: packages/docs/v3/integrations/puppeteer.mdx
================================================
---
title: Puppeteer
description: Use Stagehand with Puppeteer for browser automation
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


## Overview

Stagehand v3 can work seamlessly with Puppeteer, allowing you to use Puppeteer's `Page` objects directly with Stagehand's AI-powered methods like `act()`, `extract()`, and `observe()`.

## Installation

First, install both Stagehand and Puppeteer:

```bash
npm install @browserbasehq/stagehand puppeteer-core
```

## Quickstart

### Basic Setup

Connect Puppeteer to Stagehand's browser instance:

```typescript
import { Stagehand } from "@browserbasehq/stagehand";
import puppeteer from "puppeteer-core";

const stagehand = new Stagehand({
  env: "LOCAL", // or "BROWSERBASE"
  model: "openai/gpt-5",
});

await stagehand.init();

// Connect Puppeteer to Stagehand's browser
const browser = await puppeteer.connect({
  browserWSEndpoint: stagehand.connectURL(),
  defaultViewport: null,
});

const pages = await browser.pages();
const ppPage = pages[0];
```

### Using Puppeteer Pages with Stagehand

Once connected, you can use Puppeteer's `Page` objects with Stagehand's AI-powered methods:

```typescript
import { z } from "zod";

// Navigate using Puppeteer
await ppPage.goto("https://example.com");

// Use Stagehand's AI methods with the Puppeteer page
await stagehand.act("click the sign in button", { page: ppPage });

const data = await stagehand.extract(
  "extract the page title",
  z.object({ title: z.string() }),
  { page: ppPage }
);
```

## Advanced: Multi-Page Usage

Create and manage multiple Puppeteer pages with Stagehand:

```typescript
import { Stagehand } from "@browserbasehq/stagehand";
import puppeteer from "puppeteer-core";
import { z } from "zod";

async function multiPageExample() {
  const stagehand = new Stagehand({
    env: "BROWSERBASE",
    model: "openai/gpt-5",
  });

  await stagehand.init();

  // Connect Puppeteer
  const browser = await puppeteer.connect({
    browserWSEndpoint: stagehand.connectURL(),
    defaultViewport: null,
  });

  // Get the first page
  const pages = await browser.pages();
  const ppPage1 = pages[0];

  // Create a second page
  const ppPage2 = await browser.newPage();

  // Navigate both pages
  await ppPage1.goto("https://example.com");
  await ppPage2.goto("https://another-site.com");

  // Use Stagehand on different pages
  await stagehand.act("click the button", { page: ppPage1 });

  const data = await stagehand.extract(
    "extract the title",
    z.object({ title: z.string() }),
    { page: ppPage2 }
  );

  console.log("Extracted from page 2:", data);

  await stagehand.close();
}
```

## Observe + Act Pattern

The recommended pattern for reliable automation:

```typescript
// Step 1: Observe to find candidate actions
const actions = await stagehand.observe(
  "find the submit button",
  { page: ppPage }
);

// Step 2: Execute the first action
if (actions.length > 0) {
  await stagehand.act(actions[0], { page: ppPage });
}
```

This pattern helps avoid DOM changes between observation and action execution.

## Key Points

- **Connect via WebSocket**: Use `puppeteer.connect()` with `stagehand.connectURL()` as the `browserWSEndpoint`
- **Pass the page**: Always pass the Puppeteer `page` object to Stagehand methods using the `{ page }` option
- **Disable viewport**: Set `defaultViewport: null` to use Stagehand's viewport settings
- **Multi-page support**: Create multiple pages with `browser.newPage()` and pass them to Stagehand methods

## Environment Variables

When using Browserbase, set your credentials:

```bash
BROWSERBASE_API_KEY=your_api_key
BROWSERBASE_PROJECT_ID=your_project_id
```

For OpenAI (or other providers):

```bash
OPENAI_API_KEY=your_api_key
```

## Comparison: Stagehand Native vs Puppeteer

| Feature | Stagehand Native | With Puppeteer |
|---------|------------------|----------------|
| **Setup** | Simple - use `stagehand.context.pages()` | Requires `puppeteer.connect()` |
| **Page Access** | `stagehand.context.pages()[0]` | `await browser.pages()` |
| **AI Methods** | `stagehand.act("click")` | `stagehand.act("click", { page: ppPage })` |
| **Best For** | Pure Stagehand workflows | Existing Puppeteer codebases |

## Next Steps

<CardGroup cols={2}>
  <Card title="Agent" icon="robot" href="/v3/references/agent">
    Automate entire workflows
  </Card>
  <Card title="Act" icon="play" href="/v3/references/act">
    Execute actions on web pages
  </Card>
  <Card title="Extract" icon="ufo-beam" href="/v3/references/extract">
    Extract structured data from pages
  </Card>
  <Card title="Observe" icon="eye" href="/v3/references/observe">
    Observe and find elements on pages
  </Card>
</CardGroup>


================================================
FILE: packages/docs/v3/integrations/selenium.mdx
================================================
---
title: Selenium
description: Use Stagehand with Selenium to operate the same browser in tandem
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


## Overview

Stagehand v3 can work alongside Selenium WebDriver, allowing both tools to operate on the same browser session simultaneously. This enables you to combine Stagehand's AI-powered automation with Selenium's precise element interactions.

<Warning>
**Browserbase Only**: This integration requires Browserbase. It does not work with `env: "LOCAL"` because Selenium needs a remote WebDriver endpoint.
</Warning>

## Installation

Install Stagehand, Selenium, and the Browserbase SDK:

```bash
npm install @browserbasehq/stagehand selenium-webdriver @browserbasehq/sdk
```

## Quickstart

### Create Shared Session

Use the Browserbase SDK to create a session that both tools can connect to:

```typescript
import http from "http";
import { Builder, Key } from "selenium-webdriver";
import Browserbase from "@browserbasehq/sdk";
import { Stagehand } from "@browserbasehq/stagehand";

const bb = new Browserbase({
  apiKey: process.env.BROWSERBASE_API_KEY,
});

// Create shared session
const session = await bb.sessions.create({
  projectId: process.env.BROWSERBASE_PROJECT_ID,
});

console.log("Session created:", session.id);
```

### Connect Stagehand

Initialize Stagehand with the session ID:

```typescript
const stagehand = new Stagehand({
  env: "BROWSERBASE",
  browserbaseSessionID: session.id,
  model: "openai/gpt-5",
  verbose: 2,
});

await stagehand.init();
```

### Connect Selenium

Use a custom HTTP agent with the session's signing key:

```typescript
// Create custom HTTP agent with signing key
const customHttpAgent = new http.Agent({});
(customHttpAgent as any).addRequest = (req: any, options: any) => {
  req.setHeader("x-bb-signing-key", session.signingKey);
  (http.Agent.prototype as any).addRequest.call(customHttpAgent, req, options);
};

// Connect Selenium WebDriver
const driver = new Builder()
  .forBrowser("chrome")
  .usingHttpAgent(customHttpAgent)
  .usingServer(session.seleniumRemoteUrl)
  .build();
```

### Use Both Tools Together

Now both Stagehand and Selenium operate on the same browser:

```typescript
// Navigate with Stagehand
const page = stagehand.context.pages()[0];
await page.goto("https://www.google.com");

// Extract page content with Stagehand AI
const pageContent = await stagehand.extract();
console.log("Page content:", pageContent);

// Use Selenium for precise element interaction
const searchBox = await driver.findElement({ name: "q" });
await searchBox.sendKeys("Browserbase automation");
await searchBox.sendKeys(Key.RETURN);

// Wait for results
await driver.sleep(2000);

console.log("Search completed!");
```

## Key Points

- **Shared Session**: Both tools connect to the same Browserbase session
- **Signing Key**: Selenium requires the session's `signingKey` in HTTP headers
- **Remote URL**: Use `session.seleniumRemoteUrl` for Selenium's server endpoint
- **Concurrent Usage**: Both tools can operate on the browser simultaneously
- **Cleanup**: Close both Stagehand (`await stagehand.close()`) and Selenium (`await driver.quit()`)

## Next Steps

<CardGroup cols={2}>
  <Card title="Agent" icon="robot" href="/v3/references/agent">
    Automate entire workflows
  </Card>
  <Card title="Act" icon="play" href="/v3/references/act">
    Execute actions on web pages
  </Card>
  <Card title="Extract" icon="ufo-beam" href="/v3/references/extract">
    Extract structured data from pages
  </Card>
  <Card title="Observe" icon="eye" href="/v3/references/observe">
    Observe and find elements on pages
  </Card>
</CardGroup>


================================================
FILE: packages/docs/v3/integrations/vercel/configuration.mdx
================================================
---
title: Use Stagehand in Next.js
sidebarTitle: Configuration
description: Next.js is a popular framework for developing web-based applications in production. It powers Stagehand apps like [Director](https://director.ai), [Brainrot](https://brainrot.run) and [Open Operator](https://operator.browserbase.com).
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


<Card
  title="Check out the Stagehand Next.js Quickstart"
  icon="github"
  href="https://github.com/browserbase/stagehand-nextjs-quickstart"
>
  Clone our [GitHub repo](https://github.com/browserbase/stagehand-nextjs-quickstart) to get started with Stagehand (v2) in Next.js.
</Card>

## Add Stagehand to an existing Next.js project
If you don't have a Next.js project yet, you can create one from scratch:

<Tabs>
<Tab title="npm">
```bash
npm create next-app@latest stagehand-nextjs --yes
cd stagehand-nextjs
```
</Tab>
<Tab title="pnpm">
```bash
pnpm create next-app@latest stagehand-nextjs --yes
cd stagehand-nextjs
```
</Tab>
<Tab title="yarn">
```bash
yarn create next-app@latest stagehand-nextjs --yes
cd stagehand-nextjs
```
</Tab>
</Tabs>

If you'd like to add Stagehand to an existing Next.js project, you can do so by installing the dependencies:
<Tabs>
	<Tab title="npm">
	```bash
	npm install @browserbasehq/stagehand @browserbasehq/sdk playwright zod
	```
	</Tab>

	<Tab title="pnpm">
	```bash
	pnpm add @browserbasehq/stagehand @browserbasehq/sdk playwright zod
	```
	</Tab>

	<Tab title="yarn">
	```bash
	yarn add @browserbasehq/stagehand @browserbasehq/sdk playwright zod
	```
	</Tab>
</Tabs>

### Add environment variables
Next, let's add the environment variables to a `.env` file.
```env
BROWSERBASE_API_KEY=your-browserbase-api-key
BROWSERBASE_PROJECT_ID=your-browserbase-project-id
OPENAI_API_KEY=your-openai-api-key
```

### Write a server action
Next, let's define our `main` function as a server action in `app/stagehand/main.ts`. This file will have the following three functions:

1. **`main`: Run the main Stagehand script**
2. **`runStagehand`: Initialize and run the `main` function**
3. **`startBBSSession`: Start a Browserbase session**

```ts app/stagehand/main.ts
// 🤘 Welcome to Stagehand!
// This file is from the [Stagehand docs](https://docs.stagehand.dev/sections/examples/nextjs).

"use server";

import { Stagehand } from "@browserbasehq/stagehand";
import { z } from "zod";
import { Browserbase } from "@browserbasehq/sdk";

/**
 * Run the main Stagehand script
 */
async function main(stagehand: Stagehand) {
  // You can use the `page` instance to write any Playwright code
  // For more info: https://playwright.dev/docs/pom
  const page = stagehand.context.activePage();

  // In this example, we'll get the title of the Stagehand quickstart page
  await page?.goto("https://docs.stagehand.dev/");
  await stagehand.act("click the quickstart link");
  const { title } = await stagehand.extract(
    "extract the main heading of the page",
    z.object({
      title: z.string(),
    }),
  );

  return title;
}

/**
 * Initialize and run the main() function
 */
export async function runStagehand(sessionId?: string) {
  const stagehand = new Stagehand({
    env: "BROWSERBASE",
    apiKey: process.env.BROWSERBASE_API_KEY,
    projectId: process.env.BROWSERBASE_PROJECT_ID,
    verbose: 1,
    logger: console.log,
    browserbaseSessionID: sessionId,
    disablePino: true,
  });
  await stagehand.init();
  const result = await main(stagehand);
  console.log(result);
  await stagehand.close();
}

/**
 * Start a Browserbase session
 */
export async function startBBSSession() {
  const browserbase = new Browserbase();
  const session = await browserbase.sessions.create({
    projectId: process.env.BROWSERBASE_PROJECT_ID!,
  });
  const debugUrl = await browserbase.sessions.debug(session.id);
  return {
    sessionId: session.id,
    debugUrl: debugUrl.debuggerFullscreenUrl,
  };
}
```

### Create a client component
Next, let's create a client component that will start a Browserbase session and run the `main` function with the server actions we just defined. We'll first create a Browserbase session and embed the session in an iframe before running the `main` function.

```tsx app/components/stagehandEmbed.tsx
"use client";

import { useCallback, useState } from "react";
import { runStagehand, startBBSSession } from "@/app/stagehand/main";

export function StagehandEmbed() {
  const [sessionId, setSessionId] = useState<string | null>(null);
  const [debugUrl, setDebugUrl] = useState<string | null>(null);

  const startSession = useCallback(async () => {
    const { sessionId, debugUrl } = await startBBSSession();
    setSessionId(sessionId);
    setDebugUrl(debugUrl);
    await runStagehand(sessionId);
  }, []);

  return (
    <div>
      {!sessionId && <button onClick={startSession}>Start Session</button>}
      {sessionId && debugUrl && (
        <iframe src={debugUrl} className="w-full h-full" />
      )}
    </div>
  );
}
```

### Use the `StagehandEmbed` component
Now, we can use the `StagehandEmbed` component in our app.

```tsx app/page.tsx
import { StagehandEmbed } from "@/app/components/stagehandEmbed";

export default function Home() {
	return (
		<main>
			<StagehandEmbed />
		</main>
	)
}
```

### Run the app
To run the app, you can use the following command:

<Tabs>
<Tab title="npm">
```bash
npm run dev
```
</Tab>
<Tab title="pnpm">
```bash
pnpm dev
```
</Tab>
<Tab title="yarn">
```bash
yarn dev
```
</Tab>
</Tabs>

### Deploy the app
To deploy the app, you can use the following commands. First, install the Vercel CLI:
<Tabs>
<Tab title="npm">
```bash
npm add -g vercel
```
</Tab>
<Tab title="pnpm">
```bash
pnpm add -g vercel
```
</Tab>
<Tab title="yarn">
```bash
yarn global add vercel
```
</Tab>
</Tabs>

Then, run the following command to deploy the app:
```bash
vercel
```

## References

<CardGroup cols={2}>
  <Card title="Deploy Template (v2)" icon="rocket" href="https://vercel.com/templates/ai/stagehand-next-js-quickstart">
    One‑click deploy the Stagehand Next.js template on Vercel (Stagehand v2)
  </Card>
  
  <Card title="Source Code (v2)" icon="github" href="https://github.com/browserbase/stagehand-nextjs-quickstart">
    Browse the complete template repository on GitHub (Stagehand v2)
  </Card>
</CardGroup>

================================================
FILE: packages/docs/v3/integrations/vercel/introduction.mdx
================================================
---
title: "Next.js + Vercel"
sidebarTitle: "Introduction"
description: "Build and deploy a Stagehand‑powered Next.js app to Vercel"
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


## Overview

The Stagehand + Next.js Quickstart is a production‑ready template that pairs Stagehand's AI browser automation with a modern Next.js app, deployable in one click on Vercel.

<CardGroup cols={3}>
  <Card title="Deploy Template" icon="rocket" href="https://vercel.com/templates/ai/stagehand-next-js-quickstart">
    One‑click deploy to Vercel with environment setup
  </Card>

  <Card title="Live Demo" icon="globe" href="https://stagehand-nextjs-quickstart.vercel.app">
    See the deployed template in action
  </Card>

  <Card title="Source Code" icon="github" href="https://github.com/browserbase/stagehand-nextjs-quickstart">
    Browse the repository on GitHub (Stagehand v2)
  </Card>
</CardGroup>

## What you get

<CardGroup cols={2}>
  <Card title="App Router project" icon="browser">
    Next.js App Router scaffold with Tailwind styling
  </Card>
  <Card title="Server‑safe automation" icon="shield-check">
    Uses Browserbase for cloud browsers (works on Vercel functions)
  </Card>
  <Card title="Prewired config" icon="gear">
    `stagehand.config.ts` with model + provider switching
  </Card>
  <Card title="Automation ready" icon="robot">
    Example usage of Stagehand primitives
  </Card>
</CardGroup>

## Requirements

- **Node 18+** locally
- **Model key**: OpenAI or Anthropic (or plug a custom client)
- **Browserbase keys**: `BROWSERBASE_API_KEY` and `BROWSERBASE_PROJECT_ID` for cloud browsers

<Tip>
Local Playwright browsers are not available on Vercel. Set Stagehand to Browserbase when deploying.
</Tip>

## Links

<CardGroup cols={2}>
  <Card title="Walkthrough" icon="rocket" href="/integrations/vercel/configuration">
    Run locally and deploy to Vercel in minutes
  </Card>
</CardGroup>


================================================
FILE: packages/docs/v3/migrations/python.mdx
================================================
---
title: Migrate Python v2 to v3
sidebarTitle: Migrate Python v2 to v3
description: Complete migration guide from Stagehand Python SDK v2 to the new Stainless-based v3 SDK
icon: 'snake'
---

This guide helps you migrate from the legacy Stagehand Python SDK to the new Stainless-based SDK with a **Bring Your Own Browser (BYOB)** architecture.

<Note>
The new Python SDK is a pure API client. You manage the browser yourself using Playwright, Selenium, Puppeteer, or any other browser automation tool. The SDK handles only the AI-powered operations.
</Note>

## Overview of Changes

<CardGroup cols={2}>
  <Card title="BYOB Architecture" icon="browser">
    You bring your own browser driver (Playwright, Selenium, etc.). The SDK is now a pure API client that handles AI-powered operations.
  </Card>
  <Card title="Session-Based API" icon="key">
    All operations require an explicit `session_id`. Start a session, perform operations, and end it when done.
  </Card>
  <Card title="Multi-Browser Control" icon="browsers">
    Scale browsers easily and control multiple browsers at once by passing the session ID for each browser you want to control.
  </Card>
  <Card title="Simplified Client" icon="code">
    Cleaner initialization with dedicated parameters for API keys and configuration.
  </Card>
</CardGroup>

### Current Limitations

<Warning>
The new SDK does **not yet support** custom Python LLM client classes (e.g., `model_client_options`).

Custom endpoints such as Bedrock or LLM proxies are supported, as long as they are OpenAI-API compatible.
</Warning>

---

## Step-by-Step Migration

### 1. Update Imports

<Tabs>
<Tab title="Old SDK (v2)">

```python
import asyncio
import logging
from stagehand import Stagehand, StagehandConfig, configure_logging

# Configure logging
configure_logging(
    level=logging.INFO,
    remove_logger_name=True,
    quiet_dependencies=True,
)
```

</Tab>
<Tab title="New SDK (v3)">

```python
import os
from playwright.sync_api import sync_playwright
from stagehand import Stagehand

# Note: Custom logging configuration is not yet supported.
# Use standard Python logging if needed:
import logging
logging.basicConfig(level=logging.INFO)
```

</Tab>
</Tabs>

---

### 2. Client Initialization

<Tabs>
<Tab title="Old SDK (v2)">

```python
config = StagehandConfig(
    env="BROWSERBASE",
    api_key=os.getenv("BROWSERBASE_API_KEY"),
    project_id=os.getenv("BROWSERBASE_PROJECT_ID"),
    headless=False,
    dom_settle_timeout_ms=3000,
    model_name="google/gemini-2.0-flash",
    self_heal=True,
    wait_for_captcha_solves=True,
    system_prompt="You are a browser automation assistant...",
    model_client_options={"apiKey": os.getenv("MODEL_API_KEY")},
    verbose=2,
)

stagehand = Stagehand(config)
await stagehand.init()
page = stagehand.page
```

</Tab>
<Tab title="New SDK (v3)">

```python
SDK_VERSION = "3.0.6"

# Create the Stagehand API client
client = Stagehand(
    browserbase_api_key=os.environ.get("BROWSERBASE_API_KEY"),
    browserbase_project_id=os.environ.get("BROWSERBASE_PROJECT_ID"),
    model_api_key=os.environ.get("MODEL_API_KEY"),
)

# Start a session (returns session metadata)
start_response = client.sessions.start(
    model_name="google/gemini-2.0-flash",
    x_language="python",
    x_sdk_version=SDK_VERSION,
)
session_id = start_response.data.session_id
print(f"Session started: {session_id}")

# Connect Playwright to the Browserbase session
playwright = sync_playwright().start()
browser = playwright.chromium.connect_over_cdp(
    f"wss://connect.browserbase.com?apiKey={os.environ['BROWSERBASE_API_KEY']}&sessionId={session_id}"
)
context = browser.contexts[0]
page = context.pages[0] if context.pages else context.new_page()
```

</Tab>
</Tabs>

<Info>
**Key differences:**
- Configuration options like `dom_settle_timeout_ms`, `self_heal`, `system_prompt`, and `verbose` are not available in the new SDK
- `model_name` is specified when starting a session, not in the config
- You must connect Playwright separately to interact with the page
</Info>

---

### 3. Navigation

<Tabs>
<Tab title="Old SDK (v2)">

```python
await page.goto("https://google.com/")
```

</Tab>
<Tab title="New SDK (v3) - Option A: Playwright">

```python
# Recommended for simple navigation
page.goto("https://google.com/")
```

</Tab>
<Tab title="New SDK (v3) - Option B: Stagehand API">

```python
# Use this if you need Stagehand to track navigation state
client.sessions.navigate(
    id=session_id,
    url="https://google.com/",
    frame_id="",  # Empty string for main frame
    x_language="python",
    x_sdk_version=SDK_VERSION,
)
```

</Tab>
</Tabs>

---

### 4. Direct Page Interactions (Playwright)

Any direct page manipulation should use Playwright's native API.

<Tabs>
<Tab title="Old SDK (v2)">

```python
# Click using Playwright locator (this was already Playwright)
await page.get_by_role("link", name="About", exact=True).click()

# Keyboard input
await page.keyboard.press("Enter")
```

</Tab>
<Tab title="New SDK (v3)">

```python
# Same Playwright API, but synchronous (or use async Playwright if preferred)
page.get_by_role("link", name="About", exact=True).click()

# Keyboard input
page.keyboard.press("Enter")
```

</Tab>
</Tabs>

<Note>
In the old SDK, `page` was a Stagehand-enhanced Playwright page. In the new SDK, `page` is a standard Playwright page. Direct Playwright methods work the same way.
</Note>

---

### 5. AI-Powered Actions (`act`)

<Tabs>
<Tab title="Old SDK (v2)">

```python
await page.act("search for openai")
```

</Tab>
<Tab title="New SDK (v3)">

```python
act_response = client.sessions.act(
    id=session_id,
    input="search for openai",
    x_language="python",
    x_sdk_version=SDK_VERSION,
)
print(f"Act completed: {act_response.data.result.message}")
```

</Tab>
</Tabs>

#### Acting on an Observed Element

<Tabs>
<Tab title="Old SDK (v2)">

```python
observed = await page.observe("find all articles")
if observed:
    await page.act(observed[0])
```

</Tab>
<Tab title="New SDK (v3)">

```python
observe_response = client.sessions.observe(
    id=session_id,
    instruction="find all articles",
    x_language="python",
    x_sdk_version=SDK_VERSION,
)
results = observe_response.data.result

if results:
    element = results[0]
    act_response = client.sessions.act(
        id=session_id,
        input=element,  # Pass the observed element directly
        x_language="python",
        x_sdk_version=SDK_VERSION,
    )
```

</Tab>
</Tabs>

---

### 6. Observing Elements (`observe`)

<Tabs>
<Tab title="Old SDK (v2)">

```python
observed = await page.observe("find all articles")
if len(observed) > 0:
    element = observed[0]
    print(f"Found element: {element}")
```

</Tab>
<Tab title="New SDK (v3)">

```python
observe_response = client.sessions.observe(
    id=session_id,
    instruction="find all articles",
    x_language="python",
    x_sdk_version=SDK_VERSION,
)
results = observe_response.data.result
print(f"Found {len(results)} possible actions")

if results:
    element = results[0]
    print(f"Found element: {element.description}")
```

</Tab>
</Tabs>

---

### 7. Extracting Data (`extract`)

<Tabs>
<Tab title="Old SDK (v2)">

```python
data = await page.extract("extract the first result from the search")
print(data.model_dump_json())
```

</Tab>
<Tab title="New SDK (v3)">

```python
extract_response = client.sessions.extract(
    id=session_id,
    instruction="extract the first result from the search",
    schema={
        "type": "object",
        "properties": {
            "title": {
                "type": "string",
                "description": "The title of the first search result"
            },
            "url": {
                "type": "string",
                "description": "The URL of the first search result"
            }
        },
        "required": ["title"]
    },
    x_language="python",
    x_sdk_version=SDK_VERSION,
)
extracted_data = extract_response.data.result
print(f"Extracted: {extracted_data}")
```

</Tab>
</Tabs>

<Warning>
**Key difference:** The new SDK requires an explicit JSON schema for extraction. This provides better type safety and clearer expectations for the AI model.
</Warning>

---

### 8. Closing the Session

<Tabs>
<Tab title="Old SDK (v2)">

```python
await stagehand.close()
```

</Tab>
<Tab title="New SDK (v3)">

```python
# Clean up Playwright resources
browser.close()
playwright.stop()

# End the Stagehand session
client.sessions.end(
    id=session_id,
    x_language="python",
    x_sdk_version=SDK_VERSION,
)
```

</Tab>
</Tabs>

<Tip>
**Important:** Always clean up both Playwright and the Stagehand session. Use a `try/finally` block to ensure cleanup happens even on errors.
</Tip>

---

### 9. Async vs Sync

<Tabs>
<Tab title="Old SDK (v2) - Async-first">

```python
async def main():
    stagehand = Stagehand(config)
    await stagehand.init()
    await stagehand.page.goto("https://example.com")
    await stagehand.close()

asyncio.run(main())
```

</Tab>
<Tab title="New SDK (v3) - Sync-first">

```python
def main():
    client = Stagehand(...)

    with sync_playwright() as playwright:
        # ... setup browser connection
        page.goto("https://example.com")
        # ... cleanup

main()
```

</Tab>
<Tab title="New SDK (v3) - Async">

```python
import asyncio
from playwright.async_api import async_playwright

async def main():
    client = Stagehand(...)  # Client is sync, but that's OK

    async with async_playwright() as playwright:
        browser = await playwright.chromium.connect_over_cdp(...)
        # ... async Playwright operations

asyncio.run(main())
```

</Tab>
</Tabs>

---

## Complete Migration Example

<Tabs>
<Tab title="Before (Old SDK)">

```python
import asyncio
import logging
import os

from dotenv import load_dotenv
from stagehand import Stagehand, StagehandConfig, configure_logging

configure_logging(level=logging.INFO, remove_logger_name=True, quiet_dependencies=True)
load_dotenv()

async def main():
    config = StagehandConfig(
        env="BROWSERBASE",
        api_key=os.getenv("BROWSERBASE_API_KEY"),
        project_id=os.getenv("BROWSERBASE_PROJECT_ID"),
        headless=False,
        model_name="google/gemini-2.0-flash",
        model_client_options={"apiKey": os.getenv("MODEL_API_KEY")},
        verbose=2,
    )

    stagehand = Stagehand(config)
    await stagehand.init()
    page = stagehand.page

    print(f"Session: {stagehand.session_id}")

    # Navigate
    await page.goto("https://google.com/")

    # Direct Playwright interaction
    await page.get_by_role("link", name="About", exact=True).click()

    # AI-powered action
    await page.goto("https://google.com/")
    await page.act("search for openai")
    await page.keyboard.press("Enter")

    # Observe and act
    observed = await page.observe("find all articles")
    if observed:
        await page.act(observed[0])

    # Extract data
    data = await page.extract("extract the first result")
    print(data.model_dump_json())

    await stagehand.close()

if __name__ == "__main__":
    asyncio.run(main())
```

</Tab>
<Tab title="After (New SDK)">

```python
import os
import logging

from dotenv import load_dotenv
from playwright.sync_api import sync_playwright
from stagehand import Stagehand

# Standard Python logging (custom Stagehand logging not yet supported)
logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)

load_dotenv()

SDK_VERSION = "3.0.6"

def main():
    # Create Stagehand API client
    client = Stagehand(
        browserbase_api_key=os.environ.get("BROWSERBASE_API_KEY"),
        browserbase_project_id=os.environ.get("BROWSERBASE_PROJECT_ID"),
        model_api_key=os.environ.get("MODEL_API_KEY"),
    )

    # Start a session
    start_response = client.sessions.start(
        model_name="google/gemini-2.0-flash",
        x_language="python",
        x_sdk_version=SDK_VERSION,
    )
    session_id = start_response.data.session_id
    logger.info(f"Session started: {session_id}")
    logger.info(f"View live: https://www.browserbase.com/sessions/{session_id}")

    # Connect Playwright to the Browserbase session
    with sync_playwright() as playwright:
        browser = playwright.chromium.connect_over_cdp(
            f"wss://connect.browserbase.com?apiKey={os.environ['BROWSERBASE_API_KEY']}&sessionId={session_id}"
        )
        context = browser.contexts[0]
        page = context.pages[0] if context.pages else context.new_page()

        try:
            # Navigate (using Playwright directly)
            page.goto("https://google.com/")
            logger.info("Navigated to Google")

            # Direct Playwright interaction
            page.get_by_role("link", name="About", exact=True).click()
            logger.info("Clicked About link")

            # Navigate back
            page.goto("https://google.com/")

            # AI-powered action (using Stagehand API)
            act_response = client.sessions.act(
                id=session_id,
                input="search for openai",
                x_language="python",
                x_sdk_version=SDK_VERSION,
            )
            logger.info(f"Act completed: {act_response.data.result.message}")

            # Keyboard input (using Playwright)
            page.keyboard.press("Enter")

            # Wait for results
            page.wait_for_timeout(2000)

            # Observe elements (using Stagehand API)
            observe_response = client.sessions.observe(
                id=session_id,
                instruction="find all articles",
                x_language="python",
                x_sdk_version=SDK_VERSION,
            )
            results = observe_response.data.result

            if results:
                element = results[0]
                logger.info(f"Found element: {element.description}")

                # Act on observed element
                client.sessions.act(
                    id=session_id,
                    input=element,
                    x_language="python",
                    x_sdk_version=SDK_VERSION,
                )
            else:
                logger.warning("No elements found")

            # Extract data (using Stagehand API with schema)
            extract_response = client.sessions.extract(
                id=session_id,
                instruction="extract the first result from the search",
                schema={
                    "type": "object",
                    "properties": {
                        "title": {"type": "string", "description": "Result title"},
                        "url": {"type": "string", "description": "Result URL"},
                        "snippet": {"type": "string", "description": "Result snippet"},
                    },
                    "required": ["title"],
                },
                x_language="python",
                x_sdk_version=SDK_VERSION,
            )
            logger.info(f"Extracted data: {extract_response.data.result}")

        finally:
            # Clean up Playwright
            browser.close()

            # End the Stagehand session
            client.sessions.end(
                id=session_id,
                x_language="python",
                x_sdk_version=SDK_VERSION,
            )
            logger.info("Session ended")

if __name__ == "__main__":
    main()
```

</Tab>
</Tabs>

---

## Quick Reference: Method Mapping

| Old SDK | New SDK |
|---------|---------|
| `Stagehand(config)` | `Stagehand(browserbase_api_key=..., ...)` |
| `await stagehand.init()` | `client.sessions.start(...)` |
| `stagehand.page` | Connect Playwright separately |
| `stagehand.session_id` | `start_response.data.session_id` |
| `await page.goto(url)` | `page.goto(url)` (Playwright) |
| `await page.act(instruction)` | `client.sessions.act(id=session_id, input=instruction, ...)` |
| `await page.observe(instruction)` | `client.sessions.observe(id=session_id, instruction=..., ...)` |
| `await page.extract(instruction)` | `client.sessions.extract(id=session_id, instruction=..., schema=..., ...)` |
| `await stagehand.close()` | `browser.close()` + `client.sessions.end(id=session_id, ...)` |
| `configure_logging(...)` | Use standard `logging` module |

---

## Troubleshooting

<AccordionGroup>
  <Accordion title="Session not found errors">
    Ensure you're using the correct `session_id` returned from `client.sessions.start()`.
  </Accordion>
  
  <Accordion title="Playwright connection issues">
    Make sure your Browserbase API key has the correct permissions and the session is still active.
  </Accordion>
  
  <Accordion title="Missing x_language and x_sdk_version parameters">
    These are required for all session operations. Use `x_language="python"` and `x_sdk_version="3.0.6"` (or the latest version).
  </Accordion>
  
  <Accordion title="Extraction returns unexpected format">
    The new SDK requires an explicit JSON schema. Make sure your schema matches the expected output structure.
  </Accordion>
</AccordionGroup>

---

## Need Help?

<CardGroup cols={3}>
  <Card title="Documentation" icon="book" href="https://docs.stagehand.dev/">
    Full Stagehand documentation
  </Card>
  <Card title="Browserbase Docs" icon="server" href="https://docs.browserbase.com/">
    Browserbase documentation
  </Card>
  <Card title="GitHub Issues" icon="github" href="https://github.com/browserbase/stagehand-python/issues">
    Report issues or get help
  </Card>
</CardGroup>


================================================
FILE: packages/docs/v3/migrations/v2.mdx
================================================
---
title: Migrate TypeScript v2 to v3
sidebarTitle: Migrate TypeScript v2 to v3
description: Complete migration guide from Stagehand TypeScript SDK v2 to v3
icon: 'arrow-up-right-dots'
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


## Recommended Migration Process

1. **Backup your project**. If you use a version control system, make sure all previous versions are committed.
2. **Upgrade to Stagehand v3**.
3. Follow the breaking changes guide below.
4. Verify your project is working as expected.
5. Commit your changes.

## Stagehand v3 Package Version

Update your `package.json` to use Stagehand v3:

```bash Bash
npm install @browserbasehq/stagehand@latest
```

## Overview of Major Changes

Stagehand v3 introduces significant improvements to the API design and functionality:

- **Removing Playwright Dependency**: Stagehand v3 is now a standalone library that does not depend on Playwright. **You can still use Stagehand with Playwright, check out our [Playwright integration](/v3/integrations/playwright) for more details.**
- **Simplified Method Signatures**: Cleaner, more intuitive parameter structures.
- **Unified Model Configuration**: Model configuration is now consolidated into a single `model` parameter.
- **Automatic iframe & Shadow DOM Support**: No more manual flags required.
- **Improved Type Safety**: Better TypeScript inference and type checking.
- **Enhanced Multi-Page Support**: New Context API for managing multiple pages.
- **Streamlined Timeouts**: Consistent timeout naming across all methods.
- **Auto-caching**: Stagehand v3 now automatically caches actions and agent steps using the [file system cache](/best-practices/caching).
- **Agent Improvements**: Renamed parameters (`instructions` → `systemPrompt`), unified model configuration, and new `executionModel` option for cost optimization.


## Breaking Changes

### Stagehand Initialization

#### Model Configuration Consolidation

The `modelName` and `modelClientOptions` parameters have been unified into a single `model` parameter.

```typescript Stagehand v2 icon="/images/typescript.svg"
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "BROWSERBASE",
  apiKey: process.env.BROWSERBASE_API_KEY,
  projectId: process.env.BROWSERBASE_PROJECT_ID,
  modelName: "openai/gpt-5",
  modelClientOptions: {
    apiKey: process.env.OPENAI_API_KEY,
    baseURL: "https://custom-proxy.com/v1"
  }
});
```

```typescript Stagehand v3 icon="/images/typescript.svg"
import { Stagehand } from "@browserbasehq/stagehand";

// Option 1: String format (recommended for simplicity, auto-loads model API key from env)
const stagehand = new Stagehand({
  env: "BROWSERBASE",
  apiKey: process.env.BROWSERBASE_API_KEY,
  projectId: process.env.BROWSERBASE_PROJECT_ID,
  model: "openai/gpt-5"
});

// Option 2: Object format (for advanced configuration)
const stagehand = new Stagehand({
  env: "BROWSERBASE",
  apiKey: process.env.BROWSERBASE_API_KEY,
  projectId: process.env.BROWSERBASE_PROJECT_ID,
  model: {
    modelName: "openai/gpt-5",
    apiKey: process.env.OPENAI_API_KEY,
    baseURL: "https://custom-proxy.com/v1"
  }
});
```

#### DOM Settle Timeout Rename

The `domSettleTimeoutMs` parameter has been renamed to `domSettleTimeout` for consistency.

```typescript Stagehand v2 icon="/images/typescript.svg"
const stagehand = new Stagehand({
  env: "LOCAL",
  domSettleTimeoutMs: 5000
});
```

```typescript Stagehand v3 icon="/images/typescript.svg"
const stagehand = new Stagehand({
  env: "LOCAL",
  domSettleTimeout: 5000
});
```

#### Changes to return value of `stagehand.init()`

In v2, `init()` returned an object containing `debugUrl`, `sessionUrl`, and `sessionId`.

```typescript Stagehand v2 icon="/images/typescript.svg"
const result = await stagehand.init();
console.log(result);
```
In `v2`, the returned object contains:
```
{
  debugUrl: 'https://www.browserbase.com/devtools/inspector.html?wss=connect.browserbase.com/debug/f8a21b4a-6fa1-4ab9-9007-fbfe61dc14f0/devtools/page/5474B0E0510C5B6E629BEB06E799CD70?debug=true',
  sessionUrl: 'https://www.browserbase.com/sessions/f8a21b4a-6fa1-4ab9-9007-fbfe61dc14f0',
  sessionId: 'f8a21b4a-6fa1-4ab9-9007-fbfe61dc14f0'
}
```
In `v3` the return value is `Promise<void>`. The `sessionId`, `sessionUrl`, and `debugUrl` are now directly accessible via the stagehand object:
```typescript Stagehand v3 icon="/images/typescript.svg"
console.log("debugUrl: ", stagehand.browserbaseDebugURL)
console.log("sessionUrl: ", stagehand.browserbaseSessionURL)
console.log("sessionId: ", stagehand.browserbaseSessionID)
```
Example output:
```
debugUrl: 'https://www.browserbase.com/devtools/inspector.html?wss=connect.browserbase.com/debug/f8a21b4a-6fa1-4ab9-9007-fbfe61dc14f0/devtools/page/5474B0E0510C5B6E629BEB06E799CD70?debug=true',
sessionUrl: 'https://www.browserbase.com/sessions/f8a21b4a-6fa1-4ab9-9007-fbfe61dc14f0',
sessionId: 'f8a21b4a-6fa1-4ab9-9007-fbfe61dc14f0'
```

#### Caching Changes

The `enableCaching` boolean has been replaced with a `cacheDir` string for more flexible cache management.

```typescript Stagehand v2 icon="/images/typescript.svg"
const stagehand = new Stagehand({
  env: "LOCAL",
  enableCaching: true
});
```

```typescript Stagehand v3 icon="/images/typescript.svg"
const stagehand = new Stagehand({
  env: "LOCAL",
  cacheDir: "./stagehand-cache"  // Specify cache directory
});
```

#### Page Access Changes

Direct page access has changed to use the Context API.

```typescript Stagehand v2 icon="/images/typescript.svg"
const stagehand = new Stagehand({ env: "LOCAL" });
await stagehand.init();

// Direct page access
const page = stagehand.page;
await page.goto("https://example.com");
```

```typescript Stagehand v3 icon="/images/typescript.svg"
const stagehand = new Stagehand({ env: "LOCAL" });
await stagehand.init();

// Access via context
const page = stagehand.context.pages()[0];
await page.goto("https://example.com");

// Or `await` the active page
const activePage = await stagehand.context.awaitActivePage();
await activePage.goto("https://example.com");
```

### Context and Multi-Page Management

#### New Context API

v3 introduces a structured Context API for managing multiple pages.

```typescript Stagehand v2 icon="/images/typescript.svg"
const stagehand = new Stagehand({ env: "LOCAL" });
await stagehand.init();

// Limited multi-page support
const page = stagehand.page;
```

```typescript Stagehand v3 icon="/images/typescript.svg"
const stagehand = new Stagehand({ env: "LOCAL" });
await stagehand.init();

// Access all pages
const pages = stagehand.context.pages();
const mainPage = pages[0];

// Create new page
const newPage = await stagehand.context.newPage();

// Set active page
stagehand.context.setActivePage(newPage);

// implicitly takes action on newPage
await stagehand.act("click button");
```

### act() Method Changes

#### Method Signature Simplification

The `action` parameter has been removed from `ActOptions`. Now you only pass the instruction as a string.

```typescript Stagehand v2 icon="/images/typescript.svg"
await page.act({
  action: "click the login button",
  modelName: "openai/gpt-5-mini",
  variables: { username: "john" },
  timeoutMs: 10000,
  domSettleTimeoutMs: 5000,
  iframes: true
});
```

```typescript Stagehand v3 icon="/images/typescript.svg"
// Clean, simple string instruction
await stagehand.act("click the login button");

// With options
await stagehand.act("click the login button", {
  model: "openai/gpt-5-mini",
  variables: { username: "john" },
  timeout: 10000,
  page: page  // Optional: specify which page
});
```

<Note>
**Method Location Change**: In v3, `act()` is called on the `stagehand` instance, not the `page` object.
</Note>

#### Model Configuration in act()

Model configuration follows the same pattern as initialization.

```typescript Stagehand v2 icon="/images/typescript.svg"
await page.act({
  action: "fill the form",
  modelName: "anthropic/claude-sonnet-4-5",
  modelClientOptions: {
    apiKey: process.env.ANTHROPIC_API_KEY
  }
});
```

```typescript Stagehand v3 icon="/images/typescript.svg"
// String format
await stagehand.act("fill the form", {
  model: "anthropic/claude-sonnet-4-5"
});

// Object format
await stagehand.act("fill the form", {
  model: {
    modelName: "anthropic/claude-sonnet-4-5",
    apiKey: process.env.ANTHROPIC_API_KEY
  }
});
```

#### Timeout Parameter Rename

`timeoutMs` has been renamed to `timeout`.

```typescript Stagehand v2 icon="/images/typescript.svg"
await page.act({
  action: "click button",
  timeoutMs: 15000
});
```

```typescript Stagehand v3 icon="/images/typescript.svg"
await stagehand.act("click button", {
  timeout: 15000
});
```

#### Automatic iframe Support

The `iframes` flag has been removed. iframe support is now automatic.

```typescript Stagehand v2 icon="/images/typescript.svg"
await page.act({
  action: "click button inside iframe",
  iframes: true  // Required to interact with iframes
});
```

```typescript Stagehand v3 icon="/images/typescript.svg"
// Automatic iframe support - no flag needed
await stagehand.act("click button inside iframe");
```

<Note>
**Automatic Support**: Stagehand v3 automatically handles iframe and Shadow DOM interactions without requiring explicit flags.
</Note>

#### Result Structure Changes

The `ActResult` structure has been enhanced with more detailed information.

```typescript Stagehand v2 icon="/images/typescript.svg"
const result = await page.act("click the button");
console.log(result.action);  // Single action string
```

```typescript Stagehand v3 icon="/images/typescript.svg"
const result = await stagehand.act("click the button");
console.log(result.actionDescription);  // Overall description
console.log(result.actions);  // Array of action details

// ActResult structure:
// {
//   success: boolean;
//   message: string;
//   actionDescription: string;
//   actions: Array<{
//     selector: string;
//     description: string;
//     method?: string;
//     arguments?: string[];
//   }>;
// }
```

### extract() Method Changes

#### Method Location and Signature

`extract()` has moved from the page object to the stagehand instance, with a cleaner parameter structure.

```typescript Stagehand v2 icon="/images/typescript.svg"
import { z } from "zod";

const result = await page.extract({
  instruction: "extract product details",
  schema: z.object({
    name: z.string(),
    price: z.number()
  }),
  modelName: "openai/gpt-5",
  domSettleTimeoutMs: 5000,
  selector: "xpath=/html/body/div",
  iframes: true
});
```

```typescript Stagehand v3 icon="/images/typescript.svg"
import { z } from "zod";

// Cleaner parameter structure
const result = await stagehand.extract(
  "extract product details",
  z.object({
    name: z.string(),
    price: z.number()
  }),
  {
    model: "openai/gpt-5",
    selector: ".container", // NEW: CSS selector support
    timeout: 10000,
    page: page  // Optional: specify which page
  }
);
```

<Note>
**Parameter Order**: In v3, `instruction` and `schema` are separate positional parameters, with `options` as an optional third parameter.
</Note>

#### Extract Without Schema

Schema-less extraction also has a simpler interface.

```typescript Stagehand v2 icon="/images/typescript.svg"
// String instruction
const result = await page.extract("get the page title");
// Returns: { extraction: "Page Title" }

// Raw page content
const content = await page.extract();
// Returns: { page_text: "..." }
```

```typescript Stagehand v3 icon="/images/typescript.svg"
// String instruction
const result = await stagehand.extract("get the page title");
// Returns: { extraction: "Page Title" }

// Raw page content
const content = await stagehand.extract();
// Returns: { pageText: "..." }
```

#### Model Configuration in extract()

```typescript Stagehand v2 icon="/images/typescript.svg"
const data = await page.extract({
  instruction: "extract data",
  schema: DataSchema,
  modelName: "anthropic/claude-sonnet-4-5",
  modelClientOptions: {
    apiKey: process.env.ANTHROPIC_API_KEY
  }
});
```

```typescript Stagehand v3 icon="/images/typescript.svg"
const data = await stagehand.extract(
  "extract data",
  DataSchema,
  {
    model: "anthropic/claude-sonnet-4-5"
  }
);
```

#### Automatic iframe Support

```typescript Stagehand v2 icon="/images/typescript.svg"
const data = await page.extract({
  instruction: "extract data from iframe",
  schema: DataSchema,
  iframes: true  // Required for iframe content
});
```

```typescript Stagehand v3 icon="/images/typescript.svg"
// Automatic iframe support
const data = await stagehand.extract(
  "extract data from iframe",
  DataSchema
);
```

#### Array Schema Changes

Array extraction now has a more ergonomic syntax.

```typescript Stagehand v2 icon="/images/typescript.svg"
import { z } from "zod";

// Had to wrap array in object
const ApartmentListingsSchema = z.object({
  apartments: z.array(z.object({
    address: z.string(),
    price: z.string(),
    bedrooms: z.number()
  }))
});

const result = await page.extract({
  instruction: "extract all apartment listings",
  schema: ApartmentListingsSchema
});

// Access via: result.apartments
```

```typescript Stagehand v3 icon="/images/typescript.svg"
import { z } from "zod";

// Can use array schema directly
const ApartmentListingsSchema = z.array(
  z.object({
    address: z.string(),
    price: z.string(),
    bedrooms: z.number()
  })
);

const result = await stagehand.extract(
  "extract all apartment listings",
  ApartmentListingsSchema
);

// Result is directly the array
console.log(result[0].address);
```

### observe() Method Changes

#### Method Signature Updates

```typescript Stagehand v2 icon="/images/typescript.svg"
const results = await page.observe({
  instruction: "find all buttons",
  modelName: "openai/gpt-5",
  domSettleTimeoutMs: 5000,
  drawOverlay: true,
  iframes: true
});
```

```typescript Stagehand v3 icon="/images/typescript.svg"
const results = await stagehand.observe("find all buttons", {
  model: "openai/gpt-5",
  timeout: 10000,
  selector: ".container",  // NEW: scope observation to selector
  page: page  // Optional: specify which page
});
```

<Note>
**Method Location Change**: Like `act()` and `extract()`, `observe()` is now called on the `stagehand` instance.
</Note>

#### Draw Overlay Removed

The `drawOverlay` option has been removed in v3.

```typescript Stagehand v2 icon="/images/typescript.svg"
const results = await page.observe({
  instruction: "find buttons",
  drawOverlay: true  // Visual debugging
});
```

```typescript Stagehand v3 icon="/images/typescript.svg"
// drawOverlay is no longer available
const results = await stagehand.observe("find buttons");
```

#### Automatic iframe Support

```typescript Stagehand v2 icon="/images/typescript.svg"
const results = await page.observe({
  instruction: "find elements in iframe",
  iframes: true
});
```

```typescript Stagehand v3 icon="/images/typescript.svg"
// Automatic iframe support
const results = await stagehand.observe("find elements in iframe");
```

#### Observe with act() Integration

The observe → act workflow remains similar but with updated method signatures.

```typescript Stagehand v2 icon="/images/typescript.svg"
const [action] = await page.observe("find the login button");
await page.act(action);
```

```typescript Stagehand v3 icon="/images/typescript.svg"
const [action] = await stagehand.observe("find the login button");
await stagehand.act(action);
```

### agent() Method Changes

#### Agent Configuration Updates

The agent configuration has been significantly restructured in v3 with renamed parameters and new capabilities.

```typescript Stagehand v2 icon="/images/typescript.svg"
const agent = stagehand.agent({
  provider: "google",
  model: "gemini-2.5-computer-use-preview-10-2025",
  instructions: "You are a helpful assistant that can navigate websites.",
  options: {
    apiKey: process.env.GEMINI_API_KEY
  },
  integrations: ["https://mcp-server.example.com"],
  tools: customTools
});
```

```typescript Stagehand v3 icon="/images/typescript.svg"
const agent = stagehand.agent({
  model: "google/gemini-2.5-computer-use-preview-10-2025",  // Provider now in model string
  systemPrompt: "You are a helpful assistant that can navigate websites.",  // Renamed from 'instructions'
  mode: "cua",  // Computer Use Agent mode
  integrations: ["https://mcp-server.example.com"],
  tools: customTools
});
```

<Note>
**Key Changes**:
- `provider` removed - now part of the model string (e.g., `"anthropic/claude-sonnet-4-5"`)
- `instructions` renamed to `systemPrompt`
- `options` removed - use model object format for advanced configuration
- `executionModel` added - specify a different model for tool execution
- `mode` added - set `mode: "cua"` to enable Computer Use Agent mode (the boolean `cua` flag is deprecated)
</Note>

#### Model Configuration in agent()

Model configuration follows the same unified pattern as other methods.

```typescript Stagehand v2 icon="/images/typescript.svg"
const agent = stagehand.agent({
  provider: "google",
  model: "gemini-2.5-computer-use-preview-10-2025",
  options: {
    apiKey: process.env.GEMINI_API_KEY,
    baseURL: "https://custom-proxy.com/v1"
  }
});
```

```typescript Stagehand v3 icon="/images/typescript.svg"
// String format (recommended)
const agent = stagehand.agent({
  model: "google/gemini-2.5-computer-use-preview-10-2025"
});

// Object format for advanced configuration
const agent = stagehand.agent({
  model: {
    modelName: "google/gemini-2.5-computer-use-preview-10-2025",
    apiKey: process.env.GEMINI_API_KEY,
    baseURL: "https://custom-proxy.com/v1"
  }
});
```

#### Execute Method Changes

The `execute()` method has been simplified with some options removed and new ones added.

```typescript Stagehand v2 icon="/images/typescript.svg"
const result = await agent.execute({
  instruction: "Search for products",
  maxSteps: 20,
  autoScreenshot: true,
  waitBetweenActions: 1000,
  context: "Focus on electronics category"
});
```

```typescript Stagehand v3 icon="/images/typescript.svg"
const result = await agent.execute({
  instruction: "Search for products",
  maxSteps: 20,
  page: page,  // NEW: specify which page to operate on
  highlightCursor: true  // NEW: visual cursor for debugging
});
```

<Warning>
**Removed Options**:
- `autoScreenshot` - no longer available
- `waitBetweenActions` - no longer available
- `context` - use the `systemPrompt` in agent config instead
</Warning>

#### Execution Model Configuration

v3 introduces a new `executionModel` option to use a different (often faster/cheaper) model for tool execution.

```typescript Stagehand v3 icon="/images/typescript.svg"
const agent = stagehand.agent({
  model: "anthropic/claude-sonnet-4-5",  // Main reasoning model
  executionModel: "anthropic/claude-haiku-4-5"  // Faster model for tool execution (act, extract, observe)
});

// The agent will use claude-sonnet-4-5 for high-level reasoning
// but claude-haiku-4-5 for executing individual actions
const result = await agent.execute("Complete the checkout process");
```

#### Agent with Multi-Page Support

v3 agents can now specify which page to operate on.

```typescript Stagehand v3 icon="/images/typescript.svg"
const page1 = stagehand.context.pages()[0];
const page2 = await stagehand.context.newPage();

const agent = stagehand.agent({
  model: "google/gemini-2.5-computer-use-preview-10-2025"
});

// Execute on specific page
await page2.goto("https://example.com/dashboard");
const result = await agent.execute({
  instruction: "Export the data table",
  page: page2  // Operate on page2 instead of default page
});
```

### History and Metrics

#### History API

`stagehand.history` is now asynchronous: it returns a promise, so it must be awaited.

```typescript Stagehand v2 icon="/images/typescript.svg"
const history = stagehand.history;
```

```typescript Stagehand v3 icon="/images/typescript.svg"
const history = await stagehand.history;
```

#### Metrics API

`stagehand.metrics` is now asynchronous: it returns a promise, so it must be awaited.

```typescript Stagehand v2 icon="/images/typescript.svg"
const metrics = stagehand.metrics;
```

```typescript Stagehand v3 icon="/images/typescript.svg"
const metrics = await stagehand.metrics;
```

## Complete Migration Example

Here's a complete example showing a full migration:

<Tabs>
<Tab title="Stagehand v2">

```typescript
import { Stagehand } from "@browserbasehq/stagehand";
import { z } from "zod";

// Initialize
const stagehand = new Stagehand({
  env: "BROWSERBASE",
  apiKey: process.env.BROWSERBASE_API_KEY,
  projectId: process.env.BROWSERBASE_PROJECT_ID,
  modelName: "openai/gpt-5",
  modelClientOptions: {
    apiKey: process.env.OPENAI_API_KEY
  },
  enableCaching: true,
  domSettleTimeoutMs: 5000
});

await stagehand.init();
const page = stagehand.page;

// Navigate
await page.goto("https://example.com");

// Act
await page.act({
  action: "click the login button",
  timeoutMs: 10000,
  iframes: true
});

// Extract
const ProductSchema = z.object({
  name: z.string(),
  price: z.number(),
  inStock: z.boolean()
});

const product = await page.extract({
  instruction: "extract product details",
  schema: ProductSchema,
  domSettleTimeoutMs: 5000,
  iframes: true
});

// Observe
const actions = await page.observe({
  instruction: "find all buttons",
  drawOverlay: false,
  iframes: true
});

await stagehand.close();
```

</Tab>
<Tab title="Stagehand v3">

```typescript
import { Stagehand } from "@browserbasehq/stagehand";
import { z } from "zod";

// Initialize - simplified configuration
const stagehand = new Stagehand({
  env: "BROWSERBASE",
  apiKey: process.env.BROWSERBASE_API_KEY,
  projectId: process.env.BROWSERBASE_PROJECT_ID,
  model: "openai/gpt-5",  // Unified model configuration
  cacheDir: "./cache",      // Flexible cache directory
  domSettleTimeout: 5000    // Consistent naming
});

await stagehand.init();
const page = stagehand.context.pages()[0];  // Context API

// Navigate
await page.goto("https://example.com");

// Act - cleaner interface, automatic iframe support
await stagehand.act("click the login button", {
  timeout: 10000
  // No iframes flag needed - automatic!
});

// Extract - cleaner parameter order
const ProductSchema = z.object({
  name: z.string(),
  price: z.number(),
  inStock: z.boolean()
});

const product = await stagehand.extract(
  "extract product details",
  ProductSchema
  // Automatic iframe support, no extra flags needed
);

// Observe - simplified
const actions = await stagehand.observe("find all buttons");
// Automatic iframe support

// Get metrics
const metrics = await stagehand.metrics;
console.log('Total tokens used:',
  metrics.totalPromptTokens + metrics.totalCompletionTokens);

await stagehand.close();
```

</Tab>
</Tabs>

## Quick Reference: Breaking Changes

<Expandable title="Stagehand Initialization">

| Feature | Stagehand v2 | Stagehand v3 |
|---------|--------------|--------------|
| **Model Config** | `modelName` + `modelClientOptions` | `model: "provider/model"` or `{ modelName, apiKey, baseURL }` |
| **DOM Settle** | `domSettleTimeoutMs` | `domSettleTimeout` |
| **Caching** | `enableCaching: boolean` | `cacheDir: string` |
| **Page Access** | `stagehand.page` | `stagehand.context.pages()[0]` |

</Expandable>

<Expandable title="act()">

| Feature | Stagehand v2 | Stagehand v3 |
|---------|--------------|--------------|
| **Method location** | `page.act()` | `stagehand.act()` |
| **Parameters** | `{ action, ...options }` | `(instruction, options?)` |
| **Timeout** | `timeoutMs` | `timeout` |
| **Result structure** | `{ action }` | `{ actionDescription, actions[] }` |

</Expandable>

<Expandable title="extract()">

| Feature | Stagehand v2 | Stagehand v3 |
|---------|--------------|--------------|
| **Method location** | `page.extract()` | `stagehand.extract()` |
| **Parameters** | `{ instruction, schema, ...options }` | `(instruction, schema, options?)` |

</Expandable>

<Expandable title="observe()">

| Feature | Stagehand v2 | Stagehand v3 |
|---------|--------------|--------------|
| **Method location** | `page.observe()` | `stagehand.observe()` |
| **Draw overlay** | `drawOverlay: boolean` | Removed |

</Expandable>

<Expandable title="agent()">

| Feature | Stagehand v2 | Stagehand v3 |
|---------|--------------|--------------|
| **Provider** | `provider: "openai" \| "anthropic"` | Part of model string |
| **Instructions** | `instructions: string` | `systemPrompt: string` |
| **Model** | `model: "model-name"` | `model: "provider/model-name"` |
| **Options** | `options: Record<string, unknown>` | Use model object format |
| **Execute params** | `autoScreenshot`, `waitBetweenActions`, `context` | Removed; added `page`, `highlightCursor` |

</Expandable>

<Expandable title="Automatic Features">

| Feature | Stagehand v2 | Stagehand v3 |
|---------|--------------|--------------|
| **iframe support** | `iframes: true` flag required | Automatic (no flag needed) |
| **Shadow DOM** | Manual handling | Automatic (no flag needed) |

</Expandable>

<Expandable title="Properties & Methods">

| Feature | Stagehand v2 | Stagehand v3 |
|---------|--------------|--------------|
| **History** | `stagehand.history` | `await stagehand.history` |
| **Metrics** | `stagehand.metrics` | `await stagehand.metrics` |

</Expandable>

## Troubleshooting

### Error: Cannot find property 'page' on Stagehand instance

**Problem**: Accessing `stagehand.page` directly is not supported in Stagehand v3.

**Solution**: Use the Context API or `await` the active page:

```typescript
// Use context API (recommended)
const page = stagehand.context.pages()[0];

// Or grab the active page
const page = await stagehand.context.awaitActivePage();
```

### Error: act() method not found on page

**Problem**: v3 moved `act()`, `extract()`, and `observe()` to the stagehand instance.

**Solution**: Call these methods on the stagehand instance:

```typescript
// v2 ❌
await page.act("click button");

// v3 ✅
await stagehand.act("click button");
```

### TypeScript: Model configuration type errors

**Problem**: TypeScript errors with model configuration.

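**Solution**: Pass `model` either as a `"provider/model"` string or as an object with `modelName` (plus optional `apiKey` and `baseURL`):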

```typescript
// String format
model: "openai/gpt-5"

// Object format
model: {
  modelName: "openai/gpt-5",
  apiKey: process.env.OPENAI_API_KEY
}
```

### Agent configuration errors

**Problem**: Using old `provider` and `instructions` parameters.

**Solution**: Update to v3 format:

```typescript
// v2 ❌
const agent = stagehand.agent({
  provider: "anthropic",
  model: "claude-sonnet-4-5",
  instructions: "You are a helpful assistant that..."
});

// v3 ✅
const agent = stagehand.agent({
  model: "anthropic/claude-sonnet-4-5",
  systemPrompt: "You are a helpful assistant that..."
});
```

### Agent execute options not recognized

**Problem**: Using removed options like `autoScreenshot`, `waitBetweenActions`, or `context`.

**Solution**: Remove these options and use v3 alternatives:

```typescript
// v2 ❌
await agent.execute({
  instruction: "task",
  autoScreenshot: true,
  waitBetweenActions: 1000,
  context: "additional context"
});

// v3 ✅
const agent = stagehand.agent({
  model: "google/gemini-2.5-computer-use-preview-10-2025",
  systemPrompt: "Your context here."  // Move context to systemPrompt
});

await agent.execute({
  instruction: "task",
  highlightCursor: true  // Use new option for visual feedback
});
```

## Best Practices for v3

1. **Use the string model format** for simplicity: `model: "openai/gpt-5"`
2. **Leverage automatic iframe support** - remove all `iframes` flags
3. **Use the Context API** for multi-page scenarios
4. **Monitor metrics** to track token usage and optimize costs
5. **Use history** for debugging and understanding automation flow
6. **Set appropriate timeouts** based on your use case
7. **Specify cache directory** to improve performance for repeated actions
8. **Use executionModel for agents** - configure a faster/cheaper model for tool execution while keeping a powerful model for reasoning (e.g., `model: "anthropic/claude-sonnet-4-5"`, `executionModel: "google/gemini-2.0-flash"`)

## Additional Resources

- [Stagehand v3 Documentation](/v3/first-steps/introduction)
- [API Reference](/v3/references/stagehand)
- [Best Practices](/v3/best-practices/caching)
- [GitHub Issues](https://github.com/browserbase/stagehand/issues)

If you encounter any issues during migration, please [open an issue](https://github.com/browserbase/stagehand/issues) on our GitHub repository.


================================================
FILE: packages/docs/v3/references/act.mdx
================================================
---
title: act()
description: 'Complete API reference for the act() method'
icon: 'arrow-pointer'
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


<CardGroup cols={1}>
<Card title="Act" icon="arrow-pointer" href="/v3/basics/act">
  See how to use act() to perform browser actions
</Card>
</CardGroup>

### Method Signatures

<Tabs>
<Tab title="TypeScript">

```typescript
// String instruction only
await stagehand.act(instruction: string): Promise<ActResult>

// Action only - Deterministic (no LLM)
await stagehand.act(action: Action): Promise<ActResult>

// String instruction with options
await stagehand.act(instruction: string, options: ActOptions): Promise<ActResult>

```

**Action Interface:**
```typescript
interface Action {
  selector: string;
  description: string;
  method: string;
  arguments: string[];
}
```

**ActOptions Interface:**
```typescript
interface ActOptions {
  model?: ModelConfiguration;
  variables?: Record<string, VariableValue>;
  timeout?: number;
  page?: PlaywrightPage | PuppeteerPage | PatchrightPage | Page;
  serverCache?: boolean;
}

// VariableValue can be a simple primitive or a rich object:
type VariableValue =
  | string
  | number
  | boolean
  | { value: string | number | boolean; description?: string };

// ModelConfiguration can be either a string or an object
type ModelConfiguration =
  | string  // Format: "provider/model" (e.g., "openai/gpt-4o", "anthropic/claude-sonnet-4-6")
  | {
      modelName: string;  // The model name
      apiKey?: string;    // Optional: API key override
      baseURL?: string;   // Optional: Base URL override
      // Additional provider-specific options
    }
```

</Tab>

</Tabs>

### Parameters

<ParamField path="instruction | action" type="string | Action" required>
  - **Instruction**: Natural language description of the action to perform. Use `%variableName%` syntax to reference variables.
  - **Action**: A deterministic action to perform: 
  <Expandable title="Action">
    <ParamField path="selector" type="string" required>
      The selector (XPath, CSS selector, etc.) used to target the element
    </ParamField>
    <ParamField path="description" type="string" required>
      Description of the action - used for self-healing
    </ParamField>
    <ParamField path="method" type="string" required>
      The method used (e.g., "click", "fill", "type")
    </ParamField>
    <ParamField path="arguments" type="string[]" required>
      Arguments passed to the method
    </ParamField>
  </Expandable>
</ParamField>

<ParamField path="model" type="ModelConfiguration" optional>
  Configure the AI model to use for this action. Can be either:
  - A string in the format `"provider/model"` (e.g., `openai/gpt-5`, `google/gemini-2.5-flash`)
  - An object with detailed configuration

  <Expandable title="Model Configuration Object">
    <ParamField path="modelName" type="string" required>
      The model name (e.g., `anthropic/claude-sonnet-4-5`, `google/gemini-2.5-flash`)
    </ParamField>
    <ParamField path="apiKey" type="string" optional>
      API key for the model provider (overrides default)
    </ParamField>
    <ParamField path="baseURL" type="string" optional>
      Base URL for the API endpoint (for custom endpoints or proxies)
    </ParamField>
  </Expandable>
</ParamField>

<ParamField path="variables" type="Record<string, VariableValue>" optional>
  Key-value pairs for variable substitution using `%variableName%` syntax in your instruction. Variables are **not shared with LLM providers**, making them ideal for sensitive data like passwords and API keys.

  Values can be simple primitives (`string`, `number`, `boolean`) or rich objects with an optional description (`{ value, description? }`).

  **Example:**
  ```typescript
  // Simple values
  await stagehand.act("type %password% into the password field", {
    variables: { password: process.env.USER_PASSWORD }
  });

  // Rich values with descriptions
  await stagehand.act("type %password% into the password field", {
    variables: {
      password: {
        value: process.env.USER_PASSWORD,
        description: "The user's login password"
      }
    }
  });
  ```
</ParamField>

<ParamField path="timeout" type="number" optional>
  Maximum time in **milliseconds** to wait for the action to complete. Default varies by configuration.
</ParamField>

<ParamField path="page" type="PlaywrightPage | PuppeteerPage | PatchrightPage | Page" optional>
  Optional: Specify which page to perform the action on. Supports multiple browser automation libraries:
  - **Playwright**: Native Playwright Page objects
  - **Puppeteer**: Puppeteer Page objects
  - **Patchright**: Patchright Page objects
  - **Stagehand Page**: Stagehand's wrapped Page object

  If not specified, defaults to the current "active" page in your Stagehand instance.
</ParamField>

<ParamField path="serverCache" type="boolean" optional>
  Override the instance-level `serverCache` setting for this request. When `true`, enables server-side caching. When `false`, disables it.

  <Note>Only applies when `env` is `"BROWSERBASE"`. Has no effect in local environments.</Note>

  Defaults to the value set on the Stagehand constructor (which itself defaults to `true`).
</ParamField>

### Returns `Promise<ActResult>`

<ResponseField name="success" type="boolean" required>
  Whether the action completed successfully
</ResponseField>

<ResponseField name="message" type="string" required>
  Human-readable message describing the result
</ResponseField>

<ResponseField name="actionDescription" type="string" required>
  Instruction that was used to perform the action
</ResponseField>

<ResponseField name="actions" type="Action[]">
  Array of actions that were executed

  <Expandable title="Action">
    <ResponseField name="selector" type="string">
      The selector (XPath) used to target the element
    </ResponseField>
    <ResponseField name="description" type="string">
      Description of the action
    </ResponseField>
    <ResponseField name="method" type="string">
      The method used (e.g., "click", "fill", "type")
    </ResponseField>
    <ResponseField name="arguments" type="string[]">
      Arguments passed to the method
    </ResponseField>
  </Expandable>
</ResponseField>

<ResponseField name="cacheStatus" type='"HIT" | "MISS"' optional>
  Indicates whether the result was served from the server-side cache. Only present when running with `env: "BROWSERBASE"` and server-side caching is enabled.

  - **`"HIT"`** - Result was served from cache; no LLM tokens were consumed
  - **`"MISS"`** - Result was computed fresh and cached for future calls
</ResponseField>

**Example Response:**
```json
{
  "success": true,
  "message": "Action completed successfully",
  "actionDescription": "Clicked the submit button",
  "actions": [
    {
      "selector": "/html/body/form/button[1]",
      "description": "Submit button at bottom of form",
      "method": "click",
      "arguments": []
    }
  ]
}
```

### Built-in Support

<Note>
**Iframe and Shadow DOM interactions are supported out of the box.** Stagehand automatically handles iframe traversal and shadow DOM elements without requiring additional configuration or flags.
</Note>

### Code Examples

<Tabs>
<Tab title="Basic Usage">

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

// Initialize with Browserbase (API key and project ID from environment variables)
// Set BROWSERBASE_API_KEY and BROWSERBASE_PROJECT_ID in your environment
const stagehand = new Stagehand({ env: "BROWSERBASE" });
await stagehand.init();
const page = stagehand.context.pages()[0];

await page.goto("https://example.com");

// Simple action
await stagehand.act("click the login button");
```

</Tab>
<Tab title="Variables">

```typescript
// Variables are NOT shared with LLM providers
await stagehand.act("type %username% into the email field", {
  variables: { username: "user@example.com" }
});

await stagehand.act("type %password% into the password field", {
  variables: { password: process.env.USER_PASSWORD }
});

await stagehand.act("click the login button");
```

</Tab>
<Tab title="Custom Model">

```typescript
// Using string format
await stagehand.act("choose 'Peach' from the favorite color dropdown", {
  model: "google/gemini-2.5-flash",
  timeout: 10000
});

// Using object format with custom configuration
await stagehand.act("choose 'Peach' from the favorite color dropdown", {
  model: {
    modelName: "google/gemini-2.5-flash",
    apiKey: process.env.GOOGLE_API_KEY,
    baseURL: "https://custom-api-endpoint.com"
  },
  timeout: 10000
});
```

</Tab>
<Tab title="Multi-Page">

```typescript
// Create multiple pages
const page1 = stagehand.context.pages()[0];
const page2 = await stagehand.context.newPage();

// Perform actions on specific pages
await stagehand.act("click the first link", { page: page1 });
await stagehand.act("click the second link", { page: page2 });
```

</Tab>
<Tab title="Caching">

<Tip>
**Auto-caching is now available in v3.** See the [caching guide](/v3/best-practices/caching) for more details.
</Tip>

```typescript
// Observe first to plan the action
const [action] = await stagehand.observe("click the submit button");

// Cache and reuse the action
if (action) {
  await stagehand.act(action);
}

// Later, reuse the same cached action
await stagehand.act(action);
```

</Tab>
</Tabs>

### Error Types

The following errors may be thrown by the `act()` method:

- **StagehandError** - Base class for all Stagehand-specific errors
- **StagehandElementNotFoundError** - Target element could not be located using the provided selector(s)
- **StagehandClickError** - Failed to click on the target element
- **StagehandEvalError** - Error occurred while evaluating JavaScript in the page context
- **StagehandDomProcessError** - Error occurred while processing the DOM
- **StagehandIframeError** - Unable to resolve iframe for the target element
- **ContentFrameNotFoundError** - Unable to obtain content frame for the selector
- **XPathResolutionError** - XPath does not resolve in the current page or frames
- **StagehandShadowRootMissingError** - No shadow root present on the resolved host element
- **LLMResponseError** - Error in LLM response processing
- **MissingLLMConfigurationError** - No LLM API key or client configured
- **UnsupportedModelError** - The specified model is not supported for this operation
- **InvalidAISDKModelFormatError** - Model string does not follow the required `provider/model` format

================================================
FILE: packages/docs/v3/references/agent.mdx
================================================
---
title: agent()
description: 'Complete API reference for the agent() method'
icon: 'robot'
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


<CardGroup cols={1}>
<Card title="Agent" icon="robot" href="/v3/basics/agent">
  See how to use agent() to create autonomous AI agents for multi-step browser workflows
</Card>
</CardGroup>

### Agent Creation

<Tabs>
<Tab title="TypeScript">

```typescript
// Create agent instance
const agent = stagehand.agent(config?: AgentConfig): AgentInstance
```

**AgentConfig Interface:**
```typescript
interface AgentConfig {
  systemPrompt?: string;
  integrations?: (Client | string)[];
  tools?: ToolSet;
  /** @deprecated Use `mode: "cua"` instead */
  cua?: boolean;
  model?: string | AgentModelConfig<string>;
  executionModel?: string | AgentModelConfig<string>;
  stream?: boolean; // Enable streaming mode (experimental)
  mode?: "dom" | "hybrid" | "cua"; // Tool mode
}

// AgentModelConfig for advanced configuration
type AgentModelConfig<TModelName extends string = string> = {
  modelName: TModelName;
} & Record<string, unknown>;
```

**AgentInstance Interface:**
```typescript
interface AgentInstance {
  execute: (instructionOrOptions: string | AgentExecuteOptions) => Promise<AgentResult>;
}
```

</Tab>

</Tabs>

### Agent Configuration

<ParamField path="systemPrompt" type="string" optional>
  Custom system prompt to provide to the agent. Overrides the default system prompt and defines agent behavior.
</ParamField>

<ParamField path="model" type="string | AgentModelConfig" optional>
  The model to use for agent functionality. Can be either:
  - A string in the format `"provider/model"` (e.g., `"openai/computer-use-preview"`, `"anthropic/claude-sonnet-4-20250514"`)
  - An object with `modelName` and additional provider-specific options

  **Available CUA Models:**
  - `"anthropic/claude-haiku-4-5-20251001"`
  - `"anthropic/claude-sonnet-4-6"`
  - `"anthropic/claude-sonnet-4-5-20250929"`
  - `"anthropic/claude-opus-4-5-20251101"`
  - `"anthropic/claude-opus-4-6"`
  - `"google/gemini-2.5-computer-use-preview-10-2025"`
  - `"google/gemini-3-flash-preview"`
  - `"google/gemini-3-pro-preview"`
  - `"microsoft/fara-7b"`
  - `"openai/computer-use-preview"`
  - `"openai/computer-use-preview-2025-03-11"`

  <Expandable title="AgentModelConfig Object">
    <ParamField path="modelName" type="string" required>
      The model name
    </ParamField>
    <ParamField path="[key: string]" type="unknown" optional>
      Additional provider-specific options (e.g., `apiKey`, `baseURL`)
    </ParamField>
  </Expandable>
</ParamField>

<ParamField path="executionModel" type="string | AgentModelConfig" optional>
  The model to use for tool execution (observe/act calls within agent tools). If not specified, inherits from the main model configuration.

  **Format:** `"provider/model"` (e.g., `"openai/gpt-4o-mini"`, `"google/gemini-2.0-flash-exp"`)
</ParamField>

<ParamField path="cua" type="boolean" optional>
  <Warning>**Deprecated:** Use `mode: "cua"` instead. This option will be removed in a future version.</Warning>
  
  Indicates whether Computer Use Agent (CUA) mode is enabled. When false, the agent uses standard tool-based operation instead of computer control.
</ParamField>

<ParamField path="integrations" type="(Client | string)[]" optional>
  MCP (Model Context Protocol) integrations for external tools and services.

  **Array of:** MCP server URLs (strings) or connected Client objects
</ParamField>

<ParamField path="tools" type="ToolSet" optional>
  Custom tool definitions to extend agent capabilities using the AI SDK ToolSet format.
</ParamField>

<ParamField path="stream" type="boolean" optional>
  Enable streaming mode for the agent. When `true`, `execute()` returns `AgentStreamResult` with `textStream` for incremental output. When `false` (default), `execute()` returns `AgentResult` after completion.
  
  **Default:** `false`
  
  <Warning>**Non-CUA agents only.** Requires `experimental: true`. Not available when `mode: "cua"`.</Warning>
</ParamField>

<ParamField path="mode" type='"dom" | "hybrid" | "cua"' optional>
  Tool mode for the agent. Determines which set of tools is available to the agent.
  
  **Modes:**
  - `"dom"` (default): Uses DOM-based tools (`act`, `fillForm`) for structured page interactions. Works with any model.
  - `"hybrid"`: Uses both DOM-based and coordinate-based tools (`act`, `click`, `type`, `dragAndDrop`, `clickAndHold`, `fillForm`) for visual/screenshot-based interactions. Requires models with reliable coordinate-based action capabilities.
  - `"cua"`: Uses Computer Use Agent (CUA) providers like Anthropic Claude, Google Gemini, or OpenAI for screenshot-based automation. This is the preferred way to enable CUA mode (replaces the deprecated `cua: true` option).
  
  **Default:** `"dom"`
  
  <Warning>
  **Hybrid Mode Model Requirements:** Only use hybrid mode with models that can reliably perform coordinate-based actions:
  - **Google:** `google/gemini-3-flash-preview`
  - **Anthropic:** `anthropic/claude-sonnet-4-20250514`, `anthropic/claude-sonnet-4-5-20250929`, `anthropic/claude-haiku-4-5-20251001`
  
  Requires `experimental: true` in Stagehand constructor.
  </Warning>
</ParamField>

### Execute Method

<Tabs>
<Tab title="Non-Streaming">

```typescript
// String instruction
await agent.execute(instruction: string): Promise<AgentResult>

// With options
await agent.execute(options: AgentExecuteOptions): Promise<AgentResult>
```

**AgentExecuteOptions Interface:**
```typescript
interface AgentExecuteOptions {
  instruction: string;
  maxSteps?: number;
  page?: PlaywrightPage | PuppeteerPage | PatchrightPage | Page;
  highlightCursor?: boolean;
  messages?: ModelMessage[]; // Continue from previous conversation (experimental)
  signal?: AbortSignal; // Cancel execution (experimental)
  excludeTools?: string[]; // Tools to exclude from this execution (experimental)
  output?: ZodObject; // Zod schema for structured output (experimental)
  callbacks?: AgentExecuteCallbacks;
}

interface AgentExecuteCallbacks {
  prepareStep?: PrepareStepFunction<ToolSet>;
  onStepFinish?: GenerateTextOnStepFinishCallback<ToolSet>;
}
```

</Tab>

<Tab title="Streaming">

```typescript
// With stream: true in AgentConfig
await agent.execute(options: AgentStreamExecuteOptions): Promise<AgentStreamResult>
```

**AgentStreamExecuteOptions Interface:**
```typescript
interface AgentStreamExecuteOptions {
  instruction: string;
  maxSteps?: number;
  page?: PlaywrightPage | PuppeteerPage | PatchrightPage | Page;
  highlightCursor?: boolean;
  messages?: ModelMessage[]; // Continue from previous conversation (experimental)
  signal?: AbortSignal; // Cancel execution (experimental)
  excludeTools?: string[]; // Tools to exclude from this execution (experimental)
  output?: ZodObject; // Zod schema for structured output (experimental)
  callbacks?: AgentStreamCallbacks;
}

interface AgentStreamCallbacks {
  prepareStep?: PrepareStepFunction<ToolSet>;
  onStepFinish?: StreamTextOnStepFinishCallback<ToolSet>;
  onChunk?: StreamTextOnChunkCallback<ToolSet>;
  onFinish?: StreamTextOnFinishCallback<ToolSet>;
  onError?: StreamTextOnErrorCallback;
  onAbort?: (event: { steps: Array<StepResult<ToolSet>> }) => void | Promise<void>;
}
```

</Tab>

</Tabs>

### Execute Parameters

<ParamField path="instruction" type="string" required>
  High-level task description in natural language.
</ParamField>

<ParamField path="maxSteps" type="number" optional>
  Maximum number of actions the agent can take before stopping.

  **Default:** `20`
</ParamField>

<ParamField path="page" type="PlaywrightPage | PuppeteerPage | PatchrightPage | Page" optional>
  Optional: Specify which page to perform the agent execution on. Supports multiple browser automation libraries:
  - **Playwright**: Native Playwright Page objects
  - **Puppeteer**: Puppeteer Page objects
  - **Patchright**: Patchright Page objects
  - **Stagehand Page**: Stagehand's wrapped Page object

  If not specified, defaults to the current "active" page in your Stagehand instance.
</ParamField>

<ParamField path="highlightCursor" type="boolean" optional>
  Whether to show a visual cursor on the page during agent execution. Useful for debugging and demonstrations.

  **Default:** `false`
</ParamField>

<ParamField path="messages" type="ModelMessage[]" optional>
  Previous conversation messages to continue from. Pass the `messages` from a previous `AgentResult` to continue that conversation.

  <Warning>**Non-CUA agents only.** Requires `experimental: true`. Not available when `mode: "cua"`.</Warning>
</ParamField>

<ParamField path="signal" type="AbortSignal" optional>
  An `AbortSignal` that can be used to cancel the agent execution. When aborted, the agent will stop and throw an `AgentAbortError`.

  <Warning>**Non-CUA agents only.** Requires `experimental: true`. Not available when `mode: "cua"`.</Warning>
</ParamField>

<ParamField path="excludeTools" type="string[]" optional>
  Tools to exclude from this execution. Pass an array of tool names to prevent the agent from using those tools.

  **Available tools by mode:**

  **DOM mode (default):** `act`, `fillForm`, `ariaTree`, `extract`, `goto`, `scroll`, `keys`, `navback`, `screenshot`, `think`, `wait`, `search`

  **Hybrid mode:** `click`, `type`, `dragAndDrop`, `clickAndHold`, `fillFormVision`, `act`, `ariaTree`, `extract`, `goto`, `scroll`, `keys`, `navback`, `screenshot`, `think`, `wait`, `search`

  <Warning>**Non-CUA agents only.** Requires `experimental: true`. Not available when `mode: "cua"`.</Warning>
</ParamField>

<ParamField path="output" type="ZodObject" optional>
  A Zod schema defining structured output data to return when the task completes. The agent will populate this data based on the information it gathered during execution. The result will be available in `AgentResult.output`.

  <Warning>**Non-CUA agents only.** Requires `experimental: true`. Not available when `mode: "cua"`.</Warning>

  ```typescript
  import { z } from "zod";

  const result = await agent.execute({
    instruction: "Find the cheapest flight from NYC to LA",
    output: z.object({
      price: z.string().describe("The price of the flight"),
      airline: z.string().describe("The airline name"),
      departureTime: z.string().describe("Departure time"),
    }),
  });

  console.log(result.output); // { price: "$199", airline: "Delta", departureTime: "8:00 AM" }
  ```
</ParamField>

<ParamField path="callbacks" type="AgentExecuteCallbacks | AgentStreamCallbacks" optional>
  Callbacks to hook into the agent's execution lifecycle. The available callbacks depend on whether streaming is enabled.

  <Warning>**Non-CUA agents only.** Requires `experimental: true`. Not available when `mode: "cua"`.</Warning>

  <Expandable title="Non-Streaming Callbacks (AgentExecuteCallbacks)">
    <ParamField path="prepareStep" type="PrepareStepFunction<ToolSet>" optional>
      Called before each step to modify settings. You can change the model, tool choices, active tools, system prompt, and input messages for each step.
    </ParamField>
    <ParamField path="onStepFinish" type="GenerateTextOnStepFinishCallback<ToolSet>" optional>
      Called when each step (LLM call) completes. Provides access to tool calls, reasoning, and step results.
    </ParamField>
  </Expandable>

  <Expandable title="Streaming Callbacks (AgentStreamCallbacks)">
    <ParamField path="prepareStep" type="PrepareStepFunction<ToolSet>" optional>
      Called before each step to modify settings.
    </ParamField>
    <ParamField path="onStepFinish" type="StreamTextOnStepFinishCallback<ToolSet>" optional>
      Called when each step completes during streaming.
    </ParamField>
    <ParamField path="onChunk" type="StreamTextOnChunkCallback<ToolSet>" optional>
      Called for each chunk of the stream. Stream processing will pause until the callback promise resolves.
    </ParamField>
    <ParamField path="onFinish" type="StreamTextOnFinishCallback<ToolSet>" optional>
      Called when the stream finishes successfully.
    </ParamField>
    <ParamField path="onError" type="StreamTextOnErrorCallback" optional>
      Called when an error occurs during streaming.
    </ParamField>
    <ParamField path="onAbort" type="(event: { steps: StepResult<ToolSet>[] }) => void | Promise<void>" optional>
      Called when the stream is aborted via the `signal` option.
    </ParamField>
  </Expandable>
</ParamField>

### Response

**Returns:** `Promise<AgentResult>` (non-streaming) or `Promise<AgentStreamResult>` (streaming)

<Tabs>
<Tab title="Non-Streaming">

**AgentResult Interface:**
```typescript
interface AgentResult {
  success: boolean;
  message: string;
  actions: AgentAction[];
  completed: boolean;
  metadata?: Record<string, unknown>;
  messages?: ModelMessage[]; // Conversation history for continuation (experimental)
  output?: Record<string, unknown>; // Structured output data (experimental)
  usage?: {
    input_tokens: number;
    output_tokens: number;
    reasoning_tokens?: number;
    cached_input_tokens?: number;
    inference_time_ms: number;
  };
}

// AgentAction can contain various tool-specific fields
interface AgentAction {
  type: string;
  reasoning?: string;
  taskCompleted?: boolean;
  action?: string;
  timeMs?: number;        // wait tool
  pageText?: string;      // ariaTree tool
  pageUrl?: string;       // ariaTree tool
  instruction?: string;   // various tools
  timestamp?: number;     // Action timestamp
  [key: string]: unknown; // Additional tool-specific fields
}
```

</Tab>

<Tab title="Streaming">

**AgentStreamResult Interface:**
```typescript
interface AgentStreamResult {
  // Async iterable of text chunks for incremental output
  textStream: AsyncIterable<string>;
  
  // Async iterable of all stream events (tool calls, messages, etc.)
  fullStream: AsyncIterable<StreamPart>;
  
  // Promise that resolves to the final AgentResult when streaming completes
  result: Promise<AgentResult>;
  
  // Additional properties from StreamTextResult<ToolSet, never>
  // See Vercel AI SDK documentation for full details
}
```

</Tab>
</Tabs>

<ResponseField name="success" type="boolean">
  Whether the task was completed successfully.
</ResponseField>

<ResponseField name="message" type="string">
  Description of the execution result and status.
</ResponseField>

<ResponseField name="actions" type="AgentAction[]">
  Array of individual actions taken during execution. Each action contains tool-specific data.
</ResponseField>

<ResponseField name="completed" type="boolean">
  Whether the agent believes the task is fully complete.
</ResponseField>

<ResponseField name="metadata" type="Record<string, unknown>" optional>
  Additional execution metadata and debugging information.
</ResponseField>

<ResponseField name="messages" type="ModelMessage[]" optional>
  The conversation messages from this execution. Pass these to a subsequent `execute()` call via the `messages` option to continue the conversation.

  <Note>**Non-CUA agents only.** Requires `experimental: true`.</Note>
</ResponseField>

<ResponseField name="output" type="Record<string, unknown>" optional>
  Custom structured output data extracted based on the `output` Zod schema provided in execute options. Only populated if an `output` schema was provided.

  <Note>**Non-CUA agents only.** Requires `experimental: true`.</Note>
</ResponseField>

<ResponseField name="usage" type="object" optional>
  Token usage and performance metrics.

  <Expandable title="Usage Metrics">
    <ResponseField name="input_tokens" type="number">
      Number of input tokens used
    </ResponseField>
    <ResponseField name="output_tokens" type="number">
      Number of output tokens generated
    </ResponseField>
    <ResponseField name="reasoning_tokens" type="number" optional>
      Number of reasoning tokens (if supported by the model)
    </ResponseField>
    <ResponseField name="cached_input_tokens" type="number" optional>
      Number of cached input tokens (if supported by the model)
    </ResponseField>
    <ResponseField name="inference_time_ms" type="number">
      Total inference time in milliseconds
    </ResponseField>
  </Expandable>
</ResponseField>

### Example Response
```json
{
  "success": true,
  "message": "Task completed successfully",
  "actions": [
    {
      "type": "act",
      "instruction": "click the submit button",
      "reasoning": "User requested to submit the form",
      "taskCompleted": false
    },
    {
      "type": "observe",
      "instruction": "check if submission was successful",
      "taskCompleted": true
    }
  ],
  "completed": true,
  "metadata": {
    "steps_taken": 2
  },
  "output": {
    "price": "$199",
    "airline": "Delta",
    "departureTime": "8:00 AM"
  },
  "usage": {
    "input_tokens": 1250,
    "output_tokens": 340,
    "reasoning_tokens": 42,
    "cached_input_tokens": 0,
    "inference_time_ms": 2500
  }
}
```

### Code Examples

<Tabs>
<Tab title="Basic Usage">

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

// Initialize with Browserbase (API key and project ID from environment variables)
// Set BROWSERBASE_API_KEY and BROWSERBASE_PROJECT_ID in your environment
const stagehand = new Stagehand({
  env: "BROWSERBASE",
  model: "anthropic/claude-sonnet-4-20250514"
});
await stagehand.init();

const page = stagehand.context.pages()[0];
// Create agent with default configuration
const agent = stagehand.agent();

// Navigate to a page
await page.goto("https://www.google.com");

// Execute a task
const result = await agent.execute("Search for 'Stagehand automation' and click the first result");

console.log(result.message);
console.log(`Completed: ${result.completed}`);
console.log(`Actions taken: ${result.actions.length}`);
```

</Tab>
<Tab title="Custom Configuration">

```typescript
// Create agent with custom model and system prompt
const agent = stagehand.agent({
  model: "openai/computer-use-preview",
  systemPrompt: "You are a helpful assistant that can navigate websites efficiently. Always verify actions before proceeding.",
  executionModel: "openai/gpt-4o-mini"  // Use faster model for tool execution
});

const page = stagehand.context.pages()[0];
await page.goto("https://example.com");

const result = await agent.execute({
  instruction: "Fill out the contact form with test data",
  maxSteps: 10,
  highlightCursor: true
});
```

</Tab>
<Tab title="Advanced Model Config">

```typescript
// Using AgentModelConfig for advanced configuration
const agent = stagehand.agent({
  model: {
    modelName: "anthropic/claude-sonnet-4-20250514",
    apiKey: process.env.ANTHROPIC_API_KEY,
    baseURL: "https://custom-proxy.com/v1"
  }
});

const result = await agent.execute("Complete the checkout process");
```

</Tab>
<Tab title="Multi-Page">

```typescript
const page1 = stagehand.context.pages()[0];
const page2 = await stagehand.context.newPage();

const agent = stagehand.agent();

// Execute on specific page
await page2.goto("https://example.com/dashboard");
const result = await agent.execute({
  instruction: "Export the data table",
  page: page2
});
```

</Tab>
<Tab title="Streaming">

```typescript
const stagehand = new Stagehand({
  env: "LOCAL",
  experimental: true, // Required for streaming
});
await stagehand.init();

const page = stagehand.context.pages()[0];
await page.goto("https://amazon.com");

// Create a streaming agent
const agent = stagehand.agent({
  model: "anthropic/claude-sonnet-4-5-20250929",
  stream: true,
});

const streamResult = await agent.execute({
  instruction: "Search for headphones and find the best deal",
  maxSteps: 20,
});

// Stream text output incrementally
for await (const delta of streamResult.textStream) {
  process.stdout.write(delta);
}

// Get the final result
const finalResult = await streamResult.result;
console.log("Completed:", finalResult.completed);
```

</Tab>
<Tab title="Callbacks">

```typescript
const stagehand = new Stagehand({
  env: "LOCAL",
  experimental: true,
});
await stagehand.init();

const agent = stagehand.agent({
  model: "anthropic/claude-sonnet-4-5-20250929",
});

const page = stagehand.context.pages()[0];
await page.goto("https://example.com");

const result = await agent.execute({
  instruction: "Fill out the contact form",
  maxSteps: 10,
  callbacks: {
    prepareStep: async (stepContext) => {
      console.log(`Starting step ${stepContext.stepNumber}`);
      return stepContext;
    },
    onStepFinish: async (event) => {
      console.log(`Step finished: ${event.finishReason}`);
      if (event.toolCalls) {
        for (const tc of event.toolCalls) {
          console.log(`Tool: ${tc.toolName}`, tc.input);
        }
      }
    },
  },
});
```

</Tab>
<Tab title="Abort Signal">

```typescript
const stagehand = new Stagehand({
  env: "LOCAL",
  experimental: true,
});
await stagehand.init();

const agent = stagehand.agent({
  model: "anthropic/claude-sonnet-4-5-20250929",
});

const page = stagehand.context.pages()[0];
await page.goto("https://example.com");

const controller = new AbortController();

// Abort after 30 seconds
setTimeout(() => controller.abort("Timeout exceeded"), 30000);

try {
  const result = await agent.execute({
    instruction: "Complete a complex multi-step workflow",
    maxSteps: 50,
    signal: controller.signal,
  });
} catch (error) {
  if (error.name === "AgentAbortError") {
    console.log("Task cancelled:", error.message);
  }
}
```

</Tab>
<Tab title="Message Continuation">

```typescript
const stagehand = new Stagehand({
  env: "LOCAL",
  experimental: true,
});
await stagehand.init();

const agent = stagehand.agent({
  model: "anthropic/claude-sonnet-4-5-20250929",
});

const page = stagehand.context.pages()[0];
await page.goto("https://example.com/shop");

// First execution
const firstResult = await agent.execute({
  instruction: "Search for laptops and list the top 3 options",
  maxSteps: 10,
});

// Continue conversation with context from first run
const secondResult = await agent.execute({
  instruction: "Filter those results by price under $1000",
  maxSteps: 10,
  messages: firstResult.messages, // Pass previous messages
});

// Chain further with accumulated context
const thirdResult = await agent.execute({
  instruction: "Add the best-rated one to cart",
  maxSteps: 10,
  messages: secondResult.messages,
});

console.log("Final:", thirdResult.message);
```

</Tab>
<Tab title="MCP Integrations">

```typescript
import { Client } from "@modelcontextprotocol/sdk/client/index.js";

// Create agent with MCP integrations
const agent = stagehand.agent({
  model: "anthropic/claude-sonnet-4-20250514",
  integrations: [
    "https://mcp-server.example.com",  // MCP server URL
    mcpClientInstance  // Or pre-connected Client object
  ]
});

const result = await agent.execute("Use the external tool to process this data");
```

</Tab>
<Tab title="Exclude Tools">

```typescript
const stagehand = new Stagehand({
  env: "LOCAL",
  experimental: true, // Required for excludeTools
});
await stagehand.init();

const agent = stagehand.agent({
  model: "anthropic/claude-sonnet-4-5-20250929",
});

const page = stagehand.context.pages()[0];
await page.goto("https://example.com");

// Exclude specific tools from this execution
const result = await agent.execute({
  instruction: "Navigate the page and click buttons",
  maxSteps: 15,
  excludeTools: ["screenshot", "extract", "search"],
});

console.log("Completed:", result.completed);
```

</Tab>
<Tab title="Hybrid Mode">

```typescript
const stagehand = new Stagehand({
  env: "LOCAL",
  experimental: true, // Required for hybrid mode
});
await stagehand.init();

// Create agent with hybrid mode for coordinate-based interactions
const agent = stagehand.agent({
  mode: "hybrid",
  model: "google/gemini-3-flash-preview", // Use a model that supports coordinate-based actions
});

const page = stagehand.context.pages()[0];
await page.goto("https://example.com/form");

const result = await agent.execute({
  instruction: "Fill out the registration form with test data",
  maxSteps: 15,
  highlightCursor: true, // Enabled by default in hybrid mode
});

console.log("Completed:", result.completed);
```

</Tab>
<Tab title="Structured Output">

```typescript
import { z } from "zod";

const stagehand = new Stagehand({
  env: "LOCAL",
  experimental: true, // Required for structured output
});
await stagehand.init();

const agent = stagehand.agent({
  model: "anthropic/claude-sonnet-4-5-20250929",
});

const page = stagehand.context.pages()[0];
await page.goto("https://www.google.com/flights");

// Define output schema to receive structured data
const result = await agent.execute({
  instruction: "Find the cheapest flight from NYC to LA for next week",
  maxSteps: 20,
  output: z.object({
    price: z.string().describe("The price of the flight"),
    airline: z.string().describe("The airline name"),
    departureTime: z.string().describe("Departure time"),
    arrivalTime: z.string().describe("Arrival time"),
    flightNumber: z.string().optional().describe("Flight number if available"),
  }),
});

// Access the structured output
console.log("Flight found:");
console.log(`  Price: ${result.output?.price}`);
console.log(`  Airline: ${result.output?.airline}`);
console.log(`  Departure: ${result.output?.departureTime}`);
console.log(`  Arrival: ${result.output?.arrivalTime}`);
```

</Tab>
<Tab title="Custom Tools">

```typescript
import { tool } from "@browserbasehq/stagehand";
import { z } from "zod";

// Define custom tools using the tool helper from @browserbasehq/stagehand
const customTools = {
  calculateTotal: tool({
    description: "Calculate the total of items in cart",
    parameters: z.object({
      items: z.array(z.object({
        price: z.number(),
        quantity: z.number()
      }))
    }),
    execute: async ({ items }) => {
      const total = items.reduce((sum, item) => sum + (item.price * item.quantity), 0);
      return { total };
    }
  })
};

const agent = stagehand.agent({
  model: "openai/computer-use-preview",
  tools: customTools
});

const result = await agent.execute("Calculate the total cost of items in the shopping cart");
```

</Tab>
</Tabs>

### Error Types

The following errors may be thrown by the `agent()` method:

- **StagehandError** - Base class for all Stagehand-specific errors
- **StagehandInitError** - Agent was not properly initialized
- **MissingLLMConfigurationError** - No LLM API key or client configured
- **UnsupportedModelError** - The specified model is not supported for agent functionality
- **UnsupportedModelProviderError** - The specified model provider is not supported
- **InvalidAISDKModelFormatError** - Model string does not follow the required `provider/model` format
- **MCPConnectionError** - Failed to connect to MCP server
- **StagehandDefaultError** - General execution error with detailed message
- **AgentAbortError** - Thrown when agent execution is cancelled via an `AbortSignal`
- **StreamingCallbacksInNonStreamingModeError** - Thrown when streaming-only callbacks (`onChunk`, `onFinish`, `onError`, `onAbort`) are used without `stream: true`
- **ExperimentalNotConfiguredError** - Thrown when experimental features (such as callbacks, signal, messages, or streaming) are used without `experimental: true` in the Stagehand constructor

================================================
FILE: packages/docs/v3/references/context.mdx
================================================
---
title: context
description: 'Complete API reference for the browser context'
icon: 'window'
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


<CardGroup cols={1}>
<Card title="Stagehand" icon="wand-magic-sparkles" href="/v3/references/stagehand">
  Learn about the main Stagehand object
</Card>
</CardGroup>

## Overview

The `context` object manages the browser context, which is a container for multiple pages (tabs). It provides methods for creating new pages, accessing existing pages, and managing which page is currently active.

Access the context through your Stagehand instance:

```typescript
const stagehand = new Stagehand({ env: "BROWSERBASE" });
await stagehand.init();
const context = stagehand.context;
```

## Methods

### newPage()

Create a new page (tab) in the browser.

```typescript
await context.newPage(url?: string): Promise<Page>
```

<ParamField path="url" type="string" optional>
  The URL to navigate to in the new page.

  **Default:** `"about:blank"`
</ParamField>

**Returns:** `Promise<Page>` - The newly created page object.

The new page is automatically set as the active page.

### pages()

Get all open pages in the browser context.

```typescript
context.pages(): Page[]
```

**Returns:** `Page[]` - Array of all open pages, ordered from oldest to newest.

### activePage()

Get the currently active page.

```typescript
context.activePage(): Page | undefined
```

**Returns:** `Page | undefined` - The most recently used page, or `undefined` if no pages exist.

The active page is determined by:
1. Most recently interacted with page
2. Most recently created page if no interaction history
3. `undefined` if all pages have been closed

### setActivePage()

Set a specific page as the active page.

```typescript
context.setActivePage(page: Page): void
```

<ParamField path="page" type="Page" required>
  The page to set as active. Must be a page that exists in this context.
</ParamField>

This method:
- Marks the page as most recently used
- Brings the tab to the foreground (in headed mode)
- Makes it the default page for subsequent operations

### addInitScript()

Inject JavaScript that runs before any page scripts on every navigation.

```typescript
await context.addInitScript<Arg>(
  script: string | { path?: string; content?: string } | ((arg: Arg) => unknown),
  arg?: Arg,
): Promise<void>
```

<ParamField
  path="script"
  type="string | { path?: string; content?: string } | (arg: Arg) => unknown"
  required
>
  Provide the script to inject. Pass raw source code, reference a file on disk,
  or supply a function that Stagehand serializes before sending to the browser.
</ParamField>

<ParamField path="arg" type="Arg" optional>
  Extra data that is JSON-serialized and passed to your function. Only supported
  when `script` is a function.
</ParamField>

This method:
- Installs the script on all currently open pages, where it runs at document start and is
  replayed on every navigation of those pages
- Automatically applies the same script to any pages created after calling
  `context.addInitScript()`
- Allows referencing preload files via `{ path: "./preloads/dom-hooks.js" }`,
  mirroring Playwright's `sourceURL` behavior for readable stack traces

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({ env: "LOCAL" });
await stagehand.init();
const context = stagehand.context;

// Add some JavaScript to automatically accept alert dialogs
await context.addInitScript(() => {
   window.alert = () => {};
   window.confirm = () => true;
   window.prompt = () => '';
 });
```

### setExtraHTTPHeaders()

Set HTTP headers that will be included in every request made by all pages in the browser context.

```typescript
await context.setExtraHTTPHeaders(headers: Record<string, string>): Promise<void>
```

<ParamField path="headers" type="Record<string, string>" required>
  A plain object of header name–value pairs. All values must be strings.
</ParamField>

This method:
- Applies the headers to all existing pages in the context immediately
- Automatically applies the same headers to any pages created after calling `setExtraHTTPHeaders()`
- Calling it again replaces all previously set extra headers (it does not merge)
- To clear all extra headers, pass an empty object: `await context.setExtraHTTPHeaders({})`

<Note>
Headers set via `context.setExtraHTTPHeaders()` are context-wide. They apply to every network request from every page in the context, including navigation requests, XHR/fetch calls, and subresource loads.
</Note>

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({ env: "LOCAL" });
await stagehand.init();
const context = stagehand.context;

// Set custom headers for all requests
await context.setExtraHTTPHeaders({
  "X-Custom-Token": "my-secret-token",
  "Accept-Language": "en-US",
});

// All subsequent requests from any page in this context
// will include these headers
const page = await context.newPage("https://example.com");
```

### cookies()

Retrieve browser cookies, optionally filtered by URL(s).

```typescript
await context.cookies(urls?: string | string[]): Promise<Cookie[]>
```

<ParamField path="urls" type="string | string[]" optional>
  A single URL or array of URLs to filter cookies by. When provided, only cookies that match the domain, path, and secure requirements of the given URLs are returned.

  **Default:** Returns all cookies when omitted.
</ParamField>

**Returns:** `Promise<Cookie[]>` - Array of cookie objects.

```typescript
// Get all cookies
const allCookies = await context.cookies();

// Get cookies for a specific URL
const siteCookies = await context.cookies("https://example.com");

// Get cookies for multiple URLs
const cookies = await context.cookies([
  "https://example.com",
  "https://api.example.com",
]);
```

### addCookies()

Set one or more cookies in the browser context.

```typescript
await context.addCookies(cookies: CookieParam[]): Promise<void>
```

<ParamField path="cookies" type="CookieParam[]" required>
  Array of cookie parameters to set. Each cookie must provide either `url` or both `domain` and `path` — providing both `url` and `domain` (or `url` and `path`) will throw a validation error.
</ParamField>

<Note>
Cookies set via `context.addCookies()` are shared across all pages in the context, scoped by domain and path.
</Note>

```typescript
// Set a cookie using a URL
await context.addCookies([
  {
    name: "session",
    value: "abc123",
    url: "https://example.com",
  },
]);

// Set a cookie using domain and path
await context.addCookies([
  {
    name: "token",
    value: "xyz789",
    domain: ".example.com",
    path: "/",
    secure: true,
    httpOnly: true,
    sameSite: "Strict",
  },
]);
```

<Warning>
Setting `sameSite: "None"` requires `secure: true`. Stagehand will throw a validation error if this requirement is not met.
</Warning>

### clearCookies()

Clear cookies from the browser context. Can clear all cookies or selectively filter by name, domain, or path.

```typescript
await context.clearCookies(options?: ClearCookieOptions): Promise<void>
```

<ParamField path="options" type="ClearCookieOptions" optional>
  Filter options to selectively clear cookies. When omitted, all cookies are cleared.

  <Expandable title="ClearCookieOptions">
    <ParamField path="name" type="string | RegExp" optional>
      Match cookies by name. Supports exact string match or RegExp.
    </ParamField>

    <ParamField path="domain" type="string | RegExp" optional>
      Match cookies by domain. Supports exact string match or RegExp.
    </ParamField>

    <ParamField path="path" type="string | RegExp" optional>
      Match cookies by path. Supports exact string match or RegExp.
    </ParamField>
  </Expandable>
</ParamField>

```typescript
// Clear all cookies
await context.clearCookies();

// Clear cookies by exact name
await context.clearCookies({ name: "session" });

// Clear cookies by domain pattern
await context.clearCookies({ domain: /\.example\.com$/ });

// Combine filters (a cookie must match ALL provided filters to be cleared)
await context.clearCookies({
  name: "token",
  domain: ".example.com",
});
```

### close()

Close the browser context and all associated pages.

```typescript
await context.close(): Promise<void>
```

This method:
- Closes the CDP connection
- Cleans up all pages
- Clears all internal mappings

**Note:** This is typically called internally by `stagehand.close()`. You usually don't need to call this directly.

## Code Examples

<Tabs>
<Tab title="Basic Usage">

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

// Initialize with Browserbase (API key and project ID from environment variables)
// Set BROWSERBASE_API_KEY and BROWSERBASE_PROJECT_ID in your environment
const stagehand = new Stagehand({ env: "BROWSERBASE" });
await stagehand.init();
const context = stagehand.context;

// Create a new page
const page1 = await context.newPage("https://example.com");
console.log("Created page 1");

// Create another page
const page2 = await context.newPage("https://another-site.com");
console.log("Created page 2");

// Get all pages
const allPages = context.pages();
console.log(`Total pages: ${allPages.length}`);

await stagehand.close();
```

</Tab>
<Tab title="Multi-Page Workflow">

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({ env: "LOCAL" });
await stagehand.init();
const context = stagehand.context;

// Start with main page
const mainPage = context.pages()[0];
await mainPage.goto("https://example.com");

// Open additional pages
const dashboardPage = await context.newPage("https://example.com/dashboard");
const settingsPage = await context.newPage("https://example.com/settings");

// Work with specific page
context.setActivePage(dashboardPage);
await stagehand.act("click the export button");

// Switch to another page
context.setActivePage(settingsPage);
await stagehand.act("enable notifications");

// Back to main page
context.setActivePage(mainPage);
await stagehand.act("click the logout button");

await stagehand.close();
```

</Tab>
<Tab title="Page Management">

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({ env: "LOCAL" });
await stagehand.init();
const context = stagehand.context;

// Create multiple pages
const pages = await Promise.all([
  context.newPage("https://site1.com"),
  context.newPage("https://site2.com"),
  context.newPage("https://site3.com"),
]);

console.log(`Opened ${pages.length} pages`);

// Get the active page
const active = context.activePage();
console.log(`Active page URL: ${active?.url()}`);

// Iterate through all pages
for (const page of context.pages()) {
  console.log(`Page URL: ${page.url()}`);
  console.log(`Page title: ${await page.title()}`);
}

await stagehand.close();
```

</Tab>
<Tab title="Parallel Operations">

```typescript
import { Stagehand } from "@browserbasehq/stagehand";
import { z } from "zod";

const stagehand = new Stagehand({ env: "LOCAL" });
await stagehand.init();
const context = stagehand.context;

// Create pages for different sites
const page1 = await context.newPage("https://site1.com");
const page2 = await context.newPage("https://site2.com");
const page3 = await context.newPage("https://site3.com");

const schema = z.object({
  title: z.string(),
  description: z.string()
});

// Extract data from all pages in parallel
const results = await Promise.all([
  stagehand.extract("get page info", schema, { page: page1 }),
  stagehand.extract("get page info", schema, { page: page2 }),
  stagehand.extract("get page info", schema, { page: page3 })
]);

console.log("Extracted data:", results);

await stagehand.close();
```

</Tab>
<Tab title="Active Page Tracking">

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({ env: "LOCAL" });
await stagehand.init();
const context = stagehand.context;

// Create pages
const homePage = await context.newPage("https://example.com");
const aboutPage = await context.newPage("https://example.com/about");
const contactPage = await context.newPage("https://example.com/contact");

// The last created page (contactPage) is now active
console.log("Active:", context.activePage()?.url());
// Output: "https://example.com/contact"

// Switch to home page
context.setActivePage(homePage);
console.log("Active:", context.activePage()?.url());
// Output: "https://example.com"

// Now act on the active page (homePage)
await stagehand.act("click the header link");

await stagehand.close();
```

</Tab>
<Tab title="Custom HTTP Headers">

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({ env: "LOCAL" });
await stagehand.init();
const context = stagehand.context;

// Set authorization headers for all requests
await context.setExtraHTTPHeaders({
  Authorization: "Bearer my-api-token",
});

// Navigate — the headers are sent with every request
const page = context.pages()[0];
await page.goto("https://api.example.com/dashboard");

// Headers also apply to new pages
const page2 = await context.newPage("https://api.example.com/settings");

// Replace headers (previous headers are removed)
await context.setExtraHTTPHeaders({
  Authorization: "Bearer refreshed-token",
  "X-Request-Id": "abc-123",
});

await stagehand.close();
```

</Tab>
<Tab title="Cookie Management">

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({ env: "LOCAL" });
await stagehand.init();
const context = stagehand.context;
const page = context.pages()[0];

await page.goto("https://example.com");

// Set authentication cookies
await context.addCookies([
  {
    name: "session_id",
    value: "abc123",
    domain: ".example.com",
    path: "/",
    httpOnly: true,
    secure: true,
    sameSite: "Lax",
  },
]);

// Read cookies back
const cookies = await context.cookies("https://example.com");
console.log("Cookies:", cookies);

// Clear specific cookies
await context.clearCookies({ name: "session_id" });

// Clear all cookies
await context.clearCookies();

await stagehand.close();
```

</Tab>
</Tabs>

## Working with Active Pages

The context tracks which page is currently active:

```typescript
const stagehand = new Stagehand({ env: "LOCAL" });
await stagehand.init();

// Get the current active page
const activePage = stagehand.context.activePage();

// Create a new page - it becomes active
const newPage = await stagehand.context.newPage();

// Now context.activePage() returns newPage
await newPage.goto("https://example.com");
```

## Relationship Between Context and Page

- **Context** manages the browser-level state and multiple pages
- **Page** represents a single tab/window with content
- Creating a new page via `context.newPage()` automatically sets it as active
- You can explicitly control the active page with `context.setActivePage()`
- Use `context.activePage()` to get the currently active page

```typescript
// Get the active page
const activePage = stagehand.context.activePage();

// Or get the first page directly
const firstPage = stagehand.context.pages()[0];
```

## Best Practices

1. **Create pages explicitly** - Use `context.newPage()` instead of relying on popups or `window.open()`
2. **Track page references** - Store page objects in variables for easier management
3. **Set active page before operations** - Ensure the correct page is active before calling Stagehand methods
4. **Clean up properly** - Call `stagehand.close()` to close all pages and the context
5. **Handle page order** - Remember that `context.pages()` returns pages in creation order
6. **Use parallel operations** - Work with multiple pages simultaneously for better performance

## Common Patterns

### Tab Management

```typescript
// Keep track of pages by purpose
const pages = {
  home: await context.newPage("https://example.com"),
  dashboard: await context.newPage("https://example.com/dashboard"),
  settings: await context.newPage("https://example.com/settings")
};

// Switch between tabs
context.setActivePage(pages.dashboard);
await stagehand.act("view report");

context.setActivePage(pages.settings);
await stagehand.act("update preferences");
```

### Bulk Data Collection

```typescript
const urls = [
  "https://site1.com",
  "https://site2.com",
  "https://site3.com"
];

// Open all pages
const pages = await Promise.all(
  urls.map(url => context.newPage(url))
);

// Extract data from each
const data = await Promise.all(
  pages.map(page => stagehand.extract("get data", schema, { page }))
);
```

### Conditional Page Management

```typescript
// Only create a page if needed
if (needsDashboard) {
  const dashboard = await context.newPage("https://example.com/dashboard");
  context.setActivePage(dashboard);
  await stagehand.act("generate report");
}

// Check if we have multiple pages
if (context.pages().length > 1) {
  console.log("Multiple tabs open");
}
```

## Error Handling

Context methods may throw the following errors:

- **Timeout errors** - `newPage()` timed out while waiting for the new page to attach
- **CDP errors** - Connection errors with Chrome DevTools Protocol
- **Invalid page errors** - Attempting to set an active page that doesn't exist in the context
- **StagehandSetExtraHTTPHeadersError** - `setExtraHTTPHeaders()` failed to apply headers to one or more sessions. The error includes a `failures` array with per-session details

Always handle errors appropriately:

```typescript
try {
  const page = await context.newPage("https://example.com");
} catch (error) {
  console.error("Failed to create page:", error.message);
}
```

## Type Definitions

```typescript
interface V3Context {
  newPage(url?: string): Promise<Page>;
  pages(): Page[];
  activePage(): Page | undefined;
  setActivePage(page: Page): void;
  setExtraHTTPHeaders(headers: Record<string, string>): Promise<void>;
  cookies(urls?: string | string[]): Promise<Cookie[]>;
  addCookies(cookies: CookieParam[]): Promise<void>;
  clearCookies(options?: ClearCookieOptions): Promise<void>;
  close(): Promise<void>;
}

interface Cookie {
  name: string;
  value: string;
  domain: string;
  path: string;
  /** Unix time in seconds. -1 means session cookie. */
  expires: number;
  httpOnly: boolean;
  secure: boolean;
  sameSite: "Strict" | "Lax" | "None";
}

interface CookieParam {
  name: string;
  value: string;
  /** If provided, domain/path/secure are derived from this URL. */
  url?: string;
  domain?: string;
  path?: string;
  /** Unix timestamp in seconds. -1 or omitted = session cookie. */
  expires?: number;
  httpOnly?: boolean;
  secure?: boolean;
  sameSite?: "Strict" | "Lax" | "None";
}

interface ClearCookieOptions {
  name?: string | RegExp;
  domain?: string | RegExp;
  path?: string | RegExp;
}
```


================================================
FILE: packages/docs/v3/references/deeplocator.mdx
================================================
---
title: deepLocator
description: 'Complete API reference for the deepLocator method'
icon: 'layer-group'
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


<CardGroup cols={1}>
<Card title="Locator" icon="crosshairs" href="/v3/references/locator">
  Learn about the standard Locator class
</Card>
</CardGroup>

## Overview

The `deepLocator()` method creates a special locator that can traverse iframe boundaries and shadow DOM using a simplified syntax. It automatically resolves the correct frame for each operation, making cross-frame interactions seamless.

Access via the page object:

```typescript
const stagehand = new Stagehand({ env: "BROWSERBASE" });
await stagehand.init();
const page = stagehand.context.pages()[0];

// Deep locator with iframe traversal
const button = page.deepLocator("iframe#myframe >> button.submit");
await button.click();
```

## Syntax

### page.deepLocator()

Create a deep locator that can cross iframe and shadow DOM boundaries.

```typescript
page.deepLocator(selector: string): DeepLocatorDelegate
```

<ParamField path="selector" type="string" required>
  Selector string with optional iframe hop notation (`>>`).

  Supports:
  - **CSS selectors** - Standard CSS syntax
  - **XPath** - Prefix with `xpath=` or start with `/`
  - **Hop notation** - Use `>>` to traverse into iframes
  - **Deep XPath** - Automatically handles iframe steps in XPath
</ParamField>

**Returns:** `DeepLocatorDelegate` - A locator-like object that resolves frames on each action.

## Hop Notation

The `>>` operator allows you to traverse into iframes in a readable way:

```typescript
// Syntax: parent-selector >> child-selector >> target-selector
page.deepLocator("iframe#outer >> iframe.inner >> button")
```

Every segment except the last selects an iframe to traverse into. The final segment selects the target element inside the innermost iframe.

### Examples

```typescript
// Single iframe hop
page.deepLocator("iframe#payment >> input#card-number")

// Multiple iframe hops
page.deepLocator("iframe#level1 >> iframe#level2 >> div.content")

// XPath with hops
page.deepLocator("//iframe[@id='myframe'] >> //button[@class='submit']")

// CSS with XPath target
page.deepLocator("iframe.widget >> xpath=//div[@data-id='123']")
```

## Deep XPath

When using XPath, `deepLocator` automatically recognizes `iframe` steps and traverses into them:

```typescript
// Automatically traverses into iframes
page.deepLocator("//iframe//button")
page.deepLocator("//iframe[@id='myframe']//input[@name='email']")
page.deepLocator("//iframe[1]//iframe[2]//div[@class='target']")
```

The locator intelligently parses the XPath, identifies iframe boundaries, and resolves the correct frame for the final selector.

## Methods

`DeepLocatorDelegate` provides the same API as `Locator`, with automatic frame resolution:

### Interaction Methods

All interaction methods from [`Locator`](/v3/references/locator) are available:

- **`click(options?)`** - Click the element
- **`fill(value)`** - Fill an input
- **`type(text, options?)`** - Type text
- **`hover()`** - Hover over element
- **`selectOption(values)`** - Select dropdown options
- **`scrollTo(percent)`** - Scroll element

### State Methods

- **`isVisible()`** - Check visibility
- **`isChecked()`** - Check checkbox state
- **`inputValue()`** - Get input value
- **`textContent()`** - Get text content
- **`innerText()`** - Get visible text
- **`innerHtml()`** - Get HTML content

### Selection Methods

- **`count()`** - Count matching elements
- **`nth(index)`** - Select by index
- **`first()`** - Get first element

### Utility Methods

- **`highlight(options?)`** - Highlight element
- **`centroid()`** - Get center coordinates
- **`backendNodeId()`** - Get DOM node ID
- **`sendClickEvent(options?)`** - Dispatch click event

All methods work identically to `Locator`, but automatically resolve the correct frame before executing.

## Code Examples

<Tabs>
<Tab title="Basic Iframe Traversal">

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

// Initialize with Browserbase (API key and project ID from environment variables)
// Set BROWSERBASE_API_KEY and BROWSERBASE_PROJECT_ID in your environment
const stagehand = new Stagehand({ env: "BROWSERBASE" });
await stagehand.init();
const page = stagehand.context.pages()[0];

await page.goto("https://example.com");

// Click button inside iframe
const button = page.deepLocator("iframe#widget >> button.submit");
await button.click();

// Fill input in nested iframe
const input = page.deepLocator("iframe#outer >> iframe#inner >> input#email");
await input.fill("user@example.com");

await stagehand.close();
```

</Tab>
<Tab title="Multiple Iframes">

```typescript
// Three-level iframe nesting
await page.deepLocator(
  "iframe#level1 >> iframe#level2 >> iframe#level3 >> div.target"
).click();

// Different selectors at each level
await page.deepLocator(
  "iframe.container >> #payment-frame >> input[name=cardNumber]"
).fill("4111111111111111");

// Mixed CSS and XPath
await page.deepLocator(
  "iframe.widget >> xpath=//button[contains(text(), 'Submit')]"
).click();
```

</Tab>
<Tab title="Deep XPath">

```typescript
// Simple iframe traversal with XPath
const content = page.deepLocator("//iframe//div[@class='content']");
const text = await content.textContent();

// Multiple iframe levels
const button = page.deepLocator(
  "//iframe[@id='outer']//iframe[@class='inner']//button"
);
await button.click();

// XPath with predicates
const input = page.deepLocator(
  "//iframe[1]//form[@id='myform']//input[@type='text'][1]"
);
await input.fill("test value");
```

</Tab>
<Tab title="Element Selection">

```typescript
// Count elements across iframes
const buttons = page.deepLocator("iframe#widget >> button");
const count = await buttons.count();
console.log(`Found ${count} buttons in iframe`);

// Select specific element
const firstButton = buttons.first();
await firstButton.click();

const thirdButton = buttons.nth(2);
await thirdButton.click();

// Get text from all elements
for (let i = 0; i < count; i++) {
  const btn = buttons.nth(i);
  const text = await btn.innerText();
  console.log(`Button ${i}:`, text);
}
```

</Tab>
<Tab title="Payment Forms">

```typescript
// Common use case: payment iframe
const paymentFrame = "iframe#stripe-payment-element";

// Fill card details
await page.deepLocator(`${paymentFrame} >> input[name="cardnumber"]`)
  .fill("4242424242424242");

await page.deepLocator(`${paymentFrame} >> input[name="exp-date"]`)
  .fill("12/25");

await page.deepLocator(`${paymentFrame} >> input[name="cvc"]`)
  .fill("123");

await page.deepLocator(`${paymentFrame} >> input[name="postal"]`)
  .fill("12345");

// Submit
await page.deepLocator(`${paymentFrame} >> button[type="submit"]`)
  .click();
```

</Tab>
<Tab title="State Checks">

```typescript
// Check visibility across iframe
const modal = page.deepLocator("iframe#app >> .modal");
if (await modal.isVisible()) {
  console.log("Modal is visible in iframe");
}

// Get values from iframe inputs
const email = page.deepLocator("iframe#form >> input#email");
const value = await email.inputValue();
console.log("Email value:", value);

// Check checkbox in iframe
const checkbox = page.deepLocator("iframe#settings >> input#subscribe");
const checked = await checkbox.isChecked();
console.log("Subscribed:", checked);

// Highlight element in iframe for debugging
await page.deepLocator("iframe#widget >> .error-message")
  .highlight({ durationMs: 2000 });
```

</Tab>
</Tabs>

## Comparison with Standard Locator

### Standard Locator (Single Frame)

```typescript
// Only works in the main frame
const button = page.locator("button.submit");
await button.click();

// Cannot access elements inside iframes
const iframeButton = page.locator("iframe >> button"); // ❌ Won't work
```

### Deep Locator (Cross-Frame)

```typescript
// Works across iframe boundaries
const button = page.deepLocator("iframe#widget >> button.submit");
await button.click(); // ✅ Automatically traverses into iframe

// Can handle nested iframes
const nested = page.deepLocator("iframe#a >> iframe#b >> button");
await nested.click(); // ✅ Handles multiple levels
```

## When to Use deepLocator

Use `deepLocator()` when:

1. **Targeting elements inside iframes** - Payment forms, embedded widgets, third-party content
2. **Working with nested iframes** - Multiple levels of iframe nesting
3. **XPath crosses iframe boundaries** - When XPath naturally includes iframe steps
4. **Simpler syntax preferred** - Use `>>` instead of manual frame switching

Use standard `locator()` when:

1. **Elements are in main frame** - No iframe traversal needed
2. **Performance is critical** - The standard locator is slightly faster (no frame resolution)
3. **Working with frame references** - You already have the frame object

## Best Practices

1. **Use specific selectors** - Make each segment unique to avoid ambiguity
2. **Keep hop chains short** - Simpler is better for maintainability
3. **Name your iframes** - Use IDs or classes on iframes for easier targeting
4. **Test incrementally** - Verify each segment works before adding more
5. **Cache selectors** - Store complex selectors in variables for reuse
6. **Use highlight() for debugging** - Verify you're targeting the right element

## Common Patterns

### Named Iframe References

```typescript
// Define iframe selectors
const PAYMENT_FRAME = "iframe#stripe-payment";
const WIDGET_FRAME = "iframe.embedded-widget";

// Use in deep locators
await page.deepLocator(`${PAYMENT_FRAME} >> input#card`).fill("4242");
await page.deepLocator(`${WIDGET_FRAME} >> button`).click();
```

### Conditional Iframe Interaction

```typescript
const errorInIframe = page.deepLocator("iframe#form >> .error-message");
if (await errorInIframe.isVisible()) {
  const errorText = await errorInIframe.textContent();
  console.error("Form error:", errorText);
}
```

### Dynamic Frame Selection

```typescript
// Select iframe by attribute
const frameSelector = `iframe[data-widget-id="${widgetId}"]`;
const button = page.deepLocator(`${frameSelector} >> button.action`);
await button.click();
```

## Error Handling

Deep locator operations may throw:

- **Element not found** - Selector doesn't match in the target frame
- **Frame not found** - Iframe selector doesn't resolve
- **Timeout errors** - Frame or element resolution timed out
- **Invalid selector** - Malformed selector syntax

Handle errors appropriately:

```typescript
try {
  await page.deepLocator("iframe#widget >> button").click();
} catch (error) {
  console.error("Deep locator failed:", error.message);
  // Fallback or retry logic
}
```

## Advanced Usage

### Combining with Page Methods

```typescript
// Navigate then use deep locator
await page.goto("https://example.com");
await page.waitForLoadState("networkidle");

const iframeButton = page.deepLocator("iframe#app >> button");
await iframeButton.click();
```

### With AI-Powered Methods

```typescript
// Use observe to find elements in iframes
const actions = await stagehand.observe("find buttons in the payment iframe");

// Then use deep locator for precise interaction
await page.deepLocator("iframe#payment >> button.submit").click();
```

## Technical Details

### How It Works

1. **Parse selector** - Splits on `>>` or parses XPath for iframe steps
2. **Build frame chain** - Creates FrameLocator chain for each iframe segment
3. **Resolve final frame** - Navigates through frames to find target frame
4. **Create locator** - Returns a locator in the correct frame context
5. **Lazy execution** - Frame resolution happens fresh on each action

### Frame Resolution

Deep locators use the internal `FrameLocator` and `resolveLocatorWithHops` logic to:

- Track frame hierarchies
- Handle OOPIF (out-of-process iframes)
- Support shadow DOM piercing
- Maintain frame references during navigation

## Type Definitions

```typescript
interface DeepLocatorDelegate {
  // Actions
  click(options?: { button?: MouseButton; clickCount?: number }): Promise<void>;
  fill(value: string): Promise<void>;
  type(text: string, options?: { delay?: number }): Promise<void>;
  hover(): Promise<void>;
  selectOption(values: string | string[]): Promise<string[]>;
  scrollTo(percent: number | string): Promise<void>;

  // State
  isVisible(): Promise<boolean>;
  isChecked(): Promise<boolean>;
  inputValue(): Promise<string>;
  textContent(): Promise<string>;
  innerText(): Promise<string>;
  innerHtml(): Promise<string>;

  // Selection
  count(): Promise<number>;
  nth(index: number): DeepLocatorDelegate;
  first(): DeepLocatorDelegate;

  // Utilities
  highlight(options?: HighlightOptions): Promise<void>;
  centroid(): Promise<{ x: number; y: number }>;
  backendNodeId(): Promise<BackendNodeId>;
  sendClickEvent(options?: EventOptions): Promise<void>;
}
```


================================================
FILE: packages/docs/v3/references/extract.mdx
================================================
---
title: extract()
description: 'Complete API reference for the extract() method'
icon: 'ufo-beam'
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


<CardGroup cols={1}>
<Card title="Extract" icon="ufo-beam" href="/v3/basics/extract">
  See how to use extract() to extract structured data from web pages
</Card>
</CardGroup>

### Method Signatures

<Tabs>
<Tab title="TypeScript">

```typescript
// No parameters (raw page content)
await stagehand.extract(): Promise<{ pageText: string }>

// Options only (for example, for targeted extraction)
await stagehand.extract(options: ExtractOptions): Promise<{ pageText: string }>

// String instruction only
await stagehand.extract(instruction: string): Promise<{ extraction: string }>

// With schema
await stagehand.extract<T extends ZodTypeAny>(
  instruction: string,
  schema: T,
  options?: ExtractOptions
): Promise<z.infer<T>>
```

**ExtractOptions Interface:**
```typescript
interface ExtractOptions {
  model?: ModelConfiguration;
  timeout?: number;
  selector?: string;
  page?: PlaywrightPage | PuppeteerPage | PatchrightPage | Page;
  serverCache?: boolean;
}

// ModelConfiguration can be either a string or an object
type ModelConfiguration =
  | string  // Format: "provider/model" (e.g., "openai/gpt-5-mini", "anthropic/claude-sonnet-4-5")
  | {
      modelName: string;  // The model name
      apiKey?: string;    // Optional: API key override
      baseURL?: string;   // Optional: Base URL override
      // Additional provider-specific options
    }
```

</Tab>

</Tabs>

### Parameters

<ParamField path="instruction" type="string" optional>
  Natural language description of what data to extract. If both `instruction` and `schema` are omitted, `extract()` returns the raw page text.
</ParamField>

<ParamField path="schema" type="ZodTypeAny" optional>
  Zod schema defining the structure of data to extract. Ensures type safety and validation. The return type is automatically inferred from the schema.
</ParamField>

<ParamField path="model" type="ModelConfiguration" optional>
  Configure the AI model to use for this extraction. Can be either:
  - A string in the format `"provider/model"` (e.g., `openai/gpt-5`, `google/gemini-2.5-flash`)
  - An object with detailed configuration

  <Expandable title="Model Configuration Object">
    <ParamField path="modelName" type="string" required>
      The model name (e.g., `anthropic/claude-sonnet-4-5`, `google/gemini-2.5-flash`)
    </ParamField>
    <ParamField path="apiKey" type="string" optional>
      API key for the model provider (overrides default)
    </ParamField>
    <ParamField path="baseURL" type="string" optional>
      Base URL for the API endpoint (for custom endpoints or proxies)
    </ParamField>
  </Expandable>
</ParamField>

<ParamField path="timeout" type="number" optional>
  Maximum time in milliseconds to wait for the extraction to complete. Default varies by configuration.
</ParamField>

<ParamField path="selector" type="string" optional>
  Optional selector (XPath, CSS selector, etc.) to limit extraction scope to a specific part of the page. Reduces token usage and improves accuracy.
</ParamField>

<ParamField path="page" type="PlaywrightPage | PuppeteerPage | PatchrightPage | Page" optional>
  Optional: Specify which page to perform the extraction on. Supports multiple browser automation libraries:
  - **Playwright**: Native Playwright Page objects
  - **Puppeteer**: Puppeteer Page objects
  - **Patchright**: Patchright Page objects
  - **Stagehand Page**: Stagehand's wrapped Page object

  If not specified, defaults to the current "active" page in your Stagehand instance.
</ParamField>

<ParamField path="serverCache" type="boolean" optional>
  Override the instance-level `serverCache` setting for this request. When `true`, enables server-side caching. When `false`, disables it.

  <Note>Only applies when `env` is `"BROWSERBASE"`. Has no effect in local environments.</Note>

  Defaults to the value set on the Stagehand constructor (which itself defaults to `true`).
</ParamField>

### Built-in Support

<Note>
**Iframe and Shadow DOM interactions are supported out of the box.** Stagehand automatically handles iframe traversal and shadow DOM elements without requiring additional configuration or flags.
</Note>

### Response Types

<Tabs>
<Tab title="With Schema">
**Returns:** `Promise<z.infer<T> & { cacheStatus?: "HIT" | "MISS" }>` where T is your schema

The returned object will be strictly typed according to your Zod schema definition. The optional `cacheStatus` field indicates whether the result was served from the server-side cache (`"HIT"`) or computed fresh (`"MISS"`). It is only present when running with `env: "BROWSERBASE"` and with server-side caching enabled.
</Tab>

<Tab title="String Only">
**Returns:** `Promise<{ extraction: string; cacheStatus?: "HIT" | "MISS" }>`

`extraction`: Simple string extraction without schema validation. The optional `cacheStatus` field indicates cache hit or miss when using Browserbase with server-side caching.
</Tab>

<Tab title="No Parameters">
**Returns:** `Promise<{ pageText: string }>`

`pageText`: Raw accessibility tree representation of page content.
</Tab>
</Tabs>

### Code Examples

<Tabs>
<Tab title="Single Object">

```typescript
import { Stagehand } from "@browserbasehq/stagehand";
import { z } from 'zod';

// Initialize with Browserbase (API key and project ID from environment variables)
// Set BROWSERBASE_API_KEY and BROWSERBASE_PROJECT_ID in your environment
const stagehand = new Stagehand({ env: "BROWSERBASE" });
await stagehand.init();
const page = stagehand.context.pages()[0];

await page.goto("https://example.com/product");

// Schema definition
const ProductSchema = z.object({
  name: z.string(),
  price: z.number(),
  inStock: z.boolean()
});

// Extraction with v3 API
const product = await stagehand.extract(
  "extract product details", 
  ProductSchema
);
```

#### Example Response
```json
{
  "name": "Product Name",
  "price": 100,
  "inStock": true
}
```

</Tab>
<Tab title="Arrays">

```typescript
import { z } from 'zod';

// Schema definition
const ApartmentListingsSchema = z.array(
  z.object({
    address: z.string(),
    price: z.string(),
    bedrooms: z.number()
  })
);

// Extraction with v3 API
const listings = await stagehand.extract(
  "extract all apartment listings",
  ApartmentListingsSchema
);
```

#### Example Response
```json
[
  {
    "address": "123 Main St",
    "price": "$100,000",
    "bedrooms": 3
  },
  {
    "address": "456 Elm St",
    "price": "$150,000",
    "bedrooms": 2
  }
]
```

</Tab>
<Tab title="URLs">

```typescript
import { z } from 'zod';

// Schema definition
const NavigationSchema = z.object({
  links: z.array(z.object({
    text: z.string(),
    url: z.string().url()  // URL validation
  }))
});

// Extraction with v3 API
const links = await stagehand.extract(
  "extract navigation links",
  NavigationSchema
);
```

#### Example Response
```json
{
  "links": [
    {
      "text": "Home",
      "url": "https://example.com"
    }
  ]
}
```

</Tab>
<Tab title="Scoped">

```typescript
import { z } from 'zod';

const ProductSchema = z.object({
  name: z.string(),
  price: z.number(),
  description: z.string()
});

// Extract from specific page section with v3 API
const data = await stagehand.extract(
  "extract product info from this section",
  ProductSchema,
  { selector: "/html/body/div/div" }
);
```

#### Example Response
```json
{
  "name": "Product Name",
  "price": 100,
  "description": "Product description"
}
```

</Tab>
<Tab title="Schema-less">

```typescript
// String only extraction
const title = await stagehand.extract("get the page title");
// Returns: { extraction: "Page Title" }

// Raw page content
const content = await stagehand.extract();
// Returns: { pageText: "Accessibility Tree: ..." }
```

#### Example Response
```json
{
  "extraction": "Page Title"
}
```

</Tab>
<Tab title="Advanced">

```typescript
import { z } from 'zod';

// Schema with descriptions and validation
const ProductSchema = z.object({
  price: z.number().describe("Product price in USD"),
  rating: z.number().min(0).max(5).describe("Customer rating out of 5"),
  available: z.boolean().describe("Whether product is in stock"),
  tags: z.array(z.string()).optional()
});

// Nested schema
const EcommerceSchema = z.object({
  product: z.object({
    name: z.string(),
    price: z.object({
      current: z.number(),
      original: z.number().optional()
    })
  }),
  reviews: z.array(z.object({
    rating: z.number(),
    comment: z.string()
  }))
});
```

#### Example Response
```json
{
  "product": {
    "name": "Product Name",
    "price": {
      "current": 100,
      "original": 120
    }
  },
  "reviews": [
    {
      "rating": 4,
      "comment": "Great product!"
    }
  ]
}
```

</Tab>
</Tabs>

### Additional Examples

<Tabs>
<Tab title="Custom Model">

```typescript
import { z } from 'zod';

const DataSchema = z.object({
  title: z.string(),
  content: z.string()
});

// Using string format
const data1 = await stagehand.extract(
  "extract article data",
  DataSchema,
  { model: "openai/gpt-5-mini" }
);

// Using object format with custom configuration
const data2 = await stagehand.extract(
  "extract article data",
  DataSchema,
  {
    model: {
      modelName: "anthropic/claude-sonnet-4-6",
      apiKey: process.env.ANTHROPIC_API_KEY
    }
  }
);
```

</Tab>
<Tab title="Multi-Page">

```typescript
import { z } from 'zod';

const page1 = stagehand.context.pages()[0];
const page2 = await stagehand.context.newPage();

const Schema = z.object({ title: z.string() });

const data1 = await stagehand.extract("get title", Schema, { page: page1 });
const data2 = await stagehand.extract("get title", Schema, { page: page2 });
```

</Tab>
</Tabs>

### Error Types

The following errors may be thrown by the `extract()` method:

- **StagehandError** - Base class for all Stagehand-specific errors
- **ZodSchemaValidationError** - Extracted data does not match the provided Zod schema
- **StagehandDomProcessError** - Error occurred while processing the DOM
- **StagehandEvalError** - Error occurred while evaluating JavaScript in the page context
- **StagehandIframeError** - Unable to resolve iframe for the target element
- **ContentFrameNotFoundError** - Unable to obtain content frame for the selector
- **XPathResolutionError** - XPath does not resolve in the current page or frames
- **StagehandShadowRootMissingError** - No shadow root present on the resolved host element
- **LLMResponseError** - Error in LLM response processing
- **MissingLLMConfigurationError** - No LLM API key or client configured
- **UnsupportedModelError** - The specified model is not supported for this operation
- **InvalidAISDKModelFormatError** - Model string does not follow the required `provider/model` format

================================================
FILE: packages/docs/v3/references/locator.mdx
================================================
---
title: locator
description: 'Complete API reference for the Locator class'
icon: 'crosshairs'
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


<CardGroup cols={1}>
<Card title="Page" icon="browser" href="/v3/references/page">
  Learn about the Page object that creates locators
</Card>
</CardGroup>

## Overview

The `Locator` class provides precise element interaction capabilities. It resolves CSS or XPath selectors within a frame and performs low-level actions using Chrome DevTools Protocol (CDP).

Create a locator through the page object:

```typescript
const stagehand = new Stagehand({ env: "LOCAL" });
await stagehand.init();
const page = stagehand.context.pages()[0];

// Create a locator
const button = page.locator("button.submit");
await button.click();
```

## Key Features

- **Lazy resolution** - Selectors are resolved fresh on each action
- **Isolated execution** - Runs in an isolated world, separate from page scripts
- **CDP-based** - Uses Chrome DevTools Protocol for reliable interactions
- **Automatic cleanup** - Releases remote objects automatically
- **Iframe support** - Works seamlessly with iframes and shadow DOM

## Interaction Methods

### click()

Click the element at its visual center.

```typescript
await locator.click(options?: ClickOptions): Promise<void>
```

<ParamField path="button" type='"left" | "right" | "middle"' optional>
  Mouse button to use for the click.

  **Default:** `"left"`
</ParamField>

<ParamField path="clickCount" type="number" optional>
  Number of consecutive clicks (for double-click, triple-click).

  **Default:** `1`
</ParamField>

The method:
1. Scrolls element into view
2. Gets element geometry
3. Moves mouse to center
4. Dispatches mousePressed and mouseReleased events

### fill()

Fill an input, textarea, or contenteditable element.

```typescript
await locator.fill(value: string): Promise<void>
```

<ParamField path="value" type="string" required>
  The text value to fill into the element.
</ParamField>

The method intelligently handles different input types:
- Uses native value setter for special inputs (date, number, etc.)
- Types text character-by-character for regular inputs
- Clears existing content before filling

### type()

Type text into the element with optional delay between keystrokes.

```typescript
await locator.type(text: string, options?: TypeOptions): Promise<void>
```

<ParamField path="text" type="string" required>
  The text to type.
</ParamField>

<ParamField path="delay" type="number" optional>
  Delay in milliseconds between each keystroke.

  If not specified, uses `Input.insertText` for efficiency.
</ParamField>

### hover()

Move the mouse cursor to the element's center without clicking.

```typescript
await locator.hover(): Promise<void>
```

Scrolls the element into view and dispatches a mouse move event.

### selectOption()

Select one or more options in a `<select>` element.

```typescript
await locator.selectOption(values: string | string[]): Promise<string[]>
```

<ParamField path="values" type="string | string[]" required>
  Option value(s) to select. For multi-select elements, pass an array.
</ParamField>

**Returns:** `Promise<string[]>` - Array of values that were actually selected.

### setInputFiles()

Set files on an `<input type="file">` element.

```typescript
await locator.setInputFiles(files: FileInput): Promise<void>
```

<ParamField path="files" type="string | string[] | FilePayload | FilePayload[]" required>
  File paths or file payloads to upload.

  **File Path:** Absolute or relative path to a file

  **File Payload:** Object with `{ name, mimeType, buffer }`
</ParamField>

**FilePayload Interface:**
```typescript
interface FilePayload {
  name: string;
  mimeType: string;
  buffer: ArrayBuffer | Uint8Array | Buffer | string;
}
```

Pass an empty array to clear the file selection.

## State Methods

### isVisible()

Check if the element is visible.

```typescript
await locator.isVisible(): Promise<boolean>
```

**Returns:** `Promise<boolean>` - `true` if element is attached and visible.

### isChecked()

Check if a checkbox or radio button is checked.

```typescript
await locator.isChecked(): Promise<boolean>
```

**Returns:** `Promise<boolean>` - `true` if checked. Also considers `aria-checked` for ARIA widgets.

### inputValue()

Get the current value of an input element.

```typescript
await locator.inputValue(): Promise<string>
```

**Returns:** `Promise<string>` - The element's input value.

Works with: `<input>`, `<textarea>`, `<select>`, contenteditable elements.

### textContent()

Get the element's text content (raw).

```typescript
await locator.textContent(): Promise<string>
```

**Returns:** `Promise<string>` - The element's `textContent` property.

### innerText()

Get the element's visible text (layout-aware).

```typescript
await locator.innerText(): Promise<string>
```

**Returns:** `Promise<string>` - The element's `innerText` property.

### innerHtml()

Get the element's HTML content.

```typescript
await locator.innerHtml(): Promise<string>
```

**Returns:** `Promise<string>` - The element's `innerHTML` property.

## Selection Methods

### count()

Get the number of elements matching the selector.

```typescript
await locator.count(): Promise<number>
```

**Returns:** `Promise<number>` - Count of matching elements.

### nth()

Get a locator for the element at a specific index.

```typescript
locator.nth(index: number): Locator
```

<ParamField path="index" type="number" required>
  Zero-based index of the element to select.
</ParamField>

**Returns:** `Locator` - New locator targeting the nth element.

```typescript
// Get the third button
const thirdButton = page.locator("button").nth(2);
await thirdButton.click();
```

### first()

Get a locator for the first matching element.

```typescript
locator.first(): Locator
```

**Returns:** `Locator` - The same locator (querySelector already returns the first match).

## Utility Methods

### highlight()

Visually highlight the element with an overlay.

```typescript
await locator.highlight(options?: HighlightOptions): Promise<void>
```

<ParamField path="durationMs" type="number" optional>
  How long to display the highlight in milliseconds.

  **Default:** `800`
</ParamField>

<ParamField path="borderColor" type="{ r, g, b, a? }" optional>
  Border color as RGBA. `r`, `g`, and `b` range from 0-255; the optional alpha `a` ranges from 0-1.

  **Default:** `{ r: 255, g: 0, b: 0, a: 0.9 }` (red)
</ParamField>

<ParamField path="contentColor" type="{ r, g, b, a? }" optional>
  Content fill color as RGBA. `r`, `g`, and `b` range from 0-255; the optional alpha `a` ranges from 0-1.

  **Default:** `{ r: 255, g: 200, b: 0, a: 0.2 }` (yellow)
</ParamField>

Useful for debugging and visual verification.

### scrollTo()

Scroll the element to a specific position.

```typescript
await locator.scrollTo(percent: number | string): Promise<void>
```

<ParamField path="percent" type="number | string" required>
  Scroll position as percentage (0-100).
</ParamField>

For `<html>` or `<body>` elements, scrolls the window. Otherwise, scrolls the element itself.

### centroid()

Get the center coordinates of the element.

```typescript
await locator.centroid(): Promise<{ x: number; y: number }>
```

**Returns:** `Promise<{ x, y }>` - Center point in CSS pixels.

### backendNodeId()

Get the DOM backend node ID for the element.

```typescript
await locator.backendNodeId(): Promise<BackendNodeId>
```

**Returns:** `Promise<BackendNodeId>` - Unique identifier for the DOM node.

Useful for identity comparisons without maintaining element handles.

### sendClickEvent()

Dispatch a DOM click event directly on the element.

```typescript
await locator.sendClickEvent(options?: EventOptions): Promise<void>
```

<ParamField path="bubbles" type="boolean" optional>
  Whether the event bubbles.

  **Default:** `true`
</ParamField>

<ParamField path="cancelable" type="boolean" optional>
  Whether the event is cancelable.

  **Default:** `true`
</ParamField>

<ParamField path="composed" type="boolean" optional>
  Whether the event crosses shadow DOM boundaries.

  **Default:** `true`
</ParamField>

<ParamField path="detail" type="number" optional>
  Click count detail.

  **Default:** `1`
</ParamField>

This dispatches an event directly without synthesizing real pointer input. Useful for elements that rely on click handlers without needing hit-testing.

## Code Examples

<Tabs>
<Tab title="Basic Interaction">

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

// Initialize with Browserbase (API key and project ID from environment variables)
// Set BROWSERBASE_API_KEY and BROWSERBASE_PROJECT_ID in your environment
const stagehand = new Stagehand({ env: "BROWSERBASE" });
await stagehand.init();
const page = stagehand.context.pages()[0];

await page.goto("https://example.com");

// Click a button
const submitButton = page.locator("button[type=submit]");
await submitButton.click();

// Fill an input
const emailInput = page.locator("input[name=email]");
await emailInput.fill("user@example.com");

// Type with delay
const searchBox = page.locator("input[type=search]");
await searchBox.type("stagehand", { delay: 100 });

await stagehand.close();
```

</Tab>
<Tab title="Forms">

```typescript
// Fill multiple form fields
const form = page.locator("form#login");

await page.locator("#username").fill("myuser");
await page.locator("#password").fill("mypass");

// Select from dropdown
await page.locator("select#country").selectOption("US");

// Multi-select
await page.locator("select#skills").selectOption(["js", "ts", "react"]);

// Check checkbox
const termsCheckbox = page.locator("input#terms");
const isChecked = await termsCheckbox.isChecked();
if (!isChecked) {
  await termsCheckbox.click();
}

// Submit
await page.locator("button[type=submit]").click();
```

</Tab>
<Tab title="File Upload">

```typescript
// Upload from file path
const fileInput = page.locator("input[type=file]");
await fileInput.setInputFiles("/path/to/document.pdf");

// Upload multiple files
await fileInput.setInputFiles([
  "/path/to/image1.jpg",
  "/path/to/image2.jpg"
]);

// Upload from buffer
await fileInput.setInputFiles({
  name: "data.json",
  mimeType: "application/json",
  buffer: JSON.stringify({ key: "value" })
});

// Clear file selection
await fileInput.setInputFiles([]);
```

</Tab>
<Tab title="Element Selection">

```typescript
// Count elements
const buttons = page.locator("button");
const count = await buttons.count();
console.log(`Found ${count} buttons`);

// Click the first button
await buttons.first().click();

// Click the third button
await buttons.nth(2).click();

// Iterate with nth
for (let i = 0; i < count; i++) {
  const button = buttons.nth(i);
  const text = await button.innerText();
  console.log(`Button ${i}: ${text}`);
}
```

</Tab>
<Tab title="State Checks">

```typescript
// Check visibility
const modal = page.locator(".modal");
if (await modal.isVisible()) {
  console.log("Modal is visible");
}

// Check checkbox state
const checkbox = page.locator("input#subscribe");
const checked = await checkbox.isChecked();
console.log("Subscribed:", checked);

// Get input value
const email = page.locator("input#email");
const value = await email.inputValue();
console.log("Email:", value);

// Get text content
const heading = page.locator("h1");
const text = await heading.textContent();
console.log("Heading:", text);
```

</Tab>
<Tab title="Advanced Actions">

```typescript
// Hover to reveal menu
const menuButton = page.locator("button.menu");
await menuButton.hover();

// Wait for submenu
await page.waitForLoadState("networkidle");

// Click submenu item
await page.locator("a.submenu-item").click();

// Highlight for debugging
await page.locator("div.error").highlight({
  durationMs: 2000,
  borderColor: { r: 255, g: 0, b: 0 },
  contentColor: { r: 255, g: 0, b: 0, a: 0.1 }
});

// Scroll element into position
const section = page.locator("#section-3");
await section.scrollTo(50); // Scroll to 50%

// Get element position
const { x, y } = await section.centroid();
console.log(`Element center: ${x}, ${y}`);
```

</Tab>
</Tabs>

## Selector Support

Locators support both CSS and XPath selectors:

### CSS Selectors

```typescript
page.locator("button");                    // Tag
page.locator(".submit-btn");              // Class
page.locator("#login-form");              // ID
page.locator("button.primary");           // Tag + class
page.locator("input[type=email]");        // Attribute
page.locator("div > p");                  // Child
page.locator("h1 + p");                   // Adjacent sibling
page.locator("div.container button");     // Descendant
```

### XPath Selectors

```typescript
page.locator("//button");                               // Tag
page.locator("//button[@class='submit']");             // Attribute
page.locator("//div[@id='content']//p");               // Descendant
page.locator("//button[contains(text(), 'Submit')]");  // Text content
page.locator("(//button)[1]");                         // First button
page.locator("//input[@type='text'][1]");              // First text input
```

## Best Practices

1. **Use specific selectors** - Prefer IDs or unique attributes over generic selectors
2. **Chain with nth()** - Use `locator().nth()` instead of putting index in selector
3. **Check state before action** - Use `isVisible()`, `isChecked()` for conditional logic
4. **Let locators auto-resolve** - Don't store element handles; use locators, which re-resolve the selector on each action
5. **Use fill() for inputs** - Prefer `fill()` over `click()` + `type()` for better reliability
6. **Handle file uploads properly** - Use absolute paths or buffer payloads for `setInputFiles()`
7. **Highlight for debugging** - Use `highlight()` during development to verify targeting

## Common Patterns

### Conditional Interaction

```typescript
const errorMessage = page.locator(".error-message");
if (await errorMessage.isVisible()) {
  const text = await errorMessage.textContent();
  console.log("Error:", text);
}
```

### Wait and Interact

```typescript
// Locators automatically wait during actions
const dynamicButton = page.locator("button.dynamic");
await dynamicButton.click(); // Waits for element to exist
```

### Loop Through Elements

```typescript
const items = page.locator("li.item");
const count = await items.count();

for (let i = 0; i < count; i++) {
  const item = items.nth(i);
  const text = await item.innerText();
  console.log(`Item ${i}:`, text);
}
```

## Error Handling

Locator methods may throw the following errors:

- **Element not found** - Selector doesn't match any elements
- **Element not visible** - Element exists but is not visible (for actions requiring visibility)
- **Invalid selector** - Malformed CSS or XPath selector
- **Timeout errors** - Operation exceeded timeout limits
- **CDP errors** - Chrome DevTools Protocol communication errors

Handle errors appropriately:

```typescript
try {
  await page.locator("button.submit").click();
} catch (error) {
  console.error("Click failed:", error instanceof Error ? error.message : error);
}
```

## Type Definitions

```typescript
interface Locator {
  // Actions
  click(options?: { button?: MouseButton; clickCount?: number }): Promise<void>;
  fill(value: string): Promise<void>;
  type(text: string, options?: { delay?: number }): Promise<void>;
  hover(): Promise<void>;
  selectOption(values: string | string[]): Promise<string[]>;
  setInputFiles(files: FileInput): Promise<void>;

  // State
  isVisible(): Promise<boolean>;
  isChecked(): Promise<boolean>;
  inputValue(): Promise<string>;
  textContent(): Promise<string>;
  innerText(): Promise<string>;
  innerHtml(): Promise<string>;

  // Selection
  count(): Promise<number>;
  nth(index: number): Locator;
  first(): Locator;

  // Utilities
  highlight(options?: HighlightOptions): Promise<void>;
  scrollTo(percent: number | string): Promise<void>;
  centroid(): Promise<{ x: number; y: number }>;
  backendNodeId(): Promise<BackendNodeId>;
  sendClickEvent(options?: EventOptions): Promise<void>;
}
```


================================================
FILE: packages/docs/v3/references/observe.mdx
================================================
---
title: observe()
description: 'Complete API reference for the observe() method'
icon: 'magnifying-glass'
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


<CardGroup cols={1}>
<Card title="Observe" icon="magnifying-glass" href="/v3/basics/observe">
  See how to use observe() to discover actionable elements and analyze web page structure
</Card>
</CardGroup>

### Method Signatures

<Tabs>
<Tab title="TypeScript">

```typescript
// String instruction only
await stagehand.observe(instruction: string): Promise<Action[]>

// String instruction with options
await stagehand.observe(instruction: string, options: ObserveOptions): Promise<Action[]>
```

**ObserveOptions Interface:**
```typescript
interface ObserveOptions {
  model?: ModelConfiguration;
  timeout?: number;
  selector?: string;
  page?: PlaywrightPage | PuppeteerPage | PatchrightPage | Page;
  serverCache?: boolean;
}

// ModelConfiguration can be either a string or an object
type ModelConfiguration =
  | string  // Format: "provider/model" (e.g., "openai/gpt-4o", "anthropic/claude-sonnet-4-6")
  | {
      modelName: string;  // The model name
      apiKey?: string;    // Optional: API key override
      baseURL?: string;   // Optional: Base URL override
      // Additional provider-specific options
    }
```

</Tab>

</Tabs>

### Parameters

<ParamField path="instruction" type="string" optional>
  Natural language description of elements or actions to discover. If not provided, defaults to finding all interactive elements on the page.
</ParamField>

<ParamField path="model" type="ModelConfiguration" optional>
  Configure the AI model to use for this observation. Can be either:
  - A string in the format `"provider/model"` (e.g., `"openai/gpt-4o"`, `"anthropic/claude-sonnet-4-6"`)
  - An object with detailed configuration

  <Expandable title="Model Configuration Object">
    <ParamField path="modelName" type="string" required>
      The model name (e.g., "gpt-4o", "claude-sonnet-4-6", "gemini-2.5-flash")
    </ParamField>
    <ParamField path="apiKey" type="string" optional>
      API key for the model provider (overrides default)
    </ParamField>
    <ParamField path="baseURL" type="string" optional>
      Base URL for the API endpoint (for custom endpoints or proxies)
    </ParamField>
  </Expandable>
</ParamField>

<ParamField path="timeout" type="number" optional>
  Maximum time in milliseconds to wait for the observation to complete. Default varies by configuration.
</ParamField>

<ParamField path="selector" type="string" optional>
  Optional XPath selector to focus the observation on a specific part of the page. Useful for narrowing down the search area.
</ParamField>

<ParamField path="page" type="PlaywrightPage | PuppeteerPage | PatchrightPage | Page" optional>
  Optional: Specify which page to perform the observation on. Supports multiple browser automation libraries:
  - **Playwright**: Native Playwright Page objects
  - **Puppeteer**: Puppeteer Page objects
  - **Patchright**: Patchright Page objects
  - **Stagehand Page**: Stagehand's wrapped Page object

  If not specified, defaults to the current "active" page in your Stagehand instance.
</ParamField>

<ParamField path="serverCache" type="boolean" optional>
  Override the instance-level `serverCache` setting for this request. When `true`, enables server-side caching. When `false`, disables it.

  <Note>Only applies when `env` is `"BROWSERBASE"`. Has no effect in local environments.</Note>

  Defaults to the value set on the Stagehand constructor (which itself defaults to `true`).
</ParamField>

### Returns `Promise<Action[]>`

Array of discovered actionable elements, ordered by relevance.

<ResponseField name="selector" type="string">
  XPath selector that precisely locates the element on the page.
</ResponseField>

<ResponseField name="description" type="string">
  Human-readable description of the element and its purpose.
</ResponseField>

<ResponseField name="method" type="string" optional>
  Suggested interaction method for the element (e.g., `"click"`, `"fill"`, `"type"`).
</ResponseField>

<ResponseField name="arguments" type="string[]" optional>
  Additional parameters for the suggested action, if applicable.
</ResponseField>

**Action Interface:**
```typescript
interface Action {
  selector: string;        // XPath selector to locate element
  description: string;     // Human-readable description
  method?: string;         // Suggested action method
  arguments?: string[];    // Additional action parameters
}
```

**Example Response:**
```json
[
  {
    "selector": "/html/body/div[1]/header/nav/button[1]",
    "description": "Login button in the navigation bar",
    "method": "click",
    "arguments": []
  },
  {
    "selector": "/html/body/main/form/input[1]",
    "description": "Email input field in the login form",
    "method": "fill",
    "arguments": []
  }
]
```

### Built-in Support

<Note>
**Iframe and Shadow DOM interactions are supported out of the box.** Stagehand automatically handles iframe traversal and shadow DOM elements without requiring additional configuration or flags.
</Note>

### Code Examples

<Tabs>
<Tab title="Basic Usage">

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

// Initialize with Browserbase (API key and project ID from environment variables)
// Set BROWSERBASE_API_KEY and BROWSERBASE_PROJECT_ID in your environment
const stagehand = new Stagehand({ env: "BROWSERBASE" });
await stagehand.init();
const page = stagehand.context.pages()[0];

await page.goto("https://example.com");

// Basic element discovery
const buttons = await stagehand.observe("find all clickable buttons");
const formFields = await stagehand.observe("locate form input fields");

// Working with results
const [loginButton] = await stagehand.observe("find the login button");
if (loginButton) {
  console.log("Found:", loginButton.description);
  console.log("Selector:", loginButton.selector);
  await stagehand.act(loginButton); // Execute the action
}
```

</Tab>
<Tab title="Custom Model">

```typescript
// Using string format model
const elements = await stagehand.observe("find important call-to-action buttons", {
  model: "openai/gpt-4o",
  timeout: 45000
});

// Using object format with custom configuration
const actions = await stagehand.observe("find navigation links", {
  model: {
    modelName: "claude-sonnet-4-6",
    apiKey: process.env.ANTHROPIC_API_KEY
  },
  timeout: 30000
});
```

</Tab>
<Tab title="Scoped">

```typescript
// Focus observation on a specific part of the page
const tableActions = await stagehand.observe("find all table rows", {
  selector: "/html/body/main/table"
});
```

</Tab>
<Tab title="Multi-Page">

```typescript
// Observe on specific pages
const page1 = stagehand.context.pages()[0];
const page2 = await stagehand.context.newPage();

const page1Actions = await stagehand.observe("find navigation", { page: page1 });
const page2Actions = await stagehand.observe("find buttons", { page: page2 });
```

</Tab>
<Tab title="Filter Results">

```typescript
const submitButtons = await stagehand.observe("find all submit buttons");
const primarySubmit = submitButtons.find(btn =>
  btn.description.toLowerCase().includes('primary')
);
```

</Tab>
</Tabs>

### Integration Patterns

```typescript
// Observe → Act workflow
const actions = await stagehand.observe("find checkout elements");
for (const action of actions) {
  await stagehand.act(action);
  await page.waitForTimeout(1000);
}

// Observe → Extract workflow
const tables = await stagehand.observe("find data tables");
if (tables.length > 0) {
  const data = await stagehand.extract(
    "extract the table data",
    DataSchema,
    { selector: tables[0].selector }
  );
}

// Element validation
const requiredElements = await stagehand.observe("find the login form");
if (requiredElements.length === 0) {
  throw new Error("Login form not found");
}
```

### Error Types

The following errors may be thrown by the `observe()` method:

- **StagehandError** - Base class for all Stagehand-specific errors
- **StagehandDomProcessError** - Error occurred while processing the DOM
- **StagehandEvalError** - Error occurred while evaluating JavaScript in the page context
- **StagehandIframeError** - Unable to resolve iframe for the target element
- **ContentFrameNotFoundError** - Unable to obtain content frame for the selector
- **XPathResolutionError** - XPath does not resolve in the current page or frames
- **StagehandShadowRootMissingError** - No shadow root present on the resolved host element
- **LLMResponseError** - Error in LLM response processing
- **MissingLLMConfigurationError** - No LLM API key or client configured
- **UnsupportedModelError** - The specified model is not supported for this operation
- **InvalidAISDKModelFormatError** - Model string does not follow the required `provider/model` format


================================================
FILE: packages/docs/v3/references/page.mdx
================================================
---
title: page
description: 'Complete API reference for the Stagehand Page object'
icon: 'page'
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />

<CardGroup cols={1}>
<Card title="Page" icon="browser" href="/v3/references/page">
  Learn about the Stagehand Page object and browser navigation
</Card>
</CardGroup>

## Overview

The `page` object is the main interface for interacting with browser pages in Stagehand. It provides standard browser automation capabilities for navigation, interaction, and page inspection.

Access the page object through your Stagehand instance:

```typescript
const stagehand = new Stagehand({ env: "LOCAL" });
await stagehand.init();
const page = stagehand.context.pages()[0];
```

## Navigation Methods

### goto()

Navigate the page to a URL and wait for a lifecycle state.

```typescript
await page.goto(url: string, options?: GotoOptions): Promise<Response | null>
```

Returns a [Response](/v3/references/response) when the navigation produces a network document request, otherwise `null` (e.g. `data:` URLs or same-document navigations).

<ParamField path="url" type="string" required>
  The URL to navigate to. Can be absolute or relative.
</ParamField>

<ParamField path="waitUntil" type="LoadState" optional>
  When to consider navigation succeeded.

  **Options:**
  - `"load"` - Wait for the load event
  - `"domcontentloaded"` - Wait for DOMContentLoaded event (default)
  - `"networkidle"` - Wait for network to be idle

  **Default:** `"domcontentloaded"`
</ParamField>

<ParamField path="timeoutMs" type="number" optional>
  Maximum time to wait for navigation in milliseconds.

  **Default:** `15000`
</ParamField>

### reload()

Reload the current page.

```typescript
await page.reload(options?: ReloadOptions): Promise<Response | null>
```

Resolves with a [Response](/v3/references/response) for the refreshed document when one is reported, otherwise `null`.

<ParamField path="waitUntil" type="LoadState" optional>
  When to consider reload complete. See `goto()` for options.
</ParamField>

<ParamField path="timeoutMs" type="number" optional>
  Maximum time to wait for reload in milliseconds.

  **Default:** `15000`
</ParamField>

<ParamField path="ignoreCache" type="boolean" optional>
  Whether to bypass the browser cache.

  **Default:** `false`
</ParamField>

### goBack()

Navigate back in browser history.

```typescript
await page.goBack(options?: NavigationOptions): Promise<Response | null>
```

Returns a [Response](/v3/references/response) when the history entry triggers a network fetch; otherwise `null`.

<ParamField path="waitUntil" type="LoadState" optional>
  When to consider navigation complete.
</ParamField>

<ParamField path="timeoutMs" type="number" optional>
  Maximum time to wait in milliseconds.

  **Default:** `15000`
</ParamField>

### goForward()

Navigate forward in browser history.

```typescript
await page.goForward(options?: NavigationOptions): Promise<Response | null>
```

Returns a [Response](/v3/references/response) when the navigation loads a new document from the network; otherwise `null`.

<ParamField path="waitUntil" type="LoadState" optional>
  When to consider navigation complete.
</ParamField>

<ParamField path="timeoutMs" type="number" optional>
  Maximum time to wait in milliseconds.

  **Default:** `15000`
</ParamField>

## Page Information

### url()

Get the current page URL (synchronous).

```typescript
page.url(): string
```

**Returns:** The current page URL as a string.

### title()

Get the current page title.

```typescript
await page.title(): Promise<string>
```

**Returns:** The page title as a string.

## Interaction Methods

### click()

Click at absolute page coordinates.

```typescript
await page.click(x: number, y: number, options?: ClickOptions): Promise<string>
```

**Returns:** A string containing the XPath of the clicked element when `returnXpath` is `true`, otherwise an empty string.

<ParamField path="x" type="number" required>
  X coordinate in CSS pixels.
</ParamField>

<ParamField path="y" type="number" required>
  Y coordinate in CSS pixels.
</ParamField>

<ParamField path="options" type="object" optional>
  Optional click configuration.

  <Expandable title="properties">
    <ParamField path="button" type="string">
      Mouse button to use: `"left"` | `"right"` | `"middle"`

      Default: `"left"`
    </ParamField>

    <ParamField path="clickCount" type="number">
      Number of consecutive clicks.

      Default: `1`
    </ParamField>

    <ParamField path="returnXpath" type="boolean">
      If `true`, the returned string contains the XPath of the clicked element. If `false`, returns an empty string.

      Default: `false`
    </ParamField>
  </Expandable>
</ParamField>

### hover()

Hover at absolute page coordinates without clicking.

```typescript
await page.hover(x: number, y: number, options?: HoverOptions): Promise<string>
```

**Returns:** A string containing the XPath of the hovered element when `returnXpath` is `true`, otherwise an empty string.

<ParamField path="x" type="number" required>
  X coordinate in CSS pixels.
</ParamField>

<ParamField path="y" type="number" required>
  Y coordinate in CSS pixels.
</ParamField>

<ParamField path="options" type="object" optional>
  Optional hover configuration.

  <Expandable title="properties">
    <ParamField path="returnXpath" type="boolean">
      If `true`, the returned string contains the XPath of the hovered element. If `false`, returns an empty string.

      Default: `false`
    </ParamField>
  </Expandable>
</ParamField>

### scroll()

Scroll at absolute page coordinates using mouse wheel events.

```typescript
await page.scroll(x: number, y: number, deltaX: number, deltaY: number, options?: ScrollOptions): Promise<string>
```

**Returns:** A string containing the XPath of the element at the scroll position when `returnXpath` is `true`, otherwise an empty string.

<ParamField path="x" type="number" required>
  X coordinate in CSS pixels where the scroll occurs.
</ParamField>

<ParamField path="y" type="number" required>
  Y coordinate in CSS pixels where the scroll occurs.
</ParamField>

<ParamField path="deltaX" type="number" required>
  Horizontal scroll amount in pixels. Positive values scroll right.
</ParamField>

<ParamField path="deltaY" type="number" required>
  Vertical scroll amount in pixels. Positive values scroll down.
</ParamField>

<ParamField path="options" type="object" optional>
  Optional scroll configuration.

  <Expandable title="properties">
    <ParamField path="returnXpath" type="boolean">
      If `true`, the returned string contains the XPath of the element at the scroll position. If `false`, returns an empty string.

      Default: `false`
    </ParamField>
  </Expandable>
</ParamField>

### dragAndDrop()

Drag from one position to another using mouse events.

```typescript
const [fromXpath, toXpath] = await page.dragAndDrop(fromX, fromY, toX, toY, options?)
```

**Returns:** An array of two strings containing the XPaths of the elements at the start and end positions when `returnXpath` is `true`, otherwise empty strings.

<ParamField path="fromX" type="number" required>
  Starting X coordinate in CSS pixels.
</ParamField>

<ParamField path="fromY" type="number" required>
  Starting Y coordinate in CSS pixels.
</ParamField>

<ParamField path="toX" type="number" required>
  Ending X coordinate in CSS pixels.
</ParamField>

<ParamField path="toY" type="number" required>
  Ending Y coordinate in CSS pixels.
</ParamField>

<ParamField path="options" type="object" optional>
  Optional drag configuration.

  <Expandable title="properties">
    <ParamField path="button" type="string">
      Mouse button to use: `"left"` | `"right"` | `"middle"`

      Default: `"left"`
    </ParamField>

    <ParamField path="steps" type="number">
      Number of intermediate mouse move events during the drag.

      Default: `1`
    </ParamField>

    <ParamField path="delay" type="number">
      Delay in milliseconds between intermediate move events.

      Default: `0`
    </ParamField>

    <ParamField path="returnXpath" type="boolean">
      If `true`, the returned array contains the XPaths of the elements at the start and end positions. If `false`, returns empty strings.

      Default: `false`
    </ParamField>
  </Expandable>
</ParamField>

### type()

Type text into the page (dispatches keyboard events).

```typescript
await page.type(text: string, options?: TypeOptions): Promise<void>
```

<ParamField path="text" type="string" required>
  The text to type.
</ParamField>

<ParamField path="options" type="object" optional>
  Optional typing configuration.

  <Expandable title="properties">
    <ParamField path="delay" type="number">
      Delay between key presses in milliseconds.
    </ParamField>

    <ParamField path="withMistakes" type="boolean">
      Simulates typing with occasional mistakes and corrections.

      Default: `false`
    </ParamField>
  </Expandable>
</ParamField>

### locator()

Create a locator for querying elements.

```typescript
page.locator(selector: string): Locator
```

<ParamField path="selector" type="string" required>
  CSS selector or XPath for the element.
</ParamField>

**Returns:** A `Locator` object for interacting with the element.

## Evaluation

### evaluate()

Evaluate JavaScript code in the page context.

```typescript
await page.evaluate<R, Arg>(
  pageFunctionOrExpression: string | ((arg: Arg) => R | Promise<R>),
  arg?: Arg
): Promise<R>
```

<ParamField path="pageFunctionOrExpression" type="string | function" required>
  JavaScript expression as a string or a function to execute in the page context.
</ParamField>

<ParamField path="arg" type="any" optional>
  Optional argument to pass to the function.
</ParamField>

**Returns:** The result of the evaluation (must be JSON-serializable).

## Initialization Scripts

### addInitScript()

Inject JavaScript that runs before any of the page's scripts on every navigation.

```typescript
await page.addInitScript<Arg>(
  script: string | { path?: string; content?: string } | ((arg: Arg) => unknown),
  arg?: Arg,
): Promise<void>
```

<ParamField
  path="script"
  type="string | { path?: string; content?: string } | (arg: Arg) => unknown"
  required
>
  Provide the script to inject. Pass raw source, reference a preload file on disk,
  or supply a function that Stagehand serializes before sending to the browser.
</ParamField>

<ParamField path="arg" type="Arg" optional>
  Extra data that is JSON-serialized and passed to your function. Only supported
  when `script` is a function.
</ParamField>

This method:
- Runs at document start for the current page (including adopted iframe sessions) on every navigation
- Reinstalls the script for all future navigations of this page without affecting other pages
- Mirrors Playwright's `page.addInitScript()` ordering semantics; use [`context.addInitScript()`](/v3/references/context#addinitscript) to target every page in the context

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({ env: "LOCAL" });
await stagehand.init();
const context = stagehand.context;
const page = await context.awaitActivePage();

await page.addInitScript(() => {
  window.Math.random = () => 42;
});

await page.goto("https://example.com", { waitUntil: "load" });

const result = await page.evaluate(() => Math.random());
console.log("Math.random() returned:", result);

// Math.random() returned: 42
```

## HTTP Headers

### setExtraHTTPHeaders()

Set HTTP headers that will be included in every request made by this page.

```typescript
await page.setExtraHTTPHeaders(headers: Record<string, string>): Promise<void>
```

<ParamField path="headers" type="Record<string, string>" required>
  A plain object of header name–value pairs. All values must be strings.
</ParamField>

This method:
- Applies the headers to the page's main CDP session and all of its child sessions (e.g. out-of-process iframes)
- Automatically applies the same headers to any child sessions adopted after calling `setExtraHTTPHeaders()`
- Calling it again replaces all previously set extra headers (it does not merge)
- To clear all extra headers, pass an empty object: `await page.setExtraHTTPHeaders({})`

<Note>
Headers set via `page.setExtraHTTPHeaders()` are page-scoped. They apply to every network request from this page only, including navigation requests, XHR/fetch calls, and subresource loads. Use [`context.setExtraHTTPHeaders()`](/v3/references/context#setextrahttpheaders) to set headers across all pages in the context.
</Note>

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({ env: "LOCAL" });
await stagehand.init();
const page = stagehand.context.pages()[0];

// Set custom headers for all requests from this page
await page.setExtraHTTPHeaders({
  "X-Custom-Token": "my-secret-token",
  "Accept-Language": "en-US",
});

// All subsequent requests from this page will include these headers
await page.goto("https://example.com");
```

## Screenshot

### screenshot()

Capture a screenshot of the page.

```typescript
await page.screenshot(options?: ScreenshotOptions): Promise<Buffer>
```

<ParamField path="fullPage" type="boolean" optional>
  Capture the entire scrollable page instead of just the current viewport.

  **Default:** `false`
</ParamField>

<ParamField path="clip" type="ScreenshotClip" optional>
  Limit the capture to the provided rectangle in CSS pixels (`{ x, y, width, height }`).
  Cannot be combined with `fullPage`.
</ParamField>

<ParamField path="type" type="'png' | 'jpeg'" optional>
  Image format for the screenshot.

  **Default:** `"png"`
</ParamField>

<ParamField path="quality" type="number" optional>
  JPEG quality (0–100). Only used when `type` is `"jpeg"`.
</ParamField>

<ParamField path="scale" type="'css' | 'device'" optional>
  Rendering scale. Use `"css"` for one pixel per CSS pixel, or `"device"` for the
  device pixel ratio.

  **Default:** `"device"`
</ParamField>

<ParamField path="animations" type="'allow' | 'disabled'" optional>
  Control CSS/Web animations and transitions. `"disabled"` fast-forwards finite
  animations and pauses infinite ones before capture.

  **Default:** `"allow"`
</ParamField>

<ParamField path="caret" type="'hide' | 'initial'" optional>
  Hide the text caret during capture (`"hide"`) or leave it untouched (`"initial"`).

  **Default:** `"hide"`
</ParamField>

<ParamField path="mask" type="Locator[]" optional>
  List of locators to cover with a colored overlay while the screenshot is taken.
</ParamField>

<ParamField path="maskColor" type="string" optional>
  CSS color to use for masked overlays.

  **Default:** `#FF00FF`
</ParamField>

<ParamField path="style" type="string" optional>
  Additional CSS text injected into every frame just before capture. Useful for
  hiding or tweaking dynamic UI.
</ParamField>

<ParamField path="omitBackground" type="boolean" optional>
  Make the default page background transparent (PNG only).

  **Default:** `false`
</ParamField>

<ParamField path="timeout" type="number" optional>
  Maximum time in milliseconds to wait for the capture before throwing.
</ParamField>

<ParamField path="path" type="string" optional>
  Write the screenshot to the provided file path. The image is still returned as
  a buffer.
</ParamField>

**Returns:** A `Promise<Buffer>` containing the screenshot image data.

## Page Snapshot

### snapshot()

Capture a structured accessibility snapshot of the current page. The returned data combines a human-readable accessibility tree with lookup maps so you can relate each node to DOM selectors or URLs.

```typescript
await page.snapshot(options?: PageSnapshotOptions): Promise<SnapshotResult>
```

<ParamField path="options" type="PageSnapshotOptions" optional>
  Optional configuration for the snapshot.

  <Expandable title="properties">
    <ParamField path="includeIframes" type="boolean">
      Whether to include iframe content in the snapshot.

      **Default:** `true`
    </ParamField>
  </Expandable>
</ParamField>

**Returns:** A `Promise<SnapshotResult>` describing the captured accessibility tree.

<Expandable title="SnapshotResult properties">
  <ParamField path="formattedTree" type="string">
    Multiline text representing the accessibility tree hierarchy with encoded IDs.
  </ParamField>
  <ParamField path="xpathMap" type="Record<string, string>">
    Maps each encoded ID to the element's absolute XPath for quick DOM lookups.
  </ParamField>
  <ParamField path="urlMap" type="Record<string, string>">
    Maps encoded IDs for link-like nodes to their resolved URLs.
  </ParamField>
</Expandable>

See [SnapshotResult](#snapshotresult) for the static type definition.

The formatted tree represents every accessibility node with:
- A unique encoded ID in brackets (e.g., `[0-1]`) for cross-referencing with the maps
- The node's accessibility role (`RootWebArea`, `heading`, `link`, `button`, etc.)
- The node's accessible name, when available

**Example formatted output:**

```txt
[0-1] RootWebArea: Example Domain
  [0-3] heading: Example Domain
  [0-5] paragraph: This domain is for use in illustrative examples in documents.
  [0-8] link: More information...
```

**Example usage:**

```typescript
const page = stagehand.context.pages()[0];
await page.goto("https://example.com");

const { formattedTree, xpathMap, urlMap } = await page.snapshot();

// Print the accessibility tree
console.log(formattedTree);

// Look up a specific element's XPath by encoded ID
const linkId = "0-8";
console.log(xpathMap[linkId]); // e.g., "/html/body/div/p[2]/a"

// Resolve a link's URL via the urlMap
console.log(urlMap[linkId]); // e.g., "https://www.iana.org/domains/example"

// Exclude iframe content when you only need the main document
const mainDocumentSnapshot = await page.snapshot({ includeIframes: false });
```

## Viewport

### setViewportSize()

Set the page viewport size.

```typescript
await page.setViewportSize(
  width: number,
  height: number,
  options?: ViewportOptions
): Promise<void>
```

<ParamField path="width" type="number" required>
  Viewport width in CSS pixels.
</ParamField>

<ParamField path="height" type="number" required>
  Viewport height in CSS pixels.
</ParamField>

<ParamField path="deviceScaleFactor" type="number" optional>
  Device scale factor (pixel ratio). Passed as a property of the `options` object, e.g. `{ deviceScaleFactor: 2 }`.

  **Default:** `1`
</ParamField>

## Wait Methods

### waitForLoadState()

Wait for the page to reach a specific lifecycle state.

```typescript
await page.waitForLoadState(state: LoadState, timeoutMs?: number): Promise<void>
```

<ParamField path="state" type="LoadState" required>
  The lifecycle state to wait for.

  **Options:** `"load"`, `"domcontentloaded"`, `"networkidle"`
</ParamField>

<ParamField path="timeoutMs" type="number" optional>
  Maximum time to wait in milliseconds.

  **Default:** `15000`
</ParamField>

### waitForSelector()

Wait for an element matching the selector to reach a specific state in the DOM. Uses a MutationObserver for efficiency, pierces shadow DOM by default, and supports iframe hops when needed.

```typescript
await page.waitForSelector(
  selector: string,
  options?: {
    state?: "attached" | "detached" | "visible" | "hidden";
    timeout?: number;
    pierceShadow?: boolean;
  }
): Promise<boolean>
```

<ParamField path="selector" type="string" required>
  CSS selector or XPath expression to wait for. Supports iframe hops (e.g., `/html/div/iframe/html/div/button`).
</ParamField>

<ParamField path="options" type="object" optional>
  Optional wait configuration.

  <Expandable title="properties">
    <ParamField path="state" type="'attached' | 'detached' | 'visible' | 'hidden'">
      Element state to wait for.

      **Options:**
      - `"attached"` - Element is present in DOM (even if hidden)
      - `"detached"` - Element is removed from DOM
      - `"visible"` - Element is visible
      - `"hidden"` - Element is hidden

      **Default:** `"visible"`
    </ParamField>

    <ParamField path="timeout" type="number">
      Maximum time to wait in milliseconds before timing out.

      **Default:** `30000`
    </ParamField>

    <ParamField path="pierceShadow" type="boolean">
      Whether to search inside open and closed shadow DOM boundaries.

      **Default:** `true`
    </ParamField>
  </Expandable>
</ParamField>

**Returns:** `true` when the condition is met.

**Throws:** Error if timeout is reached before the condition is met.

## Events

### on("console")

Listen for console output produced by the page and any adopted iframe sessions. Returns the page instance so calls can be chained.

```typescript
import type { ConsoleMessage } from "@browserbasehq/stagehand";

const handleConsole = (message: ConsoleMessage) => {
  console.log(`[${message.type()}] ${message.text()}`);
  console.log("Arguments:", message.args());
  const location = message.location();
  if (location?.url) {
    console.log(`Emitted from ${location.url}:${location.lineNumber ?? 0}`);
  }
};

page.on("console", handleConsole);
```

`ConsoleMessage` exposes helpers for working with console events:

- `message.type()` – console API category such as `log`, `error`, or `warning`
- `message.text()` – string representation of the console arguments
- `message.args()` – underlying CDP `RemoteObject` arguments array
- `message.location()` – source URL, line, and column when available
- `message.timestamp()` – CDP timestamp for the event
- `message.raw()` – access to the original `Runtime.consoleAPICalledEvent`

### once("console")

Register a listener that removes itself after the first console event.

```typescript
page.once("console", (message) => {
  console.log("First console message:", message.text());
});
```

### off("console")

Remove a previously registered listener. The reference must match the original listener passed to `on()`.

```typescript
page.off("console", handleConsole);
```

## Code Examples

<Tabs>
<Tab title="Basic Navigation">

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

// Initialize with Browserbase (API key and project ID from environment variables)
// Set BROWSERBASE_API_KEY and BROWSERBASE_PROJECT_ID in your environment
const stagehand = new Stagehand({ env: "BROWSERBASE" });
await stagehand.init();
const page = stagehand.context.pages()[0];

// Navigate to a URL
await page.goto("https://example.com");

// Get current URL and title
console.log("URL:", page.url());
console.log("Title:", await page.title());

// Navigate back and forward
await page.goBack();
await page.goForward();

// Reload the page
await page.reload();
```

</Tab>
<Tab title="Screenshots">

```typescript
// Capture viewport screenshot
const screenshot = await page.screenshot();
await fs.writeFile("screenshot.png", screenshot);

// Capture full page screenshot
const fullPage = await page.screenshot({ fullPage: true });
await fs.writeFile("fullpage.png", fullPage);

// Capture JPEG with styling overrides and a masked element
const styled = await page.screenshot({
  type: "jpeg",
  quality: 80,
  style: "body { filter: grayscale(1); }",
  mask: [page.locator(".ads-banner")],
  maskColor: "rgba(0, 0, 0, 0.3)",
});
await fs.writeFile("styled.jpg", styled);
```

</Tab>
<Tab title="JavaScript Evaluation">

```typescript
// Execute JavaScript expression
const pageHeight = await page.evaluate("document.body.scrollHeight");
console.log("Page height:", pageHeight);

// Execute function with arguments
const result = await page.evaluate((selector) => {
  const element = document.querySelector(selector);
  return element ? element.textContent : null;
}, "h1");
console.log("H1 text:", result);

// Async function evaluation
const data = await page.evaluate(async () => {
  const response = await fetch("/api/data");
  return response.json();
});
```

</Tab>
<Tab title="Interaction">

```typescript
// Click at coordinates
await page.click(100, 200);

// Double click
await page.click(100, 200, { clickCount: 2 });

// Click and get the XPath of the clicked element
const xpath = await page.click(100, 200, { returnXpath: true });
console.log("Clicked element xpath:", xpath); // e.g., "/html/body/div[1]/button"

// Hover at coordinates
await page.hover(300, 150);

// Hover and get the XPath of the hovered element
const hoverXpath = await page.hover(300, 150, { returnXpath: true });

// Scroll down at a position
await page.scroll(400, 300, 0, 200); // scroll down 200px

// Drag and drop between two points
const [fromXpath, toXpath] = await page.dragAndDrop(100, 100, 300, 300, { returnXpath: true });

// Type text
await page.type("Hello, World!");

// Type with delay between keystrokes
await page.type("Slow typing", { delay: 100 });

// Use locator for element interaction
const button = page.locator("button.submit");
await button.click();
```

</Tab>
<Tab title="Wait for Load">

```typescript
// Navigate and wait for full load
await page.goto("https://example.com", {
  waitUntil: "load",
  timeoutMs: 30000
});

// Wait for network idle after navigation
await page.goto("https://spa-app.com", {
  waitUntil: "networkidle"
});

// Wait for specific load state
await page.waitForLoadState("domcontentloaded");
```

</Tab>
<Tab title="Wait for Selector">

```typescript
// Wait for element to be visible (default)
await page.waitForSelector("#submit-btn");

// Wait for element to appear with custom timeout
await page.waitForSelector(".loading-spinner", {
  state: "visible",
  timeout: 10000
});

// Wait for element to be removed from DOM
await page.waitForSelector(".loading-spinner", {
  state: "detached"
});

// Wait for element to become hidden
await page.waitForSelector(".modal", {
  state: "hidden"
});

// Wait for element inside an iframe
await page.waitForSelector("iframe#checkout >> .pay-button");

// Wait for element in shadow DOM (enabled by default)
await page.waitForSelector("#shadow-button", {
  pierceShadow: true
});

// Wait for element with XPath
await page.waitForSelector("/html/div/button");
```

</Tab>
<Tab title="Viewport">

```typescript
// Set viewport size
await page.setViewportSize(1920, 1080);

// Set mobile viewport with device scale
await page.setViewportSize(375, 667, {
  deviceScaleFactor: 2
});

// Then take a screenshot at this size
const screenshot = await page.screenshot();
```

</Tab>
<Tab title="Custom HTTP Headers">

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({ env: "LOCAL" });
await stagehand.init();
const page = stagehand.context.pages()[0];

// Set authorization headers for requests from this page
await page.setExtraHTTPHeaders({
  Authorization: "Bearer my-api-token",
});

// Navigate — the headers are sent with every request from this page
await page.goto("https://api.example.com/dashboard");

// Replace headers (previous headers are removed)
await page.setExtraHTTPHeaders({
  Authorization: "Bearer refreshed-token",
  "X-Request-Id": "abc-123",
});

// Clear all extra headers
await page.setExtraHTTPHeaders({});

await stagehand.close();
```

</Tab>
<Tab title="Snapshot">

```typescript
// Capture the page's accessibility tree snapshot
const { formattedTree, xpathMap, urlMap } = await page.snapshot();

// The formattedTree shows the page structure:
// [0-1] RootWebArea: Example Domain
//   [0-3] heading: Example Domain
//   [0-8] link: More information...

console.log(formattedTree);

// Use xpathMap to get the XPath selector for any element by ID
const linkXpath = xpathMap["0-8"];
console.log("Link XPath:", linkXpath); // "/html/body/div/p[2]/a"

// Use urlMap to get URLs associated with link elements
const linkUrl = urlMap["0-8"];
console.log("Link URL:", linkUrl); // "https://www.iana.org/domains/example"

// Exclude iframe content from the snapshot
const mainPageOnly = await page.snapshot({ includeIframes: false });
```

</Tab>
</Tabs>

## Types

### LoadState

```typescript
type LoadState = "load" | "domcontentloaded" | "networkidle";
```

- **`"load"`** - Wait for the `load` event (all resources loaded)
- **`"domcontentloaded"`** - Wait for the `DOMContentLoaded` event (DOM is ready)
- **`"networkidle"`** - Wait for network connections to be idle

### AnyPage

```typescript
type AnyPage = PlaywrightPage | PuppeteerPage | PatchrightPage | Page;
```

Stagehand supports multiple browser automation libraries. The `AnyPage` type represents any compatible page object.

### ScreenshotClip

```typescript
interface ScreenshotClip {
  x: number;
  y: number;
  width: number;
  height: number;
}
```

Represents the CSS-pixel rectangle to capture when `clip` is provided.

### ScreenshotOptions

```typescript
interface ScreenshotOptions {
  fullPage?: boolean;
  clip?: ScreenshotClip;
  type?: "png" | "jpeg";
  quality?: number;
  scale?: "css" | "device";
  animations?: "allow" | "disabled";
  caret?: "hide" | "initial";
  mask?: Locator[];
  maskColor?: string;
  style?: string;
  omitBackground?: boolean;
  timeout?: number;
  path?: string;
}
```

Matches Playwright's screenshot signature with sensible defaults to control how a
capture is produced.

### PageSnapshotOptions

```typescript
type PageSnapshotOptions = {
  includeIframes?: boolean;
};
```

- **`includeIframes`** - Whether to include iframe content in the snapshot. Defaults to `true`

### SnapshotResult

```typescript
type SnapshotResult = {
  formattedTree: string;
  xpathMap: Record<string, string>;
  urlMap: Record<string, string>;
};
```

- **`formattedTree`** - A formatted string representation of the page's accessibility tree with encoded IDs, roles, and names
- **`xpathMap`** - A mapping from encoded element IDs to their absolute XPath selectors
- **`urlMap`** - A mapping from encoded element IDs to their associated URLs (for links and other navigable elements)

## Error Handling

Page methods may throw the following errors:

- **Navigation Errors** - Timeout or network issues during navigation
- **Evaluation Errors** - JavaScript execution errors in `evaluate()`
- **Interaction Errors** - Failed clicks or typing operations
- **Screenshot Errors** - Issues capturing screenshots

All errors should be caught and handled appropriately:

```typescript
try {
  await page.goto("https://example.com");
} catch (error) {
  console.error("Navigation failed:", error instanceof Error ? error.message : error);
}
```


================================================
FILE: packages/docs/v3/references/response.mdx
================================================
---
title: Response
description: 'Complete API reference for the Response object'
icon: 'reply'
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


<CardGroup cols={1}>
<Card title="Navigation" icon="compass" href="/v3/references/page">
  See how pages expose Response objects from navigation methods
</Card>
</CardGroup>

## Overview

`Response` mirrors Playwright’s [Response](https://playwright.dev/docs/api/class-response) interface and is returned from Stagehand navigation helpers such as `page.goto()`, `page.reload()`, `page.goBack()`, and `page.goForward()`. It provides a convenient way to inspect the HTTP metadata associated with a navigation, retrieve the response body on demand, and monitor when the underlying request finishes.

Stagehand automatically returns `null` for navigations that do not yield a network request (for example `data:` URLs, `about:blank`, or same-document history changes), matching Playwright’s behaviour.

## Getting a Response

```typescript
const response = await page.goto("https://example.com", {
  waitUntil: "networkidle",
});

if (!response) {
  throw new Error("Navigation did not produce a network response");
}

console.log("Status", response.status(), response.statusText());
const body = await response.text();
```

When a navigation does not produce a response object you will receive `null`, allowing you to branch early:

```typescript
const inline = await page.goto("data:text/html,<h1>inline</h1>");
if (inline === null) {
  // No network fetch happened; handle accordingly
}
```

## Status & Metadata

### url()

```typescript
response.url(): string
```

Returns the final URL associated with the navigation request.

### status()

```typescript
response.status(): number
```

Returns the HTTP status code.

### statusText()

```typescript
response.statusText(): string
```

Returns the human-readable status text (for example `OK`).

### ok()

```typescript
response.ok(): boolean
```

Convenience helper that returns `true` for 2xx responses and `false` otherwise.

### frame()

```typescript
response.frame(): Frame | null
```

Returns the Stagehand `Frame` that initiated the navigation. When the frame is no longer available, `null` is returned.

### fromServiceWorker()

```typescript
response.fromServiceWorker(): boolean
```

Indicates whether the response was served from a Service Worker fetch handler.

### securityDetails()

```typescript
await response.securityDetails(): Promise<Protocol.Network.SecurityDetails | null>
```

Resolves with TLS/security metadata when available (issuer, protocol, validity window). Returns `null` for insecure or non-network responses.

### serverAddr()

```typescript
await response.serverAddr(): Promise<{ ipAddress: string; port: number } | null>
```

Resolves with the remote IP address and port reported by Chrome, or `null` when they are not known.

## Header Helpers

### headers()

```typescript
response.headers(): Record<string, string>
```

Returns a map of the response headers with all header names lowercased, matching Playwright’s `headers()` behaviour.

### allHeaders()

```typescript
await response.allHeaders(): Promise<Record<string, string>>
```

Includes additional headers only surfaced via Chrome’s `responseReceivedExtraInfo` event (such as `set-cookie`).

### headerValue()

```typescript
await response.headerValue(name: string): Promise<string | null>
```

Returns a comma-joined string of all values for the specified header. Resolves to `null` when the header is absent.

### headerValues()

```typescript
await response.headerValues(name: string): Promise<string[]>
```

Returns an array of header values, keeping multiple entries separate.

### headersArray()

```typescript
await response.headersArray(): Promise<Array<{ name: string; value: string }>>
```

Returns the header list while preserving the original casing and order reported by the browser.

## Body Helpers

### body()

```typescript
await response.body(): Promise<Buffer>
```

Fetches the raw response body. The buffer is base64-decoded for you when Chrome sends it that way.

### text()

```typescript
await response.text(): Promise<string>
```

Returns the response body decoded as UTF-8 text.

### json()

```typescript
await response.json<T = unknown>(): Promise<T>
```

Parses the response body as JSON. Throws if the body is not valid JSON.

<Note>
All body helper calls (`body()`, `text()`, `json()`) only succeed once the browser reports the response body is available. Stagehand handles this timing automatically.
</Note>

## Completion

### finished()

```typescript
await response.finished(): Promise<null | Error>
```

Resolves to `null` when the main navigation request completes successfully, or to an `Error` if Chrome reports `Network.loadingFailed`. This mirrors Playwright’s `response.finished()` contract and is especially helpful for catching late failures such as network resets or blocked responses.

```typescript
const result = await response.finished();
if (result instanceof Error) {
  console.error("Navigation failed", result.message);
}
```

## Usage Patterns

### Inspect status and headers

```typescript
const response = await page.goto("https://httpbin.org/headers");

if (response) {
  console.log(response.status(), response.statusText());
  const headers = await response.headersArray();
  headers.forEach(({ name, value }) => {
    console.log(`${name}: ${value}`);
  });
}
```

### Handle non-network navigations

```typescript
const result = await page.goto("data:text/html,<p>inline</p>");

if (result === null) {
  console.log("No network response (data URL)");
} else {
  // Process as usual
}
```

### Await completion

```typescript
const response = await page.goto("https://example.com/slow");

if (response) {
  const finished = await response.finished();
  if (finished instanceof Error) {
    console.error("Navigation failed", finished.message);
  }
}
```

## Returned From

- `await page.goto(url, options?)`
- `await page.reload(options?)`
- `await page.goBack(options?)`
- `await page.goForward(options?)`

Each method resolves with `Response | null` depending on whether Chrome reported a document-level network response.

## See Also

- [Page reference](/v3/references/page) for details on navigation helpers


================================================
FILE: packages/docs/v3/references/stagehand.mdx
================================================
---
title: Stagehand
description: 'Complete API reference for the Stagehand class'
icon: 'hand-horns'
---
import { V3Banner } from '/snippets/v3-banner.mdx';

<V3Banner />


<CardGroup cols={1}>
<Card title="Getting Started" icon="rocket" href="/v3/first-steps/quickstart">
  The fastest way to start using Stagehand
</Card>
</CardGroup>

## Overview

The `Stagehand` class is the main entry point for Stagehand v3. It manages browser lifecycle, provides AI-powered automation methods, and handles both local and remote browser environments.

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand(options);
await stagehand.init();
```

## Constructor

### new Stagehand()

Create a new Stagehand instance.

```typescript
const stagehand = new Stagehand(options: V3Options);
```

**V3Options Interface:**
```typescript
interface V3Options {
  env: "LOCAL" | "BROWSERBASE";

  // Browserbase options (required when env = "BROWSERBASE")
  apiKey?: string;
  projectId?: string;
  browserbaseSessionID?: string;
  browserbaseSessionCreateParams?: Browserbase.Sessions.SessionCreateParams;

  // Local browser options
  localBrowserLaunchOptions?: LocalBrowserLaunchOptions;

  // AI/LLM configuration
  model?: ModelConfiguration;
  llmClient?: LLMClient;
  systemPrompt?: string;

  // Behavior options
  selfHeal?: boolean;
  experimental?: boolean;
  domSettleTimeout?: number;
  cacheDir?: string;
  keepAlive?: boolean;
  serverCache?: boolean;

  // Logging options
  verbose?: 0 | 1 | 2;
  logInferenceToFile?: boolean;
  disablePino?: boolean;
  logger?: (line: LogLine) => void;
}
```

### Configuration Parameters

<ParamField path="env" type='"LOCAL" | "BROWSERBASE"' required>
  Environment to run the browser in.

  - **`"LOCAL"`** - Run browser locally using Chrome/Chromium
  - **`"BROWSERBASE"`** - Run browser on Browserbase cloud platform
</ParamField>

#### Browserbase Options

<ParamField path="apiKey" type="string" optional>
  Browserbase API key. Required when `env` is `"BROWSERBASE"`.

  Can also be set via `BROWSERBASE_API_KEY` environment variable.
</ParamField>

<ParamField path="projectId" type="string" optional>
  Browserbase project ID. Required when `env` is `"BROWSERBASE"`.

  Can also be set via `BROWSERBASE_PROJECT_ID` environment variable.
</ParamField>

<ParamField path="browserbaseSessionID" type="string" optional>
  Resume an existing Browserbase session by ID instead of creating a new one.
</ParamField>

<ParamField path="browserbaseSessionCreateParams" type="object" optional>
  Additional parameters for Browserbase session creation. See [Browserbase documentation](https://docs.browserbase.com) for details.
</ParamField>

#### Local Browser Options

<ParamField path="localBrowserLaunchOptions" type="LocalBrowserLaunchOptions" optional>
  Configuration for local Chrome/Chromium browser.

  <Expandable title="LocalBrowserLaunchOptions">
    <ParamField path="headless" type="boolean" optional>
      Run browser in headless mode.

      **Default:** `true`
    </ParamField>

    <ParamField path="executablePath" type="string" optional>
      Path to Chrome/Chromium executable.
    </ParamField>

    <ParamField path="port" type="number" optional>
      Fixed Chrome DevTools Protocol (CDP) debugging port for external tool connections.

      **Default:** Randomly assigned
    </ParamField>

    <ParamField path="args" type="string[]" optional>
      Additional Chrome launch arguments.
    </ParamField>

    <ParamField path="userDataDir" type="string" optional>
      Path to user data directory for browser profile.
    </ParamField>

    <ParamField path="viewport" type="{ width: number; height: number }" optional>
      Default viewport size.
    </ParamField>

    <ParamField path="devtools" type="boolean" optional>
      Auto-open DevTools for each tab.

      **Default:** `false`
    </ParamField>

    <ParamField path="proxy" type="object" optional>
      Proxy configuration.

      **Properties:** `server`, `bypass`, `username`, `password`
    </ParamField>

    <ParamField path="ignoreHTTPSErrors" type="boolean" optional>
      Ignore HTTPS certificate errors.

      **Default:** `false`
    </ParamField>

    <ParamField path="cdpUrl" type="string" optional>
      Attach to existing Chrome instance via CDP WebSocket URL.
    </ParamField>
  </Expandable>
</ParamField>

#### AI/LLM Configuration

<ParamField path="model" type="ModelConfiguration" optional>
  Configure the AI model to use for automation. Can be either:
  - A string in the format `"provider/model"` (e.g., `"openai/gpt-4o"`, `"anthropic/claude-sonnet-4-6"`)
  - An object with detailed configuration

  <Expandable title="Model Configuration Object">
    <ParamField path="modelName" type="string" required>
      The model name (e.g., "gpt-4o", "claude-sonnet-4-6", "gemini-2.5-flash")
    </ParamField>
    <ParamField path="apiKey" type="string" optional>
      API key for the model provider (overrides environment variables)
    </ParamField>
    <ParamField path="baseURL" type="string" optional>
      Base URL for the API endpoint (for custom endpoints or proxies)
    </ParamField>
  </Expandable>
</ParamField>

<ParamField path="llmClient" type="LLMClient" optional>
  Provide a custom LLM client implementation instead of using the default.
</ParamField>

<ParamField path="systemPrompt" type="string" optional>
  Custom system prompt to guide AI behavior across all operations.
</ParamField>

#### Behavior Options

<ParamField path="selfHeal" type="boolean" optional>
  Enable self-healing mode where actions can recover from failures.

  **Default:** `true`
</ParamField>

<ParamField path="experimental" type="boolean" optional>
  Enable experimental features (may change between versions).

  **Default:** `false`
  <Warning>**Use with caution in production**. Experimental features may break or change between versions without notice.</Warning>

</ParamField>

<ParamField path="domSettleTimeout" type="number" optional>
  Default timeout for waiting for DOM to stabilize (in milliseconds).

  **Default:** `30000`
</ParamField>

<ParamField path="cacheDir" type="string" optional>
  Directory path for caching action observations to improve performance.
</ParamField>

<ParamField path="keepAlive" type="boolean" optional>
  Controls whether the browser remains running after `stagehand.close()` is called or the parent process exits unexpectedly.

  - **`true`** - Browser continues running independently. On Browserbase, the session stays active. Locally, the Chrome process is kept alive.
  - **`false`** - Browser is terminated and resources are cleaned up on close or crash.

  When set, this overrides any value in `browserbaseSessionCreateParams.keepAlive`.

  **Default:** `false`
</ParamField>

<ParamField path="serverCache" type="boolean" optional>
  Enable or disable server-side caching for `act()`, `extract()`, and `observe()` requests. When enabled, repeated calls with the same inputs return instantly without consuming LLM tokens.

  <Note>Only applies when `env` is `"BROWSERBASE"`. Has no effect in local environments.</Note>

  Can be overridden per-call via the `serverCache` option on `act()`, `extract()`, and `observe()`.

  **Default:** `true`
</ParamField>

#### Logging Options

<ParamField path="verbose" type="0 | 1 | 2" optional>
  Logging verbosity level.

  - **`0`** - Minimal logging
  - **`1`** - Standard logging (default)
  - **`2`** - Detailed debug logging

  **Default:** `1`
</ParamField>

<ParamField path="logInferenceToFile" type="boolean" optional>
  Log AI inference details to files for debugging.

  **Default:** `false`
</ParamField>

<ParamField path="disablePino" type="boolean" optional>
  Disable the Pino logging backend (useful for custom logging integrations).

  **Default:** `false`
</ParamField>

<ParamField path="logger" type="(line: LogLine) => void" optional>
  Custom logger function to receive log events.
</ParamField>

## Methods

### init()

Initialize the Stagehand instance and launch the browser.

```typescript
await stagehand.init(): Promise<void>
```

**Must be called before using any other methods.**

### close()

Close the browser and clean up resources.

```typescript
await stagehand.close(options?: { force?: boolean }): Promise<void>
```

<ParamField path="force" type="boolean" optional>
  Force close even if already closing.

  **Default:** `false`
</ParamField>

<Note>
When `keepAlive` is `true`, calling `close()` disconnects Stagehand from the browser without terminating it. The browser session continues running independently and can be reconnected to later using `browserbaseSessionID`. When `keepAlive` is `false` (the default), `close()` fully terminates the browser and cleans up all resources.
</Note>

### agent()

Create an AI agent instance for autonomous multi-step workflows.

```typescript
stagehand.agent(config?: AgentConfig): AgentInstance
```

See the [agent() reference](/v3/references/agent) for detailed documentation.

## Properties

### page

Access pages for browser automation. Pages are accessed through the context.

```typescript
// Get the first page (created automatically on init)
const page = stagehand.context.pages()[0];

// Or get the active page
const activePage = stagehand.context.activePage();

// Create a new page
const newPage = await stagehand.context.newPage();
```

**Type:** [`Page`](/v3/references/page)

The page object provides methods for:
- Navigation (`goto()`, `reload()`, `goBack()`, `goForward()`)
- Interaction (`click()`, `type()`, `keyPress()`, `locator()`, `deepLocator()`)
- Inspection (`url()`, `title()`, `screenshot()`)
- JavaScript evaluation (`evaluate()`)

<Note>
**Important:** AI-powered methods ([`act()`](/v3/references/act), [`extract()`](/v3/references/extract), [`observe()`](/v3/references/observe)) are called on the stagehand instance, not on the page object.
</Note>

### context

Access the browser context for managing multiple pages.

```typescript
const context = stagehand.context;
```

**Type:** `V3Context`

The context object provides:
- `newPage()` - Create a new page/tab
- `pages()` - Get all open pages
- `setActivePage(page)` - Switch active page

### metrics

Get usage metrics for AI operations.

```typescript
const metrics = await stagehand.metrics;
```

**Returns:** `Promise<StagehandMetrics>`

**StagehandMetrics Interface:**
```typescript
interface StagehandMetrics {
  // Act metrics
  actPromptTokens: number;
  actCompletionTokens: number;
  actReasoningTokens: number;
  actCachedInputTokens: number;
  actInferenceTimeMs: number;

  // Extract metrics
  extractPromptTokens: number;
  extractCompletionTokens: number;
  extractReasoningTokens: number;
  extractCachedInputTokens: number;
  extractInferenceTimeMs: number;

  // Observe metrics
  observePromptTokens: number;
  observeCompletionTokens: number;
  observeReasoningTokens: number;
  observeCachedInputTokens: number;
  observeInferenceTimeMs: number;

  // Agent metrics
  agentPromptTokens: number;
  agentCompletionTokens: number;
  agentReasoningTokens: number;
  agentCachedInputTokens: number;
  agentInferenceTimeMs: number;

  // Totals
  totalPromptTokens: number;
  totalCompletionTokens: number;
  totalReasoningTokens: number;
  totalCachedInputTokens: number;
  totalInferenceTimeMs: number;
}
```

### history

Get the history of all operations performed.

```typescript
const history = await stagehand.history;
```

**Returns:** `Promise<ReadonlyArray<HistoryEntry>>`

**HistoryEntry Interface:**
```typescript
interface HistoryEntry {
  method: "act" | "extract" | "observe" | "navigate";
  parameters: unknown;
  result: unknown;
  timestamp: string;
}
```

### browserbaseSessionID

Browserbase session identifier for the active Browserbase run.

```typescript
const sessionId = stagehand.browserbaseSessionID;
```

**Type:** `string | undefined` — undefined for LOCAL runs or before `init()`.

### browserbaseSessionURL

Shareable link to the active Browserbase session dashboard.

```typescript
const sessionUrl = stagehand.browserbaseSessionURL;
```

**Type:** `string | undefined` — undefined until a Browserbase session is active.

### browserbaseDebugURL

Debugger URL returned by Browserbase for direct CDP inspection.

```typescript
const debugUrl = stagehand.browserbaseDebugURL;
```

**Type:** `string | undefined` — undefined for LOCAL runs or if Browserbase doesn’t provide one.

## Code Examples

<Tabs>
<Tab title="Browserbase">

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

// Remote browser on Browserbase
const stagehand = new Stagehand({
  env: "BROWSERBASE",
  apiKey: process.env.BROWSERBASE_API_KEY,
  projectId: process.env.BROWSERBASE_PROJECT_ID,
  model: "anthropic/claude-sonnet-4-6"
});

await stagehand.init();
const page = stagehand.context.pages()[0];

await page.goto("https://example.com");
const data = await stagehand.extract("get page title", z.object({
  title: z.string()
}));

await stagehand.close();
```

</Tab>
<Tab title="Local">

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

// Local browser
const stagehand = new Stagehand({
  env: "LOCAL",
  model: "openai/gpt-4o"
});

await stagehand.init();
const page = stagehand.context.pages()[0];

// Use the page
await page.goto("https://example.com");
await stagehand.act("click the login button");

// Cleanup
await stagehand.close();
```

</Tab>
<Tab title="Custom Model Config">

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "LOCAL",
  model: {
    modelName: "gpt-4o",
    apiKey: process.env.OPENAI_API_KEY,
    baseURL: "https://custom-proxy.com/v1"
  },
  systemPrompt: "You are a helpful automation assistant.",
  verbose: 2,
  selfHeal: true
});

await stagehand.init();
```

</Tab>
<Tab title="Multi-Page">

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({ env: "LOCAL" });
await stagehand.init();

// Get the first page
const page1 = stagehand.context.pages()[0];
await page1.goto("https://example.com");

// Create second page
const page2 = await stagehand.context.newPage();
await page2.goto("https://another-site.com");

// Switch active page
stagehand.context.setActivePage(page2);

// Now context.activePage() returns page2
await stagehand.act("click the button");

await stagehand.close();
```

</Tab>
<Tab title="With Metrics">

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "LOCAL",
  model: "openai/gpt-4o"
});

await stagehand.init();
const page = stagehand.context.pages()[0];

await page.goto("https://example.com");
await stagehand.act("fill out the form");
await stagehand.extract("get form data", schema);

// Get usage metrics
const metrics = await stagehand.metrics;
console.log("Total tokens used:", metrics.totalPromptTokens + metrics.totalCompletionTokens);
console.log("Act operations:", {
  tokens: metrics.actPromptTokens + metrics.actCompletionTokens,
  time: metrics.actInferenceTimeMs
});

await stagehand.close();
```

</Tab>
<Tab title="With Custom Logger">

```typescript
import { Stagehand } from "@browserbasehq/stagehand";

const stagehand = new Stagehand({
  env: "LOCAL",
  verbose: 2,
  logger: (logLine) => {
    console.log(`[${logLine.category}] ${logLine.message}`);
    if (logLine.auxiliary) {
      console.log("Details:", logLine.auxiliary);
    }
  }
});

await stagehand.init();
// All operations will now log through your custom logger
```

</Tab>
</Tabs>

## Error Handling

Stagehand methods may throw the following errors:

- **StagehandInitError** - Failed to initialize Stagehand
- **StagehandNotInitializedError** - Methods called before `init()`
- **BrowserbaseSessionNotFoundError** - Browserbase session not found
- **MissingLLMConfigurationError** - No LLM API key or client configured
- **MissingEnvironmentVariableError** - Required environment variable not set
- **StagehandEnvironmentError** - Invalid environment configuration

Always handle errors appropriately:

```typescript
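let stagehand: Stagehand | undefined;

try {
  stagehand = new Stagehand({ env: "LOCAL" });
  await stagehand.init();
  // ... use stagehand
} catch (error) {
  console.error(
    "Stagehand error:",
    error instanceof Error ? error.message : error,
  );
} finally {
  // Declared outside the try block so it is still in scope here.
  await stagehand?.close();
}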
```

## Best Practices

1. **Always call `init()`** before using any other methods
2. **Always call `close()`** when done to clean up resources
3. **Use try-finally** to ensure cleanup even on errors
4. **Set appropriate timeouts** based on your use case
5. **Enable `selfHeal`** for more robust automation
6. **Use metrics** to monitor token usage and costs
7. **Configure custom logger** for production debugging
8. **Set `cacheDir`** to cache repeated actions, which can significantly improve performance

## Environment Variables

Stagehand recognizes the following environment variables:

- `BROWSERBASE_API_KEY` - Browserbase API key
- `BROWSERBASE_PROJECT_ID` - Browserbase project ID
- `OPENAI_API_KEY` - OpenAI API key
- `ANTHROPIC_API_KEY` - Anthropic API key
- `GOOGLE_API_KEY` - Google AI API key

These can be overridden by passing values in the constructor options.


================================================
FILE: packages/docs/v3/sdk/go.mdx
================================================
---
title: "Go SDK"
description: "Official Stagehand SDK for Go"
---

<Note>
  This documentation is automatically synced from the [Go SDK GitHub repository](https://github.com/browserbase/stagehand-go).
</Note>

## What is Stagehand?

Stagehand is a browser automation framework used to control web browsers with natural language and code. By combining the power of AI with the precision of code, Stagehand makes web automation flexible, maintainable, and actually reliable.

## Why Stagehand?

Most existing browser automation tools either require you to write low-level code in a framework like Selenium, Playwright, or Puppeteer, or use high-level agents that can be unpredictable in production. By letting developers choose what to write in code vs. natural language (and bridging the gap between the two) Stagehand is the natural choice for browser automations in production.

1. **Choose when to write code vs. natural language**: use AI when you want to navigate unfamiliar pages, and use code when you know exactly what you want to do.

2. **Go from AI-driven to repeatable workflows**: Stagehand lets you preview AI actions before running them, and also helps you easily cache repeatable actions to save time and tokens.

3. **Write once, run forever**: Stagehand's auto-caching combined with self-healing remembers previous actions, runs without LLM inference, and knows when to involve AI whenever the website changes and your automation breaks.

## Installation

```go
import (
	"github.com/browserbase/stagehand-go" // imported as stagehand
)
```

Or to pin the version:

```sh
go get -u 'github.com/browserbase/stagehand-go@v0.17.1'
```

## Requirements

This library requires Go 1.22+.

## Usage

The full API of this library can be found in [api.md](https://github.com/browserbase/stagehand-go/blob/main/api.md).

```go
package main

import (
	"context"
	"fmt"

	"github.com/browserbase/stagehand-go"
	"github.com/browserbase/stagehand-go/option"
)

func main() {
	// Create a new Stagehand client with your credentials
	client := stagehand.NewClient(
		option.WithBrowserbaseAPIKey("My Browserbase API Key"),       // defaults to os.LookupEnv("BROWSERBASE_API_KEY")
		option.WithBrowserbaseProjectID("My Browserbase Project ID"), // defaults to os.LookupEnv("BROWSERBASE_PROJECT_ID")
		option.WithModelAPIKey("My Model API Key"),                   // defaults to os.LookupEnv("MODEL_API_KEY")
	)

	// Start a new browser session
	startResponse, err := client.Sessions.Start(context.TODO(), stagehand.SessionStartParams{
		ModelName: "openai/gpt-5-nano",
	})
	if err != nil {
		panic(err.Error())
	}
	fmt.Printf("Session started: %s\n", startResponse.Data.SessionID)

	sessionID := startResponse.Data.SessionID

	// Navigate to a webpage
	_, err = client.Sessions.Navigate(
		context.TODO(),
		sessionID,
		stagehand.SessionNavigateParams{
			URL: "https://news.ycombinator.com",
		},
	)
	if err != nil {
		panic(err.Error())
	}
	fmt.Println("Navigated to Hacker News")

	// Use Observe to find possible actions on the page
	observeResponse, err := client.Sessions.Observe(
		context.TODO(),
		sessionID,
		stagehand.SessionObserveParams{
			Instruction: stagehand.String("find the link to view comments for the top post"),
		},
	)
	if err != nil {
		panic(err.Error())
	}

	actions := observeResponse.Data.Result
	fmt.Printf("Found %d possible actions\n", len(actions))

	if len(actions) == 0 {
		fmt.Println("No actions found")
		return
	}

	// Take the first action returned by Observe
	action := actions[0]
	fmt.Printf("Acting on: %s\n", action.Description)

	// Pass the structured action to Act
	// The action contains selector, description, method, and arguments
	actResponse, err := client.Sessions.Act(
		context.TODO(),
		sessionID,
		stagehand.SessionActParams{
			Input: stagehand.SessionActParamsInputUnion{
				OfAction: &stagehand.ActionParam{
					Description: action.Description,
					Selector:    action.Selector,
					Method:      stagehand.String(action.Method),
					Arguments:   action.Arguments,
				},
			},
		},
	)
	if err != nil {
		panic(err.Error())
	}
	fmt.Printf("Act completed: %s\n", actResponse.Data.Result.Message)

	// Extract structured data from the page using a JSON schema
	extractResponse, err := client.Sessions.Extract(
		context.TODO(),
		sessionID,
		stagehand.SessionExtractParams{
			Instruction: stagehand.String("extract the text of the top comment"),
			Schema: map[string]any{
				"type": "object",
				"properties": map[string]any{
					"commentText": map[string]any{
						"type":        "string",
						"description": "The text content of the top comment",
					},
					"author": map[string]any{
						"type":        "string",
						"description": "The username of the comment author",
					},
				},
			},
		},
	)
	if err != nil {
		panic(err.Error())
	}
	fmt.Printf("Extracted: %+v\n", extractResponse.Data.Result)

	// Run an autonomous agent to accomplish a goal
	// The agent can navigate, click, type, and interact with pages
	executeResponse, err := client.Sessions.Execute(
		context.TODO(),
		sessionID,
		stagehand.SessionExecuteParams{
			ExecuteOptions: stagehand.SessionExecuteParamsExecuteOptions{
				Instruction: "Find the profile page for the top commenter",
				MaxSteps:    stagehand.Float(10),
			},
			AgentConfig: stagehand.SessionExecuteParamsAgentConfig{
				// Model config with provider/model format and API key
				Model: stagehand.ModelConfigUnionParam{
					OfModelConfigModelConfigObject: &stagehand.ModelConfigModelConfigObjectParam{
						ModelName: "openai/gpt-4.1-mini",
						APIKey:    stagehand.String("sk-your-api-key"),
					},
				},
				Cua: stagehand.Bool(false),
			},
		},
	)
	if err != nil {
		panic(err.Error())
	}
	fmt.Printf("Agent result: %s\n", executeResponse.Data.Result.Message)

	// End the session to clean up resources
	_, err = client.Sessions.End(
		context.TODO(),
		sessionID,
		stagehand.SessionEndParams{},
	)
	if err != nil {
		panic(err.Error())
	}
	fmt.Println("Session ended")
}
```

### Running the example

A complete working example is available in `examples/basic.go`. To run it:

1. **Set up environment variables** by creating a `.env` file in the repository root:

```bash
BROWSERBASE_API_KEY=your_browserbase_api_key
BROWSERBASE_PROJECT_ID=your_browserbase_project_id
MODEL_API_KEY=your_openai_api_key
```

You can get your Browserbase API key and project ID from the [Browserbase dashboard](https://www.browserbase.com/).

2. **Install dependencies**:

```bash
go mod tidy
```

3. **Run the example**:

```bash
go run examples/basic.go
```

The example demonstrates the full Stagehand workflow: starting a session, navigating to a page, observing actions, clicking elements, extracting data, and running an autonomous agent.

### Request fields

The stagehand library uses the [`omitzero`](https://tip.golang.org/doc/go1.24#encodingjsonpkgencodingjson)
semantics from the Go 1.24+ `encoding/json` release for request fields.

Required primitive fields (`int64`, `string`, etc.) feature the tag `json:"...,required"`. These
fields are always serialized, even their zero values.

Optional primitive types are wrapped in a `param.Opt[T]`. These fields can be set with the provided constructors, `stagehand.String(string)`, `stagehand.Int(int64)`, etc.

Any `param.Opt[T]`, map, slice, struct or string enum uses the
tag `json:"...,omitzero"`. Its zero value is considered omitted.

The `param.IsOmitted(any)` function can confirm the presence of any `omitzero` field.

```go
p := stagehand.ExampleParams{
	ID:   "id_xxx",                // required property
	Name: stagehand.String("..."), // optional property

	Point: stagehand.Point{
		X: 0,                // required field will serialize as 0
		Y: stagehand.Int(1), // optional field will serialize as 1
		// ... omitted non-required fields will not be serialized
	},

	Origin: stagehand.Origin{}, // the zero value of [Origin] is considered omitted
}
```

To send `null` instead of a `param.Opt[T]`, use `param.Null[T]()`.
To send `null` instead of a struct `T`, use `param.NullStruct[T]()`.

```go
p.Name = param.Null[string]()       // 'null' instead of string
p.Point = param.NullStruct[Point]() // 'null' instead of struct

param.IsNull(p.Name)  // true
param.IsNull(p.Point) // true
```

Request structs contain a `.SetExtraFields(map[string]any)` method which can send non-conforming
fields in the request body. Extra fields overwrite any struct fields with a matching
key. For security reasons, only use `SetExtraFields` with trusted data.

To send a custom value instead of a struct, use `param.Override[T](value)`.

```go
// In cases where the API specifies a given type,
// but you want to send something else, use [SetExtraFields]:
p.SetExtraFields(map[string]any{
	"x": 0.01, // send "x" as a float instead of int
})

// Send a number instead of an object
custom := param.Override[stagehand.FooParams](12)
```

### Request unions

Unions are represented as a struct with one field, prefixed by "Of", for each of its variants.
Only one field can be non-zero, and that non-zero field is the one that will be serialized.

Sub-properties of the union can be accessed via methods on the union struct.
These methods return a mutable pointer to the underlying data, if present.

```go
// Only one field can be non-zero, use param.IsOmitted() to check if a field is set
type AnimalUnionParam struct {
	OfCat *Cat `json:",omitzero,inline"`
	OfDog *Dog `json:",omitzero,inline"`
}

animal := AnimalUnionParam{
	OfCat: &Cat{
		Name: "Whiskers",
		Owner: PersonParam{
			Address: AddressParam{Street: "3333 Coyote Hill Rd", Zip: 0},
		},
	},
}

// Mutating a field
if address := animal.GetOwner().GetAddress(); address != nil {
	address.ZipCode = 94304
}
```

### Response objects

All fields in response structs are ordinary value types (not pointers or wrappers).
Response structs also include a special `JSON` field containing metadata about
each property.

```go
type Animal struct {
	Name   string `json:"name,nullable"`
	Owners int    `json:"owners"`
	Age    int    `json:"age"`
	JSON   struct {
		Name        respjson.Field
		Owners      respjson.Field
		Age         respjson.Field
		ExtraFields map[string]respjson.Field
	} `json:"-"`
}
```

To handle optional data, use the `.Valid()` method on the JSON field.
`.Valid()` returns true only if the field was present in the response, was not `null`, and was unmarshaled successfully.

If `.Valid()` is false, the corresponding field will simply be its zero value.

```go
raw := `{"owners": 1, "name": null}`

var res Animal
json.Unmarshal([]byte(raw), &res)

// Accessing regular fields

res.Owners // 1
res.Name   // ""
res.Age    // 0

// Optional field checks

res.JSON.Owners.Valid() // true
res.JSON.Name.Valid()   // false
res.JSON.Age.Valid()    // false

// Raw JSON values

res.JSON.Owners.Raw()                  // "1"
res.JSON.Name.Raw() == "null"          // true
res.JSON.Name.Raw() == respjson.Null   // true
res.JSON.Age.Raw() == ""               // true
res.JSON.Age.Raw() == respjson.Omitted // true
```

These `.JSON` structs also include an `ExtraFields` map containing
any properties in the json response that were not specified
in the struct. This can be useful for API features not yet
present in the SDK.

```go
body := res.JSON.ExtraFields["my_unexpected_field"].Raw()
```

### Response Unions

In responses, unions are represented by a flattened struct containing all possible fields from each of the
object variants.
To convert it to a variant use the `.AsFooVariant()` method or the `.AsAny()` method if present.

If a response value union contains primitive values, primitive fields will be alongside
the properties but prefixed with `Of` and feature the tag `json:"...,inline"`.

```go
type AnimalUnion struct {
	// From variants [Dog], [Cat]
	Owner Person `json:"owner"`
	// From variant [Dog]
	DogBreed string `json:"dog_breed"`
	// From variant [Cat]
	CatBreed string `json:"cat_breed"`
	// ...

	JSON struct {
		Owner respjson.Field
		// ...
	} `json:"-"`
}

// If animal variant
if animal.Owner.Address.ZipCode == "" {
	panic("missing zip code")
}

// Switch on the variant
switch variant := animal.AsAny().(type) {
case Dog:
case Cat:
default:
	panic("unexpected type")
}
```

### RequestOptions

This library uses the functional options pattern. Functions defined in the
`option` package return a `RequestOption`, which is a closure that mutates a
`RequestConfig`. These options can be supplied to the client or at individual
requests. For example:

```go
client := stagehand.NewClient(
	// Adds a header to every request made by the client
	option.WithHeader("X-Some-Header", "custom_header_info"),
)

client.Sessions.Start(context.TODO(), ...,
	// Override the header
	option.WithHeader("X-Some-Header", "some_other_custom_header_info"),
	// Add an undocumented field to the request body, using sjson syntax
	option.WithJSONSet("some.json.path", map[string]string{"my": "object"}),
)
```

The request option `option.WithDebugLog(nil)` may be helpful while debugging.

See the [full list of request options](https://pkg.go.dev/github.com/browserbase/stagehand-go/option).

### Errors

When the API returns a non-success status code, we return an error with type
`*stagehand.Error`. This contains the `StatusCode`, `*http.Request`, and
`*http.Response` values of the request, as well as the JSON of the error body
(much like other response objects in the SDK).

To handle errors, we recommend that you use the `errors.As` pattern:

```go
_, err := client.Sessions.Start(context.TODO(), stagehand.SessionStartParams{
	ModelName: "openai/gpt-5-nano",
})
if err != nil {
	var apierr *stagehand.Error
	if errors.As(err, &apierr) {
		println(string(apierr.DumpRequest(true)))  // Prints the serialized HTTP request
		println(string(apierr.DumpResponse(true))) // Prints the serialized HTTP response
	}
	panic(err.Error()) // POST "/v1/sessions/start": 400 Bad Request { ... }
}
```

When other errors occur, they are returned unwrapped; for example,
if HTTP transport fails, you might receive `*url.Error` wrapping `*net.OpError`.

### Timeouts

Requests do not time out by default; use context to configure a timeout for a request lifecycle.

Note that if a request is [retried](#retries), the context timeout does not start over.
To set a per-retry timeout, use `option.WithRequestTimeout()`.

```go
// This sets the timeout for the request, including all the retries.
ctx, cancel := context.WithTimeout(context.Background(), 5*time.Minute)
defer cancel()
client.Sessions.Start(
	ctx,
	stagehand.SessionStartParams{
		ModelName: "openai/gpt-5-nano",
	},
	// This sets the per-retry timeout
	option.WithRequestTimeout(20*time.Second),
)
```

### Retries

Certain errors will be automatically retried 2 times by default, with a short exponential backoff.
We retry by default all connection errors, 408 Request Timeout, 409 Conflict, 429 Rate Limit,
and >=500 Internal errors.

You can use the `WithMaxRetries` option to configure or disable this:

```go
// Configure the default for all requests:
client := stagehand.NewClient(
	option.WithMaxRetries(0), // default is 2
)

// Override per-request:
client.Sessions.Start(
	context.TODO(),
	stagehand.SessionStartParams{
		ModelName: "openai/gpt-5-nano",
	},
	option.WithMaxRetries(5),
)
```

### Accessing raw response data (e.g. response headers)

You can access the raw HTTP response data by using the `option.WithResponseInto()` request option. This is useful when
you need to examine response headers, status codes, or other details.

```go
// Create a variable to store the HTTP response
var response *http.Response
session, err := client.Sessions.Start(
	context.TODO(),
	stagehand.SessionStartParams{
		ModelName: "openai/gpt-5-nano",
	},
	option.WithResponseInto(&response),
)
if err != nil {
	// handle error
}
fmt.Printf("%+v\n", session)

fmt.Printf("Status Code: %d\n", response.StatusCode)
fmt.Printf("Headers: %+#v\n", response.Header)
```

### Making custom/undocumented requests

This library is typed for convenient access to the documented API. If you need to access undocumented
endpoints, params, or response properties, the library can still be used.

#### Undocumented endpoints

To make requests to undocumented endpoints, you can use `client.Get`, `client.Post`, and other HTTP verbs.
`RequestOptions` on the client, such as retries, will be respected when making these requests.

```go
var (
    // params can be an io.Reader, a []byte, an encoding/json serializable object,
    // or a "…Params" struct defined in this library.
    params map[string]any

    // result can be a []byte, *http.Response, an encoding/json deserializable object,
    // or a model defined in this library.
    result *http.Response
)
err := client.Post(context.Background(), "/unspecified", params, &result)
if err != nil {
    …
}
```

#### Undocumented request params

To make requests using undocumented parameters, you may use either the `option.WithQuerySet()`
or the `option.WithJSONSet()` methods.

```go
params := FooNewParams{
    ID:   "id_xxxx",
    Data: FooNewParamsData{
        FirstName: stagehand.String("John"),
    },
}
client.Foo.New(context.Background(), params, option.WithJSONSet("data.last_name", "Doe"))
```

#### Undocumented response properties

To access undocumented response properties, you may either access the raw JSON of the response as a string
with `result.JSON.RawJSON()`, or get the raw JSON of a particular field on the result with
`result.JSON.Foo.Raw()`.

Any fields that are not present on the response struct will be saved and can be accessed by `result.JSON.ExtraFields()` which returns the extra fields as a `map[string]Field`.

### Middleware

We provide `option.WithMiddleware` which applies the given
middleware to requests.

```go
func Logger(req *http.Request, next option.MiddlewareNext) (res *http.Response, err error) {
	// Before the request
	start := time.Now()
	LogReq(req)

	// Forward the request to the next handler
	res, err = next(req)

	// Handle stuff after the request
	end := time.Now()
	LogRes(res, err, end.Sub(start))

	return res, err
}

client := stagehand.NewClient(
	option.WithMiddleware(Logger),
)
```

When multiple middlewares are provided as variadic arguments, the middlewares
are applied left to right. If `option.WithMiddleware` is given
multiple times, for example first in the client then the method, the
middleware in the client will run first and the middleware given in the method
will run next.

You may also replace the default `http.Client` with
`option.WithHTTPClient(client)`. Only one http client is
accepted (this overwrites any previous client) and receives requests after any
middleware has been applied.

## Semantic versioning

This package generally follows [SemVer](https://semver.org/spec/v2.0.0.html) conventions, though certain backwards-incompatible changes may be released as minor versions:

1. Changes to library internals which are technically public but not intended or documented for external use. _(Please open a GitHub issue to let us know if you are relying on such internals.)_
2. Changes that we do not expect to impact the vast majority of users in practice.

We take backwards-compatibility seriously and work hard to ensure you can rely on a smooth upgrade experience.

We are keen for your feedback; please open an [issue](https://www.github.com/browserbase/stagehand-go/issues) with questions, bugs, or suggestions.

## Contributing

See [the contributing documentation](https://github.com/browserbase/stagehand-go/blob/main/CONTRIBUTING.md).

================================================
FILE: packages/docs/v3/sdk/java.mdx
================================================
---
title: "Java SDK"
description: "Official Stagehand SDK for Java"
---

<Note>
  This documentation is automatically synced from the [Java SDK GitHub repository](https://github.com/browserbase/stagehand-java).
</Note>

## What is Stagehand?

Stagehand is a browser automation framework used to control web browsers with natural language and code. By combining the power of AI with the precision of code, Stagehand makes web automation flexible, maintainable, and actually reliable.

## Why Stagehand?

Most existing browser automation tools either require you to write low-level code in a framework like Selenium, Playwright, or Puppeteer, or use high-level agents that can be unpredictable in production. By letting developers choose what to write in code vs. natural language (and bridging the gap between the two) Stagehand is the natural choice for browser automations in production.

1. **Choose when to write code vs. natural language**: use AI when you want to navigate unfamiliar pages, and use code when you know exactly what you want to do.

2. **Go from AI-driven to repeatable workflows**: Stagehand lets you preview AI actions before running them, and also helps you easily cache repeatable actions to save time and tokens.

3. **Write once, run forever**: Stagehand's auto-caching combined with self-healing remembers previous actions, runs without LLM inference, and knows when to involve AI whenever the website changes and your automation breaks.

## Installation

### Gradle

```java
implementation("com.browserbase.api:stagehand-java:0.6.1")
```

### Maven

```xml
<dependency>
  <groupId>com.browserbase.api</groupId>
  <artifactId>stagehand-java</artifactId>
  <version>0.6.1</version>
</dependency>
```

## Requirements

This library requires Java 8 through Java 21. Java 22+ is not currently supported.

## Running the Example

A complete working example is available at [`stagehand-java-example/src/main/java/com/stagehand/api/example/Main.java`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-example/src/main/java/com/stagehand/api/example/Main.java).

To run it, first export the required environment variables, then use Gradle:

```bash
export BROWSERBASE_API_KEY="your-bb-api-key"
export BROWSERBASE_PROJECT_ID="your-bb-project-uuid"
export MODEL_API_KEY="sk-proj-your-llm-api-key"

./gradlew :stagehand-java-example:run
```

## Usage

This example demonstrates the full Stagehand workflow: starting a session, navigating to a page, observing possible actions, acting on elements, extracting data, and running an autonomous agent.

```java
import com.browserbase.api.client.StagehandClient;
import com.browserbase.api.client.okhttp.StagehandOkHttpClient;
import com.browserbase.api.core.JsonValue;
import com.browserbase.api.models.sessions.*;

import java.util.List;
import java.util.Map;
import java.util.Optional;

public class Main {
    public static void main(String[] args) {
        // Create client using environment variables:
        // BROWSERBASE_API_KEY, BROWSERBASE_PROJECT_ID, MODEL_API_KEY
        StagehandClient client = StagehandOkHttpClient.fromEnv();

        // Start a new browser session
        SessionStartResponse startResponse = client.sessions().start(
            SessionStartParams.builder()
                .modelName("openai/gpt-5-nano")
                .build()
        );

        String sessionId = startResponse.data().sessionId();
        System.out.println("Session started: " + sessionId);

        try {
            // Navigate to a webpage
            client.sessions().navigate(
                SessionNavigateParams.builder()
                    .id(sessionId)
                    .url("https://news.ycombinator.com")
                    .build()
            );
            System.out.println("Navigated to Hacker News");

            // Observe to find possible actions on the page
            SessionObserveResponse observeResponse = client.sessions().observe(
                SessionObserveParams.builder()
                    .id(sessionId)
                    .instruction("find the link to view comments for the top post")
                    .build()
            );

            List<SessionObserveResponse.Data.Result> results = observeResponse.data().result();
            System.out.println("Found " + results.size() + " possible actions");

            if (results.isEmpty()) {
                System.out.println("No actions found");
                return;
            }

            // Take the first action returned by Observe
            // Convert the result to an Action to pass to Act
            SessionObserveResponse.Data.Result result = results.get(0);
            Action action = JsonValue.from(result).convert(Action.class);
            System.out.println("Acting on: " + action.description());

            // Pass the structured action to Act
            SessionActResponse actResponse = client.sessions().act(
                SessionActParams.builder()
                    .id(sessionId)
                    .input(action)
                    .build()
            );
            System.out.println("Act completed: " + actResponse.data().result().message());

            // Extract structured data from the page using a JSON schema
            SessionExtractResponse extractResponse = client.sessions().extract(
                SessionExtractParams.builder()
                    .id(sessionId)
                    .instruction("extract the text of the top comment on this page")
                    .schema(SessionExtractParams.Schema.builder()
                        .putAdditionalProperty("type", JsonValue.from("object"))
                        .putAdditionalProperty("properties", JsonValue.from(Map.of(
                            "commentText", Map.of(
                                "type", "string",
                                "description", "The text content of the top comment"
                            ),
                            "author", Map.of(
                                "type", "string",
                                "description", "The username of the comment author"
                            )
                        )))
                        .putAdditionalProperty("required", JsonValue.from(List.of("commentText")))
                        .build())
                    .build()
            );

            JsonValue extractedResult = extractResponse.data()._result();
            System.out.println("Extracted data: " + extractedResult);

            // Get the author from the extracted data
            String author = extractedResult.asObject()
                .flatMap(obj -> Optional.ofNullable(obj.get("author")))
                .flatMap(JsonValue::asString)
                .orElse("unknown");
            System.out.println("Looking up profile for author: " + author);

            // Run an autonomous agent to accomplish a complex task
            SessionExecuteResponse executeResponse = client.sessions().execute(
                SessionExecuteParams.builder()
                    .id(sessionId)
                    .executeOptions(SessionExecuteParams.ExecuteOptions.builder()
                        .instruction(String.format(
                            "Find any personal website, GitHub, or LinkedIn profile for user '%s'. " +
                            "Click on their username to view their profile page.",
                            author
                        ))
                        .maxSteps(10.0)
                        .build())
                    .agentConfig(SessionExecuteParams.AgentConfig.builder()
                        .model(ModelConfig.ofModelConfigObject(
                            ModelConfig.ModelConfigObject.builder()
                                .modelName("openai/gpt-5-nano")
                                .apiKey(System.getenv("MODEL_API_KEY"))
                                .build()
                        ))
                        .cua(false)
                        .build())
                    .build()
            );

            System.out.println("Agent completed: " + executeResponse.data().result().message());
            System.out.println("Agent success: " + executeResponse.data().result().success());

        } finally {
            // End the browser session to clean up resources
            client.sessions().end(
                SessionEndParams.builder()
                    .id(sessionId)
                    .build()
            );
            System.out.println("Session ended");
        }
    }
}
```

## Client configuration

Configure the client using system properties or environment variables:

```java
import com.browserbase.api.client.StagehandClient;
import com.browserbase.api.client.okhttp.StagehandOkHttpClient;

// Configures using the `stagehand.browserbaseApiKey`, `stagehand.browserbaseProjectId`, `stagehand.modelApiKey` and `stagehand.baseUrl` system properties
// Or configures using the `BROWSERBASE_API_KEY`, `BROWSERBASE_PROJECT_ID`, `MODEL_API_KEY` and `STAGEHAND_BASE_URL` environment variables
StagehandClient client = StagehandOkHttpClient.fromEnv();
```

Or manually:

```java
import com.browserbase.api.client.StagehandClient;
import com.browserbase.api.client.okhttp.StagehandOkHttpClient;

StagehandClient client = StagehandOkHttpClient.builder()
    .browserbaseApiKey("My Browserbase API Key")
    .browserbaseProjectId("My Browserbase Project ID")
    .modelApiKey("My Model API Key")
    .build();
```

Or using a combination of the two approaches:

```java
import com.browserbase.api.client.StagehandClient;
import com.browserbase.api.client.okhttp.StagehandOkHttpClient;

StagehandClient client = StagehandOkHttpClient.builder()
    // Configures using the `stagehand.browserbaseApiKey`, `stagehand.browserbaseProjectId`, `stagehand.modelApiKey` and `stagehand.baseUrl` system properties
    // Or configures using the `BROWSERBASE_API_KEY`, `BROWSERBASE_PROJECT_ID`, `MODEL_API_KEY` and `STAGEHAND_BASE_URL` environment variables
    .fromEnv()
    .browserbaseApiKey("My Browserbase API Key")
    .build();
```

See this table for the available options:

| Setter                 | System property                  | Environment variable     | Required | Default value                             |
| ---------------------- | -------------------------------- | ------------------------ | -------- | ----------------------------------------- |
| `browserbaseApiKey`    | `stagehand.browserbaseApiKey`    | `BROWSERBASE_API_KEY`    | true     | -                                         |
| `browserbaseProjectId` | `stagehand.browserbaseProjectId` | `BROWSERBASE_PROJECT_ID` | true     | -                                         |
| `modelApiKey`          | `stagehand.modelApiKey`          | `MODEL_API_KEY`          | true     | -                                         |
| `baseUrl`              | `stagehand.baseUrl`              | `STAGEHAND_BASE_URL`     | true     | `"https://api.stagehand.browserbase.com"` |

System properties take precedence over environment variables.

> [!TIP]
> Don't create more than one client in the same application. Each client has a connection pool and
> thread pools, which are more efficient to share between requests.

### Modifying configuration

To temporarily use a modified client configuration, while reusing the same connection and thread pools, call `withOptions()` on any client or service:

```java
import com.browserbase.api.client.StagehandClient;

StagehandClient clientWithOptions = client.withOptions(optionsBuilder -> {
    optionsBuilder.modelApiKey("sk-your-llm-api-key-here");
    optionsBuilder.maxRetries(42);
});
```

The `withOptions()` method does not affect the original client or service.

## Requests and responses

To send a request to the Stagehand API, build an instance of some `Params` class and pass it to the corresponding client method. When the response is received, it will be deserialized into an instance of a Java class.

For example, `client.sessions().act(...)` should be called with an instance of `SessionActParams`, and it will return an instance of `SessionActResponse`.

## Immutability

Each class in the SDK has an associated [builder](https://blogs.oracle.com/javamagazine/post/exploring-joshua-blochs-builder-design-pattern-in-java) or factory method for constructing it.

Each class is [immutable](https://docs.oracle.com/javase/tutorial/essential/concurrency/immutable.html) once constructed. If the class has an associated builder, then it has a `toBuilder()` method, which can be used to convert it back to a builder for making a modified copy.

Because each class is immutable, builder modification will _never_ affect already built class instances.

## Asynchronous execution

The default client is synchronous. To switch to asynchronous execution, call the `async()` method:

```java
import com.browserbase.api.client.StagehandClient;
import com.browserbase.api.client.okhttp.StagehandOkHttpClient;
import com.browserbase.api.models.sessions.SessionActParams;
import com.browserbase.api.models.sessions.SessionActResponse;
import java.util.concurrent.CompletableFuture;

// Configures using the `stagehand.browserbaseApiKey`, `stagehand.browserbaseProjectId`, `stagehand.modelApiKey` and `stagehand.baseUrl` system properties
// Or configures using the `BROWSERBASE_API_KEY`, `BROWSERBASE_PROJECT_ID`, `MODEL_API_KEY` and `STAGEHAND_BASE_URL` environment variables
StagehandClient client = StagehandOkHttpClient.fromEnv();

SessionActParams params = SessionActParams.builder()
    .id("00000000-your-session-id-000000000000")
    .input("click the first link on the page")
    .build();
CompletableFuture<SessionActResponse> response = client.async().sessions().act(params);
```

Or create an asynchronous client from the beginning:

```java
import com.browserbase.api.client.StagehandClientAsync;
import com.browserbase.api.client.okhttp.StagehandOkHttpClientAsync;
import com.browserbase.api.models.sessions.SessionActParams;
import com.browserbase.api.models.sessions.SessionActResponse;
import java.util.concurrent.CompletableFuture;

// Configures using the `stagehand.browserbaseApiKey`, `stagehand.browserbaseProjectId`, `stagehand.modelApiKey` and `stagehand.baseUrl` system properties
// Or configures using the `BROWSERBASE_API_KEY`, `BROWSERBASE_PROJECT_ID`, `MODEL_API_KEY` and `STAGEHAND_BASE_URL` environment variables
StagehandClientAsync client = StagehandOkHttpClientAsync.fromEnv();

SessionActParams params = SessionActParams.builder()
    .id("00000000-your-session-id-000000000000")
    .input("click the first link on the page")
    .build();
CompletableFuture<SessionActResponse> response = client.sessions().act(params);
```

The asynchronous client supports the same options as the synchronous one, except most methods return `CompletableFuture`s.

## Streaming

The SDK defines methods that return response "chunk" streams, where each chunk can be individually processed as soon as it arrives instead of waiting on the full response. Streaming methods generally correspond to [SSE](https://developer.mozilla.org/en-US/docs/Web/API/Server-sent_events) or [JSONL](https://jsonlines.org) responses.

Some of these methods may have streaming and non-streaming variants, but a streaming method will always have a `Streaming` suffix in its name, even if it doesn't have a non-streaming variant.

These streaming methods return [`StreamResponse`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-core/src/main/kotlin/com/browserbase/api/core/http/StreamResponse.kt) for synchronous clients:

```java
import com.browserbase.api.core.http.StreamResponse;
import com.browserbase.api.models.sessions.StreamEvent;

try (StreamResponse<StreamEvent> streamResponse = client.sessions().actStreaming(params)) {
    streamResponse.stream().forEach(chunk -> {
        System.out.println(chunk);
    });
    System.out.println("No more chunks!");
}
```

Or [`AsyncStreamResponse`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-core/src/main/kotlin/com/browserbase/api/core/http/AsyncStreamResponse.kt) for asynchronous clients:

```java
import com.browserbase.api.core.http.AsyncStreamResponse;
import com.browserbase.api.models.sessions.StreamEvent;
import java.util.Optional;

client.async().sessions().actStreaming(params).subscribe(chunk -> {
    System.out.println(chunk);
});

// If you need to handle errors or completion of the stream
client.async().sessions().actStreaming(params).subscribe(new AsyncStreamResponse.Handler<>() {
    @Override
    public void onNext(StreamEvent chunk) {
        System.out.println(chunk);
    }

    @Override
    public void onComplete(Optional<Throwable> error) {
        if (error.isPresent()) {
            System.out.println("Something went wrong!");
            throw new RuntimeException(error.get());
        } else {
            System.out.println("No more chunks!");
        }
    }
});

// Or use futures
client.async().sessions().actStreaming(params)
    .subscribe(chunk -> {
        System.out.println(chunk);
    })
    .onCompleteFuture()
    .whenComplete((unused, error) -> {
        if (error != null) {
            System.out.println("Something went wrong!");
            throw new RuntimeException(error);
        } else {
            System.out.println("No more chunks!");
        }
    });
```

Async streaming uses a dedicated per-client cached thread pool [`Executor`](https://docs.oracle.com/javase/8/docs/api/java/util/concurrent/Executor.html) to stream without blocking the current thread. This default is suitable for most purposes.

To use a different `Executor`, configure the subscription using the `executor` parameter:

```java
import java.util.concurrent.Executor;
import java.util.concurrent.Executors;

Executor executor = Executors.newFixedThreadPool(4);
client.async().sessions().actStreaming(params).subscribe(
    chunk -> System.out.println(chunk), executor
);
```

Or configure the client globally using the `streamHandlerExecutor` method:

```java
import com.browserbase.api.client.StagehandClient;
import com.browserbase.api.client.okhttp.StagehandOkHttpClient;
import java.util.concurrent.Executors;

StagehandClient client = StagehandOkHttpClient.builder()
    .fromEnv()
    .streamHandlerExecutor(Executors.newFixedThreadPool(4))
    .build();
```

## Raw responses

The SDK defines methods that deserialize responses into instances of Java classes. However, these methods don't provide access to the response headers, status code, or the raw response body.

To access this data, prefix any HTTP method call on a client or service with `withRawResponse()`:

```java
import com.browserbase.api.core.http.Headers;
import com.browserbase.api.core.http.HttpResponseFor;
import com.browserbase.api.models.sessions.SessionStartParams;
import com.browserbase.api.models.sessions.SessionStartResponse;

SessionStartParams params = SessionStartParams.builder()
    .modelName("openai/gpt-5-nano")
    .build();
HttpResponseFor<SessionStartResponse> response = client.sessions().withRawResponse().start(params);

int statusCode = response.statusCode();
Headers headers = response.headers();
```

You can still deserialize the response into an instance of a Java class if needed:

```java
import com.browserbase.api.models.sessions.SessionStartResponse;

SessionStartResponse parsedResponse = response.parse();
```

## Error handling

The SDK throws custom unchecked exception types:

- [`StagehandServiceException`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-core/src/main/kotlin/com/browserbase/api/errors/StagehandServiceException.kt): Base class for HTTP errors. See this table for which exception subclass is thrown for each HTTP status code:

  | Status | Exception                                                                                                                          |
  | ------ | ---------------------------------------------------------------------------------------------------------------------------------- |
  | 400    | [`BadRequestException`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-core/src/main/kotlin/com/browserbase/api/errors/BadRequestException.kt)                     |
  | 401    | [`UnauthorizedException`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-core/src/main/kotlin/com/browserbase/api/errors/UnauthorizedException.kt)                 |
  | 403    | [`PermissionDeniedException`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-core/src/main/kotlin/com/browserbase/api/errors/PermissionDeniedException.kt)         |
  | 404    | [`NotFoundException`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-core/src/main/kotlin/com/browserbase/api/errors/NotFoundException.kt)                         |
  | 422    | [`UnprocessableEntityException`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-core/src/main/kotlin/com/browserbase/api/errors/UnprocessableEntityException.kt)   |
  | 429    | [`RateLimitException`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-core/src/main/kotlin/com/browserbase/api/errors/RateLimitException.kt)                       |
  | 5xx    | [`InternalServerException`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-core/src/main/kotlin/com/browserbase/api/errors/InternalServerException.kt)             |
  | others | [`UnexpectedStatusCodeException`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-core/src/main/kotlin/com/browserbase/api/errors/UnexpectedStatusCodeException.kt) |

  [`SseException`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-core/src/main/kotlin/com/browserbase/api/errors/SseException.kt) is thrown for errors encountered during [SSE streaming](https://developer.mozilla.org/en-US/docs/Web/API/Server-sent_events) after a successful initial HTTP response.

- [`StagehandIoException`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-core/src/main/kotlin/com/browserbase/api/errors/StagehandIoException.kt): I/O networking errors.

- [`StagehandRetryableException`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-core/src/main/kotlin/com/browserbase/api/errors/StagehandRetryableException.kt): Generic error indicating a failure that could be retried by the client.

- [`StagehandInvalidDataException`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-core/src/main/kotlin/com/browserbase/api/errors/StagehandInvalidDataException.kt): Failure to interpret successfully parsed data. For example, when accessing a property that's supposed to be required, but the API unexpectedly omitted it from the response.

- [`StagehandException`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-core/src/main/kotlin/com/browserbase/api/errors/StagehandException.kt): Base class for all exceptions. Most errors will result in one of the previously mentioned ones, but completely generic errors may be thrown using the base class.

## Logging

The SDK uses the standard [OkHttp logging interceptor](https://github.com/square/okhttp/tree/master/okhttp-logging-interceptor).

Enable logging by setting the `STAGEHAND_LOG` environment variable to `info`:

```sh
export STAGEHAND_LOG=info
```

Or to `debug` for more verbose logging:

```sh
export STAGEHAND_LOG=debug
```

## ProGuard and R8

Although the SDK uses reflection, it is still usable with [ProGuard](https://github.com/Guardsquare/proguard) and [R8](https://developer.android.com/topic/performance/app-optimization/enable-app-optimization) because `stagehand-java-core` is published with a [configuration file](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-core/src/main/resources/META-INF/proguard/stagehand-java-core.pro) containing [keep rules](https://www.guardsquare.com/manual/configuration/usage).

ProGuard and R8 should automatically detect and use the published rules, but you can also manually copy the keep rules if necessary.

## Jackson

The SDK depends on [Jackson](https://github.com/FasterXML/jackson) for JSON serialization/deserialization. It is compatible with version 2.13.4 or higher, but depends on version 2.18.2 by default.

The SDK throws an exception if it detects an incompatible Jackson version at runtime (e.g. if the default version was overridden in your Maven or Gradle config).

If the SDK threw an exception, but you're _certain_ the version is compatible, then disable the version check using the `checkJacksonVersionCompatibility` method on [`StagehandOkHttpClient`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-client-okhttp/src/main/kotlin/com/browserbase/api/client/okhttp/StagehandOkHttpClient.kt) or [`StagehandOkHttpClientAsync`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-client-okhttp/src/main/kotlin/com/browserbase/api/client/okhttp/StagehandOkHttpClientAsync.kt).

> [!CAUTION]
> We make no guarantee that the SDK works correctly when the Jackson version check is disabled.

## Network options

### Retries

The SDK automatically retries 2 times by default, with a short exponential backoff between requests.

Only the following error types are retried:

- Connection errors (for example, due to a network connectivity problem)
- 408 Request Timeout
- 409 Conflict
- 429 Rate Limit
- 5xx Internal

The API may also explicitly instruct the SDK to retry or not retry a request.

To set a custom number of retries, configure the client using the `maxRetries` method:

```java
import com.browserbase.api.client.StagehandClient;
import com.browserbase.api.client.okhttp.StagehandOkHttpClient;

StagehandClient client = StagehandOkHttpClient.builder()
    .fromEnv()
    .maxRetries(4)
    .build();
```

### Timeouts

Requests time out after 1 minute by default.

To set a custom timeout, configure the method call using the `timeout` method:

```java
import com.browserbase.api.models.sessions.SessionStartResponse;

SessionStartResponse response = client.sessions().start(
  params, RequestOptions.builder().timeout(Duration.ofSeconds(30)).build()
);
```

Or configure the default for all method calls at the client level:

```java
import com.browserbase.api.client.StagehandClient;
import com.browserbase.api.client.okhttp.StagehandOkHttpClient;
import java.time.Duration;

StagehandClient client = StagehandOkHttpClient.builder()
    .fromEnv()
    .timeout(Duration.ofSeconds(30))
    .build();
```

### Proxies

To route requests through a proxy, configure the client using the `proxy` method:

```java
import com.browserbase.api.client.StagehandClient;
import com.browserbase.api.client.okhttp.StagehandOkHttpClient;
import java.net.InetSocketAddress;
import java.net.Proxy;

StagehandClient client = StagehandOkHttpClient.builder()
    .fromEnv()
    .proxy(new Proxy(
      Proxy.Type.HTTP, new InetSocketAddress(
        "example.com", 8080
      )
    ))
    .build();
```

### HTTPS

> [!NOTE]
> Most applications should not call these methods, and instead use the system defaults. The defaults include
> special optimizations that can be lost if the implementations are modified.

To configure how HTTPS connections are secured, configure the client using the `sslSocketFactory`, `trustManager`, and `hostnameVerifier` methods:

```java
import com.browserbase.api.client.StagehandClient;
import com.browserbase.api.client.okhttp.StagehandOkHttpClient;

StagehandClient client = StagehandOkHttpClient.builder()
    .fromEnv()
    // If `sslSocketFactory` is set, then `trustManager` must be set, and vice versa.
    .sslSocketFactory(yourSSLSocketFactory)
    .trustManager(yourTrustManager)
    .hostnameVerifier(yourHostnameVerifier)
    .build();
```

### Custom HTTP client

The SDK consists of three artifacts:

- `stagehand-java-core`
  - Contains core SDK logic
  - Does not depend on [OkHttp](https://square.github.io/okhttp)
  - Exposes [`StagehandClient`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-core/src/main/kotlin/com/browserbase/api/client/StagehandClient.kt), [`StagehandClientAsync`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-core/src/main/kotlin/com/browserbase/api/client/StagehandClientAsync.kt), [`StagehandClientImpl`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-core/src/main/kotlin/com/browserbase/api/client/StagehandClientImpl.kt), and [`StagehandClientAsyncImpl`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-core/src/main/kotlin/com/browserbase/api/client/StagehandClientAsyncImpl.kt), all of which can work with any HTTP client
- `stagehand-java-client-okhttp`
  - Depends on [OkHttp](https://square.github.io/okhttp)
  - Exposes [`StagehandOkHttpClient`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-client-okhttp/src/main/kotlin/com/browserbase/api/client/okhttp/StagehandOkHttpClient.kt) and [`StagehandOkHttpClientAsync`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-client-okhttp/src/main/kotlin/com/browserbase/api/client/okhttp/StagehandOkHttpClientAsync.kt), which provide a way to construct [`StagehandClientImpl`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-core/src/main/kotlin/com/browserbase/api/client/StagehandClientImpl.kt) and [`StagehandClientAsyncImpl`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-core/src/main/kotlin/com/browserbase/api/client/StagehandClientAsyncImpl.kt), respectively, using OkHttp
- `stagehand-java`
  - Depends on and exposes the APIs of both `stagehand-java-core` and `stagehand-java-client-okhttp`
  - Does not have its own logic

This structure allows replacing the SDK's default HTTP client without pulling in unnecessary dependencies.

#### Customized [`OkHttpClient`](https://square.github.io/okhttp/3.x/okhttp/okhttp3/OkHttpClient.html)

> [!TIP]
> Try the available [network options](#network-options) before replacing the default client.

To use a customized `OkHttpClient`:

1. Replace your [`stagehand-java` dependency](#installation) with `stagehand-java-core`
2. Copy `stagehand-java-client-okhttp`'s [`OkHttpClient`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-client-okhttp/src/main/kotlin/com/browserbase/api/client/okhttp/OkHttpClient.kt) class into your code and customize it
3. Construct [`StagehandClientImpl`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-core/src/main/kotlin/com/browserbase/api/client/StagehandClientImpl.kt) or [`StagehandClientAsyncImpl`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-core/src/main/kotlin/com/browserbase/api/client/StagehandClientAsyncImpl.kt), similarly to [`StagehandOkHttpClient`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-client-okhttp/src/main/kotlin/com/browserbase/api/client/okhttp/StagehandOkHttpClient.kt) or [`StagehandOkHttpClientAsync`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-client-okhttp/src/main/kotlin/com/browserbase/api/client/okhttp/StagehandOkHttpClientAsync.kt), using your customized client

#### Completely custom HTTP client

To use a completely custom HTTP client:

1. Replace your [`stagehand-java` dependency](#installation) with `stagehand-java-core`
2. Write a class that implements the [`HttpClient`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-core/src/main/kotlin/com/browserbase/api/core/http/HttpClient.kt) interface
3. Construct [`StagehandClientImpl`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-core/src/main/kotlin/com/browserbase/api/client/StagehandClientImpl.kt) or [`StagehandClientAsyncImpl`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-core/src/main/kotlin/com/browserbase/api/client/StagehandClientAsyncImpl.kt), similarly to [`StagehandOkHttpClient`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-client-okhttp/src/main/kotlin/com/browserbase/api/client/okhttp/StagehandOkHttpClient.kt) or [`StagehandOkHttpClientAsync`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-client-okhttp/src/main/kotlin/com/browserbase/api/client/okhttp/StagehandOkHttpClientAsync.kt), using your new client class

## Undocumented API functionality

The SDK is typed for convenient usage of the documented API. However, it also supports working with undocumented or not yet supported parts of the API.

### Parameters

To set undocumented parameters, call the `putAdditionalHeader`, `putAdditionalQueryParam`, or `putAdditionalBodyProperty` methods on any `Params` class:

```java
import com.browserbase.api.core.JsonValue;
import com.browserbase.api.models.sessions.SessionActParams;

SessionActParams params = SessionActParams.builder()
    .putAdditionalHeader("Secret-Header", "42")
    .putAdditionalQueryParam("secret_query_param", "42")
    .putAdditionalBodyProperty("secretProperty", JsonValue.from("42"))
    .build();
```

These can be accessed on the built object later using the `_additionalHeaders()`, `_additionalQueryParams()`, and `_additionalBodyProperties()` methods.

To set undocumented parameters on _nested_ headers, query params, or body classes, call the `putAdditionalProperty` method on the nested class:

```java
import com.browserbase.api.core.JsonValue;
import com.browserbase.api.models.sessions.SessionActParams;

SessionActParams params = SessionActParams.builder()
    .options(SessionActParams.Options.builder()
        .putAdditionalProperty("secretProperty", JsonValue.from("42"))
        .build())
    .build();
```

These properties can be accessed on the nested built object later using the `_additionalProperties()` method.

To set a documented parameter or property to an undocumented or not yet supported _value_, pass a [`JsonValue`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-core/src/main/kotlin/com/browserbase/api/core/Values.kt) object to its setter:

```java
import com.browserbase.api.core.JsonValue;
import com.browserbase.api.models.sessions.SessionActParams;

SessionActParams params = SessionActParams.builder()
    .input(JsonValue.from(42))
    .build();
```

The most straightforward way to create a [`JsonValue`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-core/src/main/kotlin/com/browserbase/api/core/Values.kt) is using its `from(...)` method:

```java
import com.browserbase.api.core.JsonValue;
import java.util.List;
import java.util.Map;

// Create primitive JSON values
JsonValue nullValue = JsonValue.from(null);
JsonValue booleanValue = JsonValue.from(true);
JsonValue numberValue = JsonValue.from(42);
JsonValue stringValue = JsonValue.from("Hello World!");

// Create a JSON array value equivalent to `["Hello", "World"]`
JsonValue arrayValue = JsonValue.from(List.of(
  "Hello", "World"
));

// Create a JSON object value equivalent to `{ "a": 1, "b": 2 }`
JsonValue objectValue = JsonValue.from(Map.of(
  "a", 1,
  "b", 2
));

// Create an arbitrarily nested JSON equivalent to:
// {
//   "a": [1, 2],
//   "b": [3, 4]
// }
JsonValue complexValue = JsonValue.from(Map.of(
  "a", List.of(
    1, 2
  ),
  "b", List.of(
    3, 4
  )
));
```

Normally a `Builder` class's `build` method will throw [`IllegalStateException`](https://docs.oracle.com/javase/8/docs/api/java/lang/IllegalStateException.html) if any required parameter or property is unset.

To forcibly omit a required parameter or property, pass [`JsonMissing`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-core/src/main/kotlin/com/browserbase/api/core/Values.kt):

```java
import com.browserbase.api.core.JsonMissing;
import com.browserbase.api.models.sessions.SessionActParams;

SessionActParams params = SessionActParams.builder()
    .input("Click the login button")
    .id(JsonMissing.of())
    .build();
```

### Response properties

To access undocumented response properties, call the `_additionalProperties()` method:

```java
import com.browserbase.api.core.JsonValue;
import java.util.Map;

Map<String, JsonValue> additionalProperties = client.sessions().act(params)._additionalProperties();
JsonValue secretPropertyValue = additionalProperties.get("secretProperty");

String result = secretPropertyValue.accept(new JsonValue.Visitor<>() {
    @Override
    public String visitNull() {
        return "It's null!";
    }

    @Override
    public String visitBoolean(boolean value) {
        return "It's a boolean!";
    }

    @Override
    public String visitNumber(Number value) {
        return "It's a number!";
    }

    // Other methods include `visitMissing`, `visitString`, `visitArray`, and `visitObject`
    // The default implementation of each unimplemented method delegates to `visitDefault`, which throws by default, but can also be overridden
});
```

To access a property's raw JSON value, which may be undocumented, call its `_` prefixed method:

```java
import com.browserbase.api.core.JsonField;
import com.browserbase.api.models.sessions.SessionActParams;
import java.util.Optional;

JsonField<SessionActParams.Input> input = client.sessions().act(params)._input();

if (input.isMissing()) {
  // The property is absent from the JSON response
} else if (input.isNull()) {
  // The property was set to literal null
} else {
  // Check if value was provided as a string
  // Other methods include `asNumber()`, `asBoolean()`, etc.
  Optional<String> jsonString = input.asString();

  // Try to deserialize into a custom type
  MyClass myObject = input.asUnknown().orElseThrow().convert(MyClass.class);
}
```

### Response validation

In rare cases, the API may return a response that doesn't match the expected type. For example, the SDK may expect a property to contain a `String`, but the API could return something else.

By default, the SDK will not throw an exception in this case. It will throw [`StagehandInvalidDataException`](https://github.com/browserbase/stagehand-java/blob/main/stagehand-java-core/src/main/kotlin/com/browserbase/api/errors/StagehandInvalidDataException.kt) only if you directly access the property.

If you would prefer to check that the response is completely well-typed upfront, then either call `validate()`:

```java
import com.browserbase.api.models.sessions.SessionActResponse;

SessionActResponse response = client.sessions().act(params).validate();
```

Or configure the method call to validate the response using the `responseValidation` method:

```java
import com.browserbase.api.models.sessions.SessionActResponse;

SessionActResponse response = client.sessions().act(
  params, RequestOptions.builder().responseValidation(true).build()
);
```

Or configure the default for all method calls at the client level:

```java
import com.browserbase.api.client.StagehandClient;
import com.browserbase.api.client.okhttp.StagehandOkHttpClient;

StagehandClient client = StagehandOkHttpClient.builder()
    .fromEnv()
    .responseValidation(true)
    .build();
```

## FAQ

### Why don't you use plain `enum` classes?

Java `enum` classes are not trivially [forwards compatible](https://www.stainless.com/blog/making-java-enums-forwards-compatible). Using them in the SDK could cause runtime exceptions if the API is updated to respond with a new enum value.

### Why do you represent fields using `JsonField<T>` instead of just plain `T`?

Using `JsonField<T>` enables a few features:

- Allowing usage of [undocumented API functionality](#undocumented-api-functionality)
- Lazily [validating the API response against the expected shape](#response-validation)
- Representing absent vs explicitly null values

### Why don't you use [`data` classes](https://kotlinlang.org/docs/data-classes.html)?

It is not [backwards compatible to add new fields to a data class](https://kotlinlang.org/docs/api-guidelines-backward-compatibility.html#avoid-using-data-classes-in-your-api) and we don't want to introduce a breaking change every time we add a field to a class.

### Why don't you use checked exceptions?

Checked exceptions are widely considered a mistake in the Java programming language. In fact, they were omitted from Kotlin for this reason.

Checked exceptions:

- Are verbose to handle
- Encourage error handling at the wrong level of abstraction, where nothing can be done about the error
- Are tedious to propagate due to the [function coloring problem](https://journal.stuffwithstuff.com/2015/02/01/what-color-is-your-function)
- Don't play well with lambdas (also due to the function coloring problem)

## Semantic versioning

This package generally follows [SemVer](https://semver.org/spec/v2.0.0.html) conventions, though certain backwards-incompatible changes may be released as minor versions:

1. Changes to library internals which are technically public but not intended or documented for external use. _(Please open a GitHub issue to let us know if you are relying on such internals.)_
2. Changes that we do not expect to impact the vast majority of users in practice.

We take backwards-compatibility seriously and work hard to ensure you can rely on a smooth upgrade experience.

We are keen for your feedback; please open an [issue](https://www.github.com/browserbase/stagehand-java/issues) with questions, bugs, or suggestions.

================================================
FILE: packages/docs/v3/sdk/python.mdx
================================================
---
title: "Python SDK"
description: "Official Stagehand SDK for Python"
---

<Note>
  This documentation is automatically synced from the [Python SDK GitHub repository](https://github.com/browserbase/stagehand-python).
</Note>

<Note>
  Migrating from the old v2 Python SDK? See our [migration guide here](/v3/migrations/python).
</Note>

## What is Stagehand?

Stagehand is a browser automation framework used to control web browsers with natural language and code. By combining the power of AI with the precision of code, Stagehand makes web automation flexible, maintainable, and actually reliable.

## Why Stagehand?

Most existing browser automation tools either require you to write low-level code in a framework like Selenium, Playwright, or Puppeteer, or use high-level agents that can be unpredictable in production. By letting developers choose what to write in code vs. natural language (and bridging the gap between the two) Stagehand is the natural choice for browser automations in production.

1. **Choose when to write code vs. natural language**: use AI when you want to navigate unfamiliar pages, and use code when you know exactly what you want to do.

2. **Go from AI-driven to repeatable workflows**: Stagehand lets you preview AI actions before running them, and also helps you easily cache repeatable actions to save time and tokens.

3. **Write once, run forever**: Stagehand's auto-caching combined with self-healing remembers previous actions, runs without LLM inference, and knows when to involve AI whenever the website changes and your automation breaks.

## Installation

```sh
uv pip install stagehand
```

For local development or when working from this repository, sync the dependency lockfile with `uv` (see the Local development section below) before running project scripts.

## Requirements

Python 3.9 or higher.

## Running the Example

A complete working example is available at [`examples/full_example.py`](https://github.com/browserbase/stagehand-python/blob/main/examples/full_example.py).

To run it, first export the required environment variables, then use Python:

```bash
export BROWSERBASE_API_KEY="your-bb-api-key"
export BROWSERBASE_PROJECT_ID="your-bb-project-uuid"
export MODEL_API_KEY="sk-proj-your-llm-api-key"

uv run python examples/full_example.py
```

## Local mode example

If you want to run Stagehand locally, use the local example (`examples/local_example.py`). It shows how to configure the client for `server="local"`.

Local mode runs Stagehand’s embedded server and launches a **local Chrome/Chromium** browser (it is **not bundled** with the Python wheel), so you must have Chrome installed on the machine running the example.

If Chrome is installed but Stagehand can’t find it, set `CHROME_PATH` to your browser executable (or pass `browser.launchOptions.executablePath` when starting the session).

Common Windows paths:
- `C:\Program Files\Google\Chrome\Application\chrome.exe`
- `C:\Program Files (x86)\Google\Chrome\Application\chrome.exe`

PowerShell:

```powershell
# optional if you don't already have Chrome installed
winget install -e --id Google.Chrome

# optional if Stagehand can't auto-detect Chrome
$env:CHROME_PATH="C:\Program Files\Google\Chrome\Application\chrome.exe"

uv run python examples/local_example.py
```

Bash (macOS/Linux):

```bash
uv pip install stagehand
uv run python examples/local_example.py
```

## Streaming logging example

See [`examples/logging_example.py`](https://github.com/browserbase/stagehand-python/blob/main/examples/logging_example.py) for a remote-only flow that streams `StreamEvent`s with `verbose=2`, `stream_response=True`, and `x_stream_response="true"` so you can watch the SDK’s logs as they arrive.

```bash
uv run python examples/logging_example.py
```

<details>
<summary><strong>Local development</strong></summary>

This repository relies on `uv` to install the sanctioned Python version and dependencies. After cloning, bootstrap the environment with:

```sh
./scripts/bootstrap
```
Once the environment is ready, execute repo scripts with `uv run`:

```sh
uv run python examples/full_example.py
```
</details>

## Usage

This example demonstrates the full Stagehand workflow: starting a session, navigating to a page, observing possible actions, acting on elements, extracting data, and running an autonomous agent.

```python
import asyncio

from stagehand import AsyncStagehand

async def main() -> None:
    # Create client using environment variables:
    # BROWSERBASE_API_KEY, BROWSERBASE_PROJECT_ID, MODEL_API_KEY
    client = AsyncStagehand()

    # Start a new browser session (returns a session helper bound to a session_id)
    session = await client.sessions.create(model_name="openai/gpt-5-nano")

    print(f"Session started: {session.id}")

    try:
        # Navigate to a webpage
        await session.navigate(
            url="https://news.ycombinator.com",
        )
        print("Navigated to Hacker News")

        # Observe to find possible actions on the page
        observe_response = await session.observe(
            instruction="find the link to view comments for the top post",
        )

        results = observe_response.data.result
        print(f"Found {len(results)} possible actions")
        if not results:
            return

        # Take the first action returned by Observe and pass it to Act
        action = results[0].to_dict(exclude_none=True)
        print("Acting on:", action.get("description"))

        act_response = await session.act(input=action)
        print("Act completed:", act_response.data.result.message)

        # Extract structured data from the page using a JSON schema
        extract_response = await session.extract(
            instruction="extract the text of the top comment on this page",
            schema={
                "type": "object",
                "properties": {
                    "commentText": {"type": "string"},
                    "author": {"type": "string"},
                },
                "required": ["commentText"],
            },
        )

        extracted = extract_response.data.result
        author = extracted.get("author", "unknown") if isinstance(extracted, dict) else "unknown"
        print("Extracted author:", author)

        # Run an autonomous agent to accomplish a complex task
        execute_response = await session.execute(
            execute_options={
                "instruction": f"Find any personal website, GitHub, or LinkedIn profile for the Hacker News user '{author}'.",
                "max_steps": 10,
            },
            agent_config={"model": "openai/gpt-5-nano"},
            timeout=300.0,
        )

        print("Agent completed:", execute_response.data.result.message)
        print("Agent success:", execute_response.data.result.success)
    finally:
        # End the browser session to clean up resources
        await session.end()
        print("Session ended")

if __name__ == "__main__":
    asyncio.run(main())
```

## Client configuration

Configure the client using environment variables:

```python
from stagehand import AsyncStagehand

client = AsyncStagehand()
```

Or manually:

```python
from stagehand import AsyncStagehand

client = AsyncStagehand(
    browserbase_api_key="My Browserbase API Key",
    browserbase_project_id="My Browserbase Project ID",
    model_api_key="My Model API Key",
)
```

Or using a combination of the two approaches:

```python
from stagehand import AsyncStagehand

client = AsyncStagehand(
    # Configures using environment variables
    browserbase_api_key="My Browserbase API Key",  # override just this one
)
```

See this table for the available options:

| Keyword argument         | Environment variable     | Required | Default value                             |
| ------------------------ | ------------------------ | -------- | ----------------------------------------- |
| `browserbase_api_key`    | `BROWSERBASE_API_KEY`    | true     | -                                         |
| `browserbase_project_id` | `BROWSERBASE_PROJECT_ID` | true     | -                                         |
| `model_api_key`          | `MODEL_API_KEY`          | true     | -                                         |
| `base_url`               | `STAGEHAND_BASE_URL`     | false    | `"https://api.stagehand.browserbase.com"` |

Keyword arguments take precedence over environment variables.

<Tip>
  Don't create more than one client in the same application. Each client has a connection pool, which is more efficient to share between requests.
</Tip>

### Modifying configuration

To temporarily use a modified client configuration while reusing the same connection pool, call `with_options()` on any client:

```python
client_with_options = client.with_options(model_api_key="sk-your-llm-api-key-here", max_retries=42)
```

The `with_options()` method does not affect the original client.

## Requests and responses

To send a request to the Stagehand API, call the corresponding client method using keyword arguments.

Nested request parameters are dictionaries typed using [`TypedDict`](https://docs.python.org/3/library/typing.html#typing.TypedDict). Responses are [Pydantic models](https://docs.pydantic.dev) which also provide helper methods like:

- Serializing back into JSON: `model.to_json()`
- Converting to a dictionary: `model.to_dict()`

## Immutability

Response objects are Pydantic models. If you want to build a modified copy, prefer `model.model_copy(update={...})` (Pydantic v2) rather than mutating in place.

## Asynchronous execution

This SDK recommends using `AsyncStagehand` and `await`ing each API call:

```python
import asyncio
from stagehand import AsyncStagehand

async def main() -> None:
    client = AsyncStagehand()
    session = await client.sessions.create(model_name="openai/gpt-5-nano")
    response = await session.act(input="click the first link on the page")
    print(response.data)

asyncio.run(main())
```

### With aiohttp

By default, the async client uses `httpx` for HTTP requests. For improved concurrency performance you may also use `aiohttp` as the HTTP backend.

Install `aiohttp`:

```sh
uv pip install "stagehand[aiohttp]"
```

Then instantiate the client with `http_client=DefaultAioHttpClient()`:

```python
import asyncio
from stagehand import AsyncStagehand, DefaultAioHttpClient

async def main() -> None:
    async with AsyncStagehand(http_client=DefaultAioHttpClient()) as client:
        session = await client.sessions.create(model_name="openai/gpt-5-nano")
        response = await session.act(input="click the first link on the page")
        print(response.data)

asyncio.run(main())
```

## Streaming responses

We provide support for streaming responses using Server-Sent Events (SSE).

To enable SSE streaming, you must:

1. Ask the server to stream by setting `x_stream_response="true"` (header), and
2. Tell the client to parse an SSE stream by setting `stream_response=True`.

```python
import asyncio

from stagehand import AsyncStagehand

async def main() -> None:
    async with AsyncStagehand() as client:
        session = await client.sessions.create(model_name="openai/gpt-5-nano")

        stream = await client.sessions.act(
            id=session.id,
            input="click the first link on the page",
            stream_response=True,
            x_stream_response="true",
        )
        async for event in stream:
            # event is a StreamEvent (type: "system" | "log")
            print(event.type, event.data)

asyncio.run(main())
```

## Raw responses

The SDK defines methods that deserialize responses into Pydantic models. However, these methods don't provide access to response headers, status code, or the raw response body.

To access this data, prefix any HTTP method call on a client or service with `with_raw_response`:

```python
import asyncio

from stagehand import AsyncStagehand

async def main() -> None:
    async with AsyncStagehand() as client:
        response = await client.sessions.with_raw_response.start(model_name="openai/gpt-5-nano")
        print(response.headers.get("X-My-Header"))

        session = response.parse()  # get the object that `sessions.start()` would have returned
        print(session.data)

asyncio.run(main())
```

### `.with_streaming_response`

The `with_raw_response` interface eagerly reads the full response body when you make the request.

To stream the response body (not SSE), use `with_streaming_response` instead. It requires a context manager and only reads the response body once you call `.read()`, `.text()`, `.json()`, `.iter_bytes()`, `.iter_text()`, `.iter_lines()` or `.parse()`.

```python
import asyncio

from stagehand import AsyncStagehand

async def main() -> None:
    async with AsyncStagehand() as client:
        async with client.sessions.with_streaming_response.start(model_name="openai/gpt-5-nano") as response:
            print(response.headers.get("X-My-Header"))
            async for line in response.iter_lines():
                print(line)

asyncio.run(main())
```

## Error handling

When the library is unable to connect to the API (for example, due to network connection problems or a timeout), a subclass of `stagehand.APIConnectionError` is raised.

When the API returns a non-success status code (that is, 4xx or 5xx response), a subclass of `stagehand.APIStatusError` is raised, containing `status_code` and `response` properties.

All errors inherit from `stagehand.APIError`.

```python
import asyncio

import stagehand
from stagehand import AsyncStagehand

async def main() -> None:
    async with AsyncStagehand() as client:
        try:
            await client.sessions.start(model_name="openai/gpt-5-nano")
        except stagehand.APIConnectionError as e:
            print("The server could not be reached")
            print(e.__cause__)  # an underlying Exception, likely raised within httpx.
        except stagehand.RateLimitError:
            print("A 429 status code was received; we should back off a bit.")
        except stagehand.APIStatusError as e:
            print("A non-200-range status code was received")
            print(e.status_code)
            print(e.response)

asyncio.run(main())
```

Error codes are as follows:

| Status Code | Error Type                 |
| ----------- | -------------------------- |
| 400         | `BadRequestError`          |
| 401         | `AuthenticationError`      |
| 403         | `PermissionDeniedError`    |
| 404         | `NotFoundError`            |
| 422         | `UnprocessableEntityError` |
| 429         | `RateLimitError`           |
| >=500       | `InternalServerError`      |
| N/A         | `APIConnectionError`       |

### Retries

Certain errors are automatically retried 2 times by default, with a short exponential backoff. Connection errors (for example, due to a network connectivity problem), 408 Request Timeout, 409 Conflict, 429 Rate Limit, and >=500 Internal errors are all retried by default.

You can use the `max_retries` option to configure or disable retry settings:

```python
import asyncio

from stagehand import AsyncStagehand

async def main() -> None:
    async with AsyncStagehand(max_retries=0) as client:
        # Or, configure per-request:
        await client.with_options(max_retries=5).sessions.start(model_name="openai/gpt-5-nano")

asyncio.run(main())
```

### Timeouts

By default requests time out after 1 minute. You can configure this with a `timeout` option, which accepts a float or an [`httpx.Timeout`](https://www.python-httpx.org/advanced/timeouts/#fine-tuning-the-configuration) object.

On timeout, an `APITimeoutError` is raised. Note that requests that time out are [retried twice by default](#retries).

## Logging

The SDK uses the standard library [`logging`](https://docs.python.org/3/library/logging.html) module.

Enable logging by setting the `STAGEHAND_LOG` environment variable to `info`:

```sh
export STAGEHAND_LOG=info
```

Or to `debug` for more verbose logging:

```sh
export STAGEHAND_LOG=debug
```

## Undocumented API functionality

This library is typed for convenient access to the documented API, but you can still access undocumented endpoints, request params, or response properties when needed.

### Undocumented endpoints

To make requests to undocumented endpoints, use `client.get`, `client.post`, and other HTTP verbs. Client options (such as retries) are respected.

```python
import httpx
from stagehand import AsyncStagehand

import asyncio

async def main() -> None:
    async with AsyncStagehand() as client:
        response = await client.post("/foo", cast_to=httpx.Response, body={"my_param": True})
        print(response.headers.get("x-foo"))

asyncio.run(main())
```

### Undocumented request params

To send extra params that aren't available as keyword args, use `extra_query`, `extra_body`, and `extra_headers`.

### Undocumented response properties

To access undocumented response properties, you can access extra fields like `response.unknown_prop`. You can also get all extra fields as a dict with [`response.model_extra`](https://docs.pydantic.dev/latest/api/base_model/#pydantic.BaseModel.model_extra).

## Response validation

In rare cases, the API may return a response that doesn't match the expected type.

By default, the SDK is permissive and will only raise an error if you later try to use the invalid data.

If you would prefer to validate responses upfront, instantiate the client with `_strict_response_validation=True`. An `APIResponseValidationError` will be raised if the API responds with invalid data for the expected schema.

```python
import asyncio

from stagehand import APIResponseValidationError, AsyncStagehand

try:
    async def main() -> None:
        async with AsyncStagehand(_strict_response_validation=True) as client:
            await client.sessions.start(model_name="openai/gpt-5-nano")

    asyncio.run(main())
except APIResponseValidationError as e:
    print("Response failed schema validation:", e)
```

## FAQ

### Why are some values typed as `Literal[...]` instead of Python `Enum`s?

Using `Literal[...]` types is forwards compatible: the API can introduce new enum values without breaking older SDKs at runtime.

### How can I tell whether `None` means `null` or “missing” in a response?

In an API response, a field may be explicitly `null`, or missing entirely; in either case its value is `None` in this library. You can differentiate the two cases with `.model_fields_set`:

```python
if response.my_field is None:
    if "my_field" not in response.model_fields_set:
        print('Got json like {}, without a "my_field" key present at all.')
    else:
        print('Got json like {"my_field": null}.')
```

## Semantic versioning

This package generally follows [SemVer](https://semver.org/spec/v2.0.0.html) conventions, though certain backwards-incompatible changes may be released as minor versions:

1. Changes that only affect static types, without breaking runtime behavior.
2. Changes to library internals which are technically public but not intended or documented for external use. _(Please open a GitHub issue to let us know if you are relying on such internals.)_
3. Changes that we do not expect to impact the vast majority of users in practice.

We take backwards-compatibility seriously and work hard to ensure you can rely on a smooth upgrade experience.

We are keen for your feedback; please open an [issue](https://www.github.com/browserbase/stagehand-python/issues) with questions, bugs, or suggestions.

### Determining the installed version

If you've upgraded to the latest version but aren't seeing any new features you were expecting, then your Python environment is likely still using an older version.

You can determine the version that is being used at runtime with:

```python
import stagehand

print(stagehand.__version__)
```

================================================
FILE: packages/docs/v3/sdk/ruby.mdx
================================================
---
title: "Ruby SDK"
description: "Official Stagehand SDK for Ruby"
---

<Note>
  This documentation is automatically synced from the [Ruby SDK GitHub repository](https://github.com/browserbase/stagehand-ruby).
</Note>

## What is Stagehand?

Stagehand is a browser automation framework used to control web browsers with natural language and code. By combining the power of AI with the precision of code, Stagehand makes web automation flexible, maintainable, and actually reliable.

## Why Stagehand?

Most existing browser automation tools either require you to write low-level code in a framework like Selenium, Playwright, or Puppeteer, or use high-level agents that can be unpredictable in production. By letting developers choose what to write in code vs. natural language (and bridging the gap between the two), Stagehand is the natural choice for browser automations in production.

1. **Choose when to write code vs. natural language**: use AI when you want to navigate unfamiliar pages, and use code when you know exactly what you want to do.

2. **Go from AI-driven to repeatable workflows**: Stagehand lets you preview AI actions before running them, and also helps you easily cache repeatable actions to save time and tokens.

3. **Write once, run forever**: Stagehand's auto-caching combined with self-healing remembers previous actions, runs without LLM inference, and knows when to involve AI whenever the website changes and your automation breaks.

## Installation

To use this gem, install via Bundler by adding the following to your application's `Gemfile`:

```ruby
gem "stagehand", "~> 0.6.2"
```

## Usage

```ruby
require "bundler/setup"
require "stagehand"

# Create a new Stagehand client with your credentials
client = Stagehand::Client.new(
  browserbase_api_key: ENV["BROWSERBASE_API_KEY"],      # defaults to ENV["BROWSERBASE_API_KEY"]
  browserbase_project_id: ENV["BROWSERBASE_PROJECT_ID"], # defaults to ENV["BROWSERBASE_PROJECT_ID"]
  model_api_key: ENV["MODEL_API_KEY"]                   # defaults to ENV["MODEL_API_KEY"]
)

# Start a new browser session
start_response = client.sessions.start(
  model_name: "openai/gpt-5-nano"
)
puts "Session started: #{start_response.data.session_id}"

session_id = start_response.data.session_id

# Navigate to a webpage
client.sessions.navigate(
  session_id,
  url: "https://news.ycombinator.com"
)
puts "Navigated to Hacker News"

# Use Observe to find possible actions on the page
observe_response = client.sessions.observe(
  session_id,
  instruction: "find the link to view comments for the top post"
)

actions = observe_response.data.result
puts "Found #{actions.length} possible actions"

# Take the first action returned by Observe
action = actions.first
puts "Acting on: #{action.description}"

# Pass the structured action to Act
# Convert the observe result to a hash and ensure method is set to "click"
act_response = client.sessions.act(
  session_id,
  input: action.to_h.merge(method: "click")
)
puts "Act completed: #{act_response.data.result[:message]}"

# Extract data from the page
# We're now on the comments page, so extract the top comment text
extract_response = client.sessions.extract(
  session_id,
  instruction: "extract the text of the top comment on this page",
  schema: {
    type: "object",
    properties: {
      comment_text: {
        type: "string",
        description: "The text content of the top comment"
      },
      author: {
        type: "string",
        description: "The username of the comment author"
      }
    },
    required: ["comment_text"]
  }
)
puts "Extracted data: #{extract_response.data.result}"

# Get the author from the extracted data
extracted_data = extract_response.data.result
author = extracted_data[:author]
puts "Looking up profile for author: #{author}"

# Use the Agent to find the author's profile
# Execute runs an autonomous agent that can navigate and interact with pages
execute_response = client.sessions.execute(
  session_id,
  execute_options: {
    instruction: "Find any personal website, GitHub, LinkedIn, or other best profile URL for the Hacker News user '#{author}'. " \
                 "Click on their username to go to their profile page and look for any links they have shared.",
    max_steps: 15
  },
  agent_config: {
    model: Stagehand::ModelConfig::ModelConfigObject.new(
      model_name: "openai/gpt-5-nano",
      api_key: ENV["MODEL_API_KEY"]
    ),
    cua: false
  }
)
puts "Agent completed: #{execute_response.data.result[:message]}"
puts "Agent success: #{execute_response.data.result[:success]}"
puts "Agent actions taken: #{execute_response.data.result[:actions]&.length || 0}"

# End the session to cleanup browser resources
client.sessions.end_(session_id)
puts "Session ended"
```

### Running the Example

Set the required environment variables and run the example script:

```bash
# Set your credentials
export BROWSERBASE_API_KEY="your-browserbase-api-key"
export BROWSERBASE_PROJECT_ID="your-browserbase-project-id"
export MODEL_API_KEY="your-openai-api-key"

# Install dependencies and run
bundle install
bundle exec ruby examples/basic.rb
```

### Streaming

We provide support for streaming responses using Server-Sent Events (SSE).

```ruby
stream = stagehand.sessions.act_streaming(
  "00000000-your-session-id-000000000000",
  input: "click the first link on the page"
)

stream.each do |session|
  puts(session.data)
end
```

### Handling errors

When the library is unable to connect to the API, or if the API returns a non-success status code (i.e., 4xx or 5xx response), a subclass of `Stagehand::Errors::APIError` will be thrown:

```ruby
begin
  session = stagehand.sessions.start(model_name: "openai/gpt-5-nano")
rescue Stagehand::Errors::APIConnectionError => e
  puts("The server could not be reached")
  puts(e.cause)  # an underlying Exception, likely raised within `net/http`
rescue Stagehand::Errors::RateLimitError => e
  puts("A 429 status code was received; we should back off a bit.")
rescue Stagehand::Errors::APIStatusError => e
  puts("Another non-200-range status code was received")
  puts(e.status)
end
```

Error codes are as follows:

| Cause            | Error Type                 |
| ---------------- | -------------------------- |
| HTTP 400         | `BadRequestError`          |
| HTTP 401         | `AuthenticationError`      |
| HTTP 403         | `PermissionDeniedError`    |
| HTTP 404         | `NotFoundError`            |
| HTTP 409         | `ConflictError`            |
| HTTP 422         | `UnprocessableEntityError` |
| HTTP 429         | `RateLimitError`           |
| HTTP >= 500      | `InternalServerError`      |
| Other HTTP error | `APIStatusError`           |
| Timeout          | `APITimeoutError`          |
| Network error    | `APIConnectionError`       |

### Retries

Certain errors will be automatically retried 2 times by default, with a short exponential backoff.

Connection errors (for example, due to a network connectivity problem), 408 Request Timeout, 409 Conflict, 429 Rate Limit, >=500 Internal errors, and timeouts will all be retried by default.

You can use the `max_retries` option to configure or disable this:

```ruby
# Configure the default for all requests:
stagehand = Stagehand::Client.new(
  max_retries: 0 # default is 2
)

# Or, configure per-request:
stagehand.sessions.start(model_name: "openai/gpt-5-nano", request_options: {max_retries: 5})
```

### Timeouts

By default, requests will time out after 60 seconds. You can use the `timeout` option to configure or disable this:

```ruby
# Configure the default for all requests:
stagehand = Stagehand::Client.new(
  timeout: nil # default is 60
)

# Or, configure per-request:
stagehand.sessions.start(model_name: "openai/gpt-5-nano", request_options: {timeout: 5})
```

On timeout, `Stagehand::Errors::APITimeoutError` is raised.

Note that requests that time out are retried by default.

## Advanced concepts

### BaseModel

All parameter and response objects inherit from `Stagehand::Internal::Type::BaseModel`, which provides several conveniences, including:

1. All fields, including unknown ones, are accessible with `obj[:prop]` syntax, and can be destructured with `obj => {prop: prop}` or pattern-matching syntax.

2. Structural equivalence for equality; if two API calls return the same values, comparing the responses with `==` will return true.

3. Both instances and the classes themselves can be pretty-printed.

4. Helpers such as `#to_h`, `#deep_to_h`, `#to_json`, and `#to_yaml`.

### Making custom or undocumented requests

#### Undocumented properties

You can send undocumented parameters to any endpoint, and read undocumented response properties, like so:

Note: `extra_` parameters with the same name override the documented parameters.

```ruby
response =
  stagehand.sessions.start(
    model_name: "openai/gpt-5-nano",
    request_options: {
      extra_query: {my_query_parameter: value},
      extra_body: {my_body_parameter: value},
      extra_headers: {"my-header": value}
    }
  )

puts(response[:my_undocumented_property])
```

#### Undocumented request params

If you want to explicitly send an extra param, you can do so with the `extra_query`, `extra_body`, and `extra_headers` under the `request_options:` parameter when making a request, as seen in the examples above.

#### Undocumented endpoints

To make requests to undocumented endpoints while retaining the benefit of auth, retries, and so on, you can make requests using `client.request`, like so:

```ruby
response = client.request(
  method: :post,
  path: '/undocumented/endpoint',
  query: {"dog": "woof"},
  headers: {"useful-header": "interesting-value"},
  body: {"hello": "world"}
)
```

### Concurrency & connection pooling

The `Stagehand::Client` instances are threadsafe, but are only fork-safe when there are no in-flight HTTP requests.

Each instance of `Stagehand::Client` has its own HTTP connection pool with a default size of 99. As such, we recommend instantiating the client once per application in most settings.

When all available connections from the pool are checked out, requests wait for a new connection to become available, with queue time counting towards the request timeout.

Unless otherwise specified, other classes in the SDK do not have locks protecting their underlying data structure.

## Sorbet

This library provides comprehensive [RBI](https://sorbet.org/docs/rbi) definitions, and has no dependency on sorbet-runtime.

You can provide typesafe request parameters like so:

```ruby
stagehand.sessions.act("00000000-your-session-id-000000000000", input: "click the first link on the page")
```

Or, equivalently:

```ruby
# Hashes work, but are not typesafe:
stagehand.sessions.act("00000000-your-session-id-000000000000", input: "click the first link on the page")

# You can also splat a full Params class:
params = Stagehand::SessionActParams.new(input: "click the first link on the page")
stagehand.sessions.act("00000000-your-session-id-000000000000", **params)
```

### Enums

Since this library does not depend on `sorbet-runtime`, it cannot provide [`T::Enum`](https://sorbet.org/docs/tenum) instances. Instead, we provide "tagged symbols", which are always primitives at runtime:

```ruby
# :typescript
puts(Stagehand::SessionActParams::XLanguage::TYPESCRIPT)

# Revealed type: `T.all(Stagehand::SessionActParams::XLanguage, Symbol)`
T.reveal_type(Stagehand::SessionActParams::XLanguage::TYPESCRIPT)
```

Enum parameters have a "relaxed" type, so you can either pass in enum constants or their literal value:

```ruby
# Using the enum constants preserves the tagged type information:
stagehand.sessions.act(
  x_language: Stagehand::SessionActParams::XLanguage::TYPESCRIPT,
  # …
)

# Literal values are also permissible:
stagehand.sessions.act(
  x_language: :typescript,
  # …
)
```

## Versioning

This package follows [SemVer](https://semver.org/spec/v2.0.0.html) conventions. As the library is in initial development and has a major version of `0`, APIs may change at any time.

This package considers improvements to the (non-runtime) `*.rbi` and `*.rbs` type definitions to be non-breaking changes.

## Requirements

Ruby 3.2.0 or higher.

## Contributing

See [the contributing documentation](https://github.com/browserbase/stagehand-ruby/tree/main/CONTRIBUTING.md).

================================================
FILE: packages/evals/CHANGELOG.md
================================================
# @browserbasehq/stagehand-evals

## 1.1.9

### Patch Changes

- Updated dependencies [[`505e8c6`](https://github.com/browserbase/stagehand/commit/505e8c6736f3706328dbc8df670c49a018058388), [`2f43ffa`](https://github.com/browserbase/stagehand/commit/2f43ffac11778152d17e4c44405770cc32c3ec8c), [`63ee247`](https://github.com/browserbase/stagehand/commit/63ee247ac6bf2992046d4f6b2759f46b15643e36), [`7dc35f5`](https://github.com/browserbase/stagehand/commit/7dc35f5e25689e6518d68b25ef71536d2781c8aa), [`335cf47`](https://github.com/browserbase/stagehand/commit/335cf4730e73bce33e92331d04bda4b0fd42685d), [`6ba0a1d`](https://github.com/browserbase/stagehand/commit/6ba0a1db7fc2d5d5a2f8927b1417d8f1d15eda10), [`4ff3bb8`](https://github.com/browserbase/stagehand/commit/4ff3bb831a6ef6e2d57148e7afb68ea8d23e395d), [`c27054b`](https://github.com/browserbase/stagehand/commit/c27054bbd0508431ade91d655f89efc87bbf5867), [`2abf5b9`](https://github.com/browserbase/stagehand/commit/2abf5b90f1e2bb1442509ef3a686b6128c9cdcf6), [`7817fcc`](https://github.com/browserbase/stagehand/commit/7817fcc315eee4455ce04567cf56c9ec801caf0b), [`7390508`](https://github.com/browserbase/stagehand/commit/73905088c5ed5923d276da9cce2efd0a0a3a46eb), [`611f43a`](https://github.com/browserbase/stagehand/commit/611f43ac8d4c580216d55d2b217c14a9a9c11013), [`521a10e`](https://github.com/browserbase/stagehand/commit/521a10e3698fc5631e219947bc90dad0f8bddaa8), [`2402a3c`](https://github.com/browserbase/stagehand/commit/2402a3c4d50270391b3e6440f4385cdcf5e1eb64)]:
  - @browserbasehq/stagehand@3.2.0

## 1.1.8

### Patch Changes

- Updated dependencies [[`7584f3e`](https://github.com/browserbase/stagehand/commit/7584f3e92e60a557d2b3e0e0d2a2af04c3527523), [`1e1c9c1`](https://github.com/browserbase/stagehand/commit/1e1c9c15773e49d5c3cd36021dbc1d23495c1bce), [`6bef890`](https://github.com/browserbase/stagehand/commit/6bef89090ebd231e77d8092b2c32a0f06303d5a9), [`ffd4b33`](https://github.com/browserbase/stagehand/commit/ffd4b335a873d0f4dcd76ea22d44f47919bf8e49), [`677bff5`](https://github.com/browserbase/stagehand/commit/677bff5834c879a2d95f7dbff918b8e1510516b3), [`65ff464`](https://github.com/browserbase/stagehand/commit/65ff464bc13388eb109eba0a2cf533c1cc202854), [`101bcf2`](https://github.com/browserbase/stagehand/commit/101bcf2da8b527fd6ace6aa291ada5d0f2d90344), [`0a94301`](https://github.com/browserbase/stagehand/commit/0a94301caa991d1aa4cdade6e28a065b1aefb3e2), [`b27c04d`](https://github.com/browserbase/stagehand/commit/b27c04d278c290364347acd0c354a878ea9b7c2d), [`afbd08b`](https://github.com/browserbase/stagehand/commit/afbd08bb6367a9c9f65f67e453667987e4659918), [`e3db9aa`](https://github.com/browserbase/stagehand/commit/e3db9aa863f44270792215801fe6e3a02a1321aa), [`0e8d569`](https://github.com/browserbase/stagehand/commit/0e8d5695f662040f7384e64f46301152802e3c62), [`ff0f979`](https://github.com/browserbase/stagehand/commit/ff0f9795f3b2c1cf4f2610a80ebcb3341a24f987), [`2d89d2b`](https://github.com/browserbase/stagehand/commit/2d89d2b35ce812431956b28e0c8b52d32ddc7a27), [`aac9a19`](https://github.com/browserbase/stagehand/commit/aac9a19bdfbe62e4508631337ab0bfbcf8ae62b2), [`06de50f`](https://github.com/browserbase/stagehand/commit/06de50ff377fd31f1b0fcf79adb996d04562d2c0), [`aa4d981`](https://github.com/browserbase/stagehand/commit/aa4d981e440bdd0e3d3f42ccc310d5958aa25cc6), [`18b1e3b`](https://github.com/browserbase/stagehand/commit/18b1e3bd2b16b721845d52fcf1a45c6158e2403f), [`957d82b`](https://github.com/browserbase/stagehand/commit/957d82b9845b4413b123539e81a2e4a490e74a8a), 
[`b65756e`](https://github.com/browserbase/stagehand/commit/b65756e9e85643055446aa4a51956f7d6627c89f), [`22e371a`](https://github.com/browserbase/stagehand/commit/22e371ae4c25deb6350328fe02832bf2b2197b94), [`d29b91f`](https://github.com/browserbase/stagehand/commit/d29b91fa506636ca36f724fcf106320de54ec3f3), [`7b4f817`](https://github.com/browserbase/stagehand/commit/7b4f817cafb9829ac81c4b5890c318c7f9521fe4), [`176d420`](https://github.com/browserbase/stagehand/commit/176d42002cc0a2c7d13b4c0ffbbd56b70fdc49e8), [`3f9ca4d`](https://github.com/browserbase/stagehand/commit/3f9ca4d9acc109101357378d29cf969168991608), [`8a3c066`](https://github.com/browserbase/stagehand/commit/8a3c06600a9ba98485db7e9ed5c3cc43ea180334), [`49ead1e`](https://github.com/browserbase/stagehand/commit/49ead1e1e8678a8da0f87ad2042491dacc6b01d7), [`3673369`](https://github.com/browserbase/stagehand/commit/36733691f90c15386cf2a7b47d04ef429b7195ae), [`c465e87`](https://github.com/browserbase/stagehand/commit/c465e87ab41942435132c76338518fb3fa8e7896), [`ae533e4`](https://github.com/browserbase/stagehand/commit/ae533e40195181b53833f8055b1259fb360a927b), [`ea33052`](https://github.com/browserbase/stagehand/commit/ea330520a325583b71b87d85beb740df4bdb9b2d), [`5764ede`](https://github.com/browserbase/stagehand/commit/5764edee7aab00ef1aafafb68fc56eb26c0a70b2), [`f09b184`](https://github.com/browserbase/stagehand/commit/f09b184cc5e774736280ae8c94ba3f4f13adda80), [`a7d29de`](https://github.com/browserbase/stagehand/commit/a7d29decee0f7d12e2437267b9eef1795d3b4e3a), [`d334399`](https://github.com/browserbase/stagehand/commit/d3343990041bf9cd5613569840afb0c17131e33c), [`44416da`](https://github.com/browserbase/stagehand/commit/44416da7ff33301bb32d3811e6c3be8782a7d168), [`bdd8b4e`](https://github.com/browserbase/stagehand/commit/bdd8b4ee3c697a02728375510ab7fae764990576)]:
  - @browserbasehq/stagehand@3.1.0

## 1.1.7

### Patch Changes

- Updated dependencies [[`40ce5cc`](https://github.com/browserbase/stagehand/commit/40ce5cc83ec758f4e8c37132a7f4ac8eeea7ca34), [`5506f41`](https://github.com/browserbase/stagehand/commit/5506f416d2609d112b553263984e21d7a30e32b1), [`84c05ca`](https://github.com/browserbase/stagehand/commit/84c05ca8de4587181faf128e5c7464fd960caacc), [`692ffa0`](https://github.com/browserbase/stagehand/commit/692ffa0346ad3d121686aba503c0a22844293efa), [`1ef8901`](https://github.com/browserbase/stagehand/commit/1ef8901e1314e90f43b36be20192e652d3b5598f), [`72ac775`](https://github.com/browserbase/stagehand/commit/72ac775a831d6f0f376ceda4426525f93cc21452), [`3d5af07`](https://github.com/browserbase/stagehand/commit/3d5af07f66d6d26d1f5ac4bd9be7183c3381dd92), [`40e1d80`](https://github.com/browserbase/stagehand/commit/40e1d80776b9216422a25a81070ccb3105e56ec2), [`56c0d24`](https://github.com/browserbase/stagehand/commit/56c0d244f9b2431218bfa832ddfc0587930ae038), [`16d72fb`](https://github.com/browserbase/stagehand/commit/16d72fb4c4081dd33bf45605d75c27644ea4c00e), [`088c4cc`](https://github.com/browserbase/stagehand/commit/088c4cc31dc924bb232a9d5a09ab42cd961c2d36), [`4276f4a`](https://github.com/browserbase/stagehand/commit/4276f4abc8bbde215faac6c0321bf243484c376b), [`6005786`](https://github.com/browserbase/stagehand/commit/600578637e65f6fd18b0cdb322b9e0b857708b2f), [`6fbf5fc`](https://github.com/browserbase/stagehand/commit/6fbf5fc811e5e5d9d22f10c5309fbd336892263a), [`704cf18`](https://github.com/browserbase/stagehand/commit/704cf18cb2bdd187ba06c35f05ccb47317a7668c), [`091296e`](https://github.com/browserbase/stagehand/commit/091296e438bb2374c8bb10ef6c08283978145ebf), [`e56c6eb`](https://github.com/browserbase/stagehand/commit/e56c6eb139bf3aad37e98b16626fff13a6c671d0), [`2cb78d0`](https://github.com/browserbase/stagehand/commit/2cb78d0f5ddef9f7337a9a2fe3137f1421df700a), [`5dad639`](https://github.com/browserbase/stagehand/commit/5dad63938f08d968d434bb1ee2804f1e54fb836a), 
[`b7c2571`](https://github.com/browserbase/stagehand/commit/b7c2571ad4ac563f3ca0518e1f29a40da93e33bc), [`4c69117`](https://github.com/browserbase/stagehand/commit/4c6911748953199dc9aad3eabe98bcf325f871e4)]:
  - @browserbasehq/stagehand@3.0.8

## 1.1.6

### Patch Changes

- [#1373](https://github.com/browserbase/stagehand/pull/1373) [`cadd192`](https://github.com/browserbase/stagehand/commit/cadd192066c8aa5d19bb4d5daa630ed5981b5d7e) Thanks [@tkattkat](https://github.com/tkattkat)! - Update screenshot collector in agent evals cli

- Updated dependencies [[`0f3991e`](https://github.com/browserbase/stagehand/commit/0f3991eedc0aaff72ef718dda3ddb0839cf4a464), [`e0e22e0`](https://github.com/browserbase/stagehand/commit/e0e22e06bc752a8ffde30f3dbfa58d91e24e6c09), [`f261051`](https://github.com/browserbase/stagehand/commit/f2610517d74774374de9ee93191e663439ef55e5), [`e021674`](https://github.com/browserbase/stagehand/commit/e021674f9641c1c5f9d0c1817c3fdf599eea124d), [`6a5496f`](https://github.com/browserbase/stagehand/commit/6a5496f17dbb716be1ee1aaa4e5ba9d8c723b30b), [`fea1700`](https://github.com/browserbase/stagehand/commit/fea1700552af3319052f463685752501c8e71de3), [`5b288d9`](https://github.com/browserbase/stagehand/commit/5b288d9ac37406ff22460ac8050bea26b87a378e), [`e822f5a`](https://github.com/browserbase/stagehand/commit/e822f5a8898df9eb48ca32c321025f0c74b638f0), [`638efc7`](https://github.com/browserbase/stagehand/commit/638efc7fea401bc43dd05dceedf4c13a3495a728), [`a890f16`](https://github.com/browserbase/stagehand/commit/a890f16fa3a752f308f858e5ab9c9a0faf6b3b34), [`934f492`](https://github.com/browserbase/stagehand/commit/934f492ec587bef81f0ce75b45a35b44ab545712), [`bd2db92`](https://github.com/browserbase/stagehand/commit/bd2db925f66a826d61d58be1611d55646cbdb560), [`51e0170`](https://github.com/browserbase/stagehand/commit/51e01709ce1c947c1947b4e2cb0b1f4f97b77182), [`05f5580`](https://github.com/browserbase/stagehand/commit/05f5580937c3c157550e3c25ae6671f44f562211), [`f56a9c2`](https://github.com/browserbase/stagehand/commit/f56a9c296d4ddce25a405358c66837f8ce4d679f), [`b40ae11`](https://github.com/browserbase/stagehand/commit/b40ae11391af49c3581fce27faa1b7483fc4a169), [`0d2b398`](https://github.com/browserbase/stagehand/commit/0d2b398cd40b32a9ecaf28ede70853036b7c91bd), [`cd01f29`](https://github.com/browserbase/stagehand/commit/cd01f290578eac703521f801ba3712f5332918f3), [`a734fca`](https://github.com/browserbase/stagehand/commit/a734fca0b4573753767d3ebc48ec414baf4f23e1), 
[`b342acf`](https://github.com/browserbase/stagehand/commit/b342acfaae058127fb57664644c5fd965db02bf2), [`2987cd1`](https://github.com/browserbase/stagehand/commit/2987cd1e5ffabefa9411936609635d4a638faed5), [`dfab1d5`](https://github.com/browserbase/stagehand/commit/dfab1d566299c8c5a63f20565a6da07dc8f61ccd), [`4d71162`](https://github.com/browserbase/stagehand/commit/4d71162beb119635b69b17637564a2bbd0e373e7)]:
  - @browserbasehq/stagehand@3.0.7

## 1.1.5

### Patch Changes

- [#1364](https://github.com/browserbase/stagehand/pull/1364) [`ca0630e`](https://github.com/browserbase/stagehand/commit/ca0630e4d96bf86708b9ff202ad8da0d0761bda8) Thanks [@tkattkat](https://github.com/tkattkat)! - Update model handling in agent evals cli

- Updated dependencies [[`605ed6b`](https://github.com/browserbase/stagehand/commit/605ed6b81a3ff8f25d4022f1e5fce6b42aecfc19), [`34e7e5b`](https://github.com/browserbase/stagehand/commit/34e7e5b292f5e6af6efc0da60118663310c5f718), [`943d2d7`](https://github.com/browserbase/stagehand/commit/943d2d79d0f289ac41c9164578f2f1dd876058f2), [`0e95cd2`](https://github.com/browserbase/stagehand/commit/0e95cd2f67672f64f0017024fd47d8b3aef59a95), [`d4237e4`](https://github.com/browserbase/stagehand/commit/d4237e40951ecd10abfdbe766672d498f8806484), [`86975e7`](https://github.com/browserbase/stagehand/commit/86975e795db7505804949a267b20509bd16b5256), [`d5e119b`](https://github.com/browserbase/stagehand/commit/d5e119be5eec84915a79f8d611b6ba0546f48c99), [`4e051b2`](https://github.com/browserbase/stagehand/commit/4e051b23add7ae276b0dbead38b4587838cfc1c1), [`6b5a3c9`](https://github.com/browserbase/stagehand/commit/6b5a3c9035654caaed2da375085b465edda97de4), [`bb85ad9`](https://github.com/browserbase/stagehand/commit/bb85ad912738623a7a866f0cb6e8d5807c6c2738), [`88d28cc`](https://github.com/browserbase/stagehand/commit/88d28cc6f31058d1cf6ec6dc948a4ae77a926b3c), [`45bcef0`](https://github.com/browserbase/stagehand/commit/45bcef0e5788b083f9e38dfd7c3bc63afcd4b6dd), [`6aa9d45`](https://github.com/browserbase/stagehand/commit/6aa9d455aa5836ec2ee8ab2e8b9df3fb218e5381), [`d382084`](https://github.com/browserbase/stagehand/commit/d382084745fff98c3e71413371466394a2625429), [`1df08cc`](https://github.com/browserbase/stagehand/commit/1df08ccb0a2cf73b5c37a91c129721114ff6371c), [`2b56600`](https://github.com/browserbase/stagehand/commit/2b566009606fcbba987260f21b075b318690ce99)]:
  - @browserbasehq/stagehand@3.0.6

## 1.1.4

### Patch Changes

- Updated dependencies [[`fa18cfd`](https://github.com/browserbase/stagehand/commit/fa18cfdc45f28e35e6566587b54612396e6ece45), [`767d168`](https://github.com/browserbase/stagehand/commit/767d1686285cf9c57675595f553f8a891f13c63b), [`f27a99c`](https://github.com/browserbase/stagehand/commit/f27a99c11b020b33736fe67af8f7f0e663c6f45f), [`91a1ca0`](https://github.com/browserbase/stagehand/commit/91a1ca07d9178c46269bfb951abb20a215eb7c29), [`1dd7d43`](https://github.com/browserbase/stagehand/commit/1dd7d4330de9022dc6cd45a8b5c86cb9e1b575ec), [`c0f3b98`](https://github.com/browserbase/stagehand/commit/c0f3b98277c15c77b2b4c3f55503e61ef3d27cf3), [`44bb4f5`](https://github.com/browserbase/stagehand/commit/44bb4f51dcccbdca8df07e4d7f8d28a7e6e793ec), [`2b70347`](https://github.com/browserbase/stagehand/commit/2b7034771bc6d6b1fabb13deaa56c299881b3728)]:
  - @browserbasehq/stagehand@3.0.4

## 1.1.3

### Patch Changes

- Updated dependencies [[`ab51232`](https://github.com/browserbase/stagehand/commit/ab51232db428be048957c0f5d67f2176eb7a5194), [`c76ade0`](https://github.com/browserbase/stagehand/commit/c76ade009ef81208accae6475ec4707d3906e566), [`ffb5e5d`](https://github.com/browserbase/stagehand/commit/ffb5e5d2ab49adcb2efdfc9e5c76e8c96268b5b3), [`772e735`](https://github.com/browserbase/stagehand/commit/772e73543e45106d7fa0fafd95ade46ae11023bc)]:
  - @browserbasehq/stagehand@3.0.3

## 1.1.2

### Patch Changes

- Updated dependencies [[`a224b33`](https://github.com/browserbase/stagehand/commit/a224b3371b6c1470baf342742fb745c7192b52c6), [`6fc9de2`](https://github.com/browserbase/stagehand/commit/6fc9de2a1079e4f2fb0b1633d8df0bb7a9f7f89f), [`4935be7`](https://github.com/browserbase/stagehand/commit/4935be788b3431527f3d110864c0fd7060cfaf7c), [`bdd76fc`](https://github.com/browserbase/stagehand/commit/bdd76fcd1e48079fc5ab8cf040ebb5997dfc6c99), [`7ea18a4`](https://github.com/browserbase/stagehand/commit/7ea18a420fc033d1b72556db83a1f41735e5a022), [`d4de014`](https://github.com/browserbase/stagehand/commit/d4de014235a18f9e1089240bc72e28cbfe77ca1c), [`2d1b573`](https://github.com/browserbase/stagehand/commit/2d1b5732dc441a3331f5743cdfed3e1037d8b3b5), [`5556041`](https://github.com/browserbase/stagehand/commit/5556041e2deaed5012363303fd7a8ac00e3242cd), [`7e4b43e`](https://github.com/browserbase/stagehand/commit/7e4b43ed46fbdd2074827e87d9a245e2dc96456b), [`7e72adf`](https://github.com/browserbase/stagehand/commit/7e72adfd7e4af5ec49ac2f552e7f1f57c1acc554), [`9bf09d0`](https://github.com/browserbase/stagehand/commit/9bf09d041111870d71cb9ffcb3ac5fa2c4b1399d), [`92d32ea`](https://github.com/browserbase/stagehand/commit/92d32eafe91a4241615cc65501b8461c6074a02b), [`ebcf3a1`](https://github.com/browserbase/stagehand/commit/ebcf3a1ffa859374d71de4931c6a9b982a565e46), [`c29a4f2`](https://github.com/browserbase/stagehand/commit/c29a4f2eca91ae2902ed9d48b2385b4436f7b664), [`6d21efa`](https://github.com/browserbase/stagehand/commit/6d21efa8b30317aa3ce3e37ac6c2222af3b967b5), [`525ef0c`](https://github.com/browserbase/stagehand/commit/525ef0c1243aaf3452ee7e4ea81b4208f4c2efd1), [`9ddb872`](https://github.com/browserbase/stagehand/commit/9ddb872e350358214e12a91cf6a614fd2ec1f74c)]:
  - @browserbasehq/stagehand@3.0.2

## 1.1.1

### Patch Changes

- Updated dependencies [[`55da8c6`](https://github.com/browserbase/stagehand/commit/55da8c6e9575cbad3246c55b17650cf6b293ddbe), [`0a5ee63`](https://github.com/browserbase/stagehand/commit/0a5ee638bde051d109eb2266e665934a12f3dc31), [`ee76881`](https://github.com/browserbase/stagehand/commit/ee7688156cb67a9f0f90dfe0dbab77423693a332), [`9e95add`](https://github.com/browserbase/stagehand/commit/9e95add37eb30db4f85e73df7760c7e63fb4131e), [`98e212b`](https://github.com/browserbase/stagehand/commit/98e212b27887241879608c6c1b6c2524477a40d7), [`d5ecbfc`](https://github.com/browserbase/stagehand/commit/d5ecbfc8e419a59b91c2115fd7f984378381d3d0)]:
  - @browserbasehq/stagehand@3.0.1

## 1.0.9

### Patch Changes

- Updated dependencies [[`09b5e1e`](https://github.com/browserbase/stagehand/commit/09b5e1e9c23c845903686db6665cc968ac34efbb), [`e3734b9`](https://github.com/browserbase/stagehand/commit/e3734b9c98352d5f0a4eca49791b0bbf2130ab41), [`8244ab2`](https://github.com/browserbase/stagehand/commit/8244ab247cd679962685ae2f7c54e874ce1fa614), [`be85b19`](https://github.com/browserbase/stagehand/commit/be85b19679a826f19702e00f0aae72fce1118ec8), [`88d1565`](https://github.com/browserbase/stagehand/commit/88d1565c65bb65a104fea2d5f5e862bbbda69677), [`ab5d6ed`](https://github.com/browserbase/stagehand/commit/ab5d6ede19aabc059badc4247f1cb2c6c9e71bae)]:
  - @browserbasehq/stagehand@2.5.0

## 1.0.8

### Patch Changes

- Updated dependencies [[`9e8c173`](https://github.com/browserbase/stagehand/commit/9e8c17374fdc8fbe7f26e6cf802c36bd14f11039)]:
  - @browserbasehq/stagehand@2.4.4

## 1.0.7

### Patch Changes

- Updated dependencies [[`f45afdc`](https://github.com/browserbase/stagehand/commit/f45afdccc8680650755fee66ffbeac32b41e075d), [`261bba4`](https://github.com/browserbase/stagehand/commit/261bba43fa79ac3af95328e673ef3e9fced3279b), [`8de7bd8`](https://github.com/browserbase/stagehand/commit/8de7bd8635c2051cd8025e365c6c8aa83d81c7e7), [`3d80421`](https://github.com/browserbase/stagehand/commit/3d804210a106a6828c7fa50f8b765b10afd4cc6a), [`0ead63d`](https://github.com/browserbase/stagehand/commit/0ead63d6526f6c286362b74b6407c8bebc900e69), [`8422828`](https://github.com/browserbase/stagehand/commit/8422828c4cd5fd5ebcf348cfbdb40c768bb76dd9), [`b769206`](https://github.com/browserbase/stagehand/commit/b7692060f98a2f49aeeefb90d8789ed034b08ec2), [`72d2683`](https://github.com/browserbase/stagehand/commit/72d2683202af7e578d98367893964b33e0828de5)]:
  - @browserbasehq/stagehand@2.4.3

## 1.0.6

### Patch Changes

- Updated dependencies [[`6b4e6e3`](https://github.com/browserbase/stagehand/commit/6b4e6e3f31d5496cf15728e9018eddeb04839542), [`e77d018`](https://github.com/browserbase/stagehand/commit/e77d0188683ebf596dfb78dfafbbca1dc32993f0), [`c20adb9`](https://github.com/browserbase/stagehand/commit/c20adb95539fed8c56a4aa413262a9c65a8e6474), [`b86df93`](https://github.com/browserbase/stagehand/commit/b86df93b9136aae96292121a29c25f3d74d84bf7), [`023c2c2`](https://github.com/browserbase/stagehand/commit/023c2c273b46d3792d7e5d3c902089487b16b531), [`8c28647`](https://github.com/browserbase/stagehand/commit/8c2864755ecd05c8f7de235d4198deec0dd5f78e), [`87e09c6`](https://github.com/browserbase/stagehand/commit/87e09c618940f364ec8af00455a19a17ec63cbd3), [`a611115`](https://github.com/browserbase/stagehand/commit/a61111525d70b450bdfc43f112380f44899c9e97), [`69913fe`](https://github.com/browserbase/stagehand/commit/69913fe1dfb8201ae2aeffa5f049fb46ab02cbc2), [`b1b83a1`](https://github.com/browserbase/stagehand/commit/b1b83a1d334fe76e5f5f9dd32dc92c16b7d40ce6), [`be8497c`](https://github.com/browserbase/stagehand/commit/be8497cb6b142cc893cea9692b8c47bd19514c60), [`98704c9`](https://github.com/browserbase/stagehand/commit/98704c9ed225ca25bbde4bb3dc286936e9c54471), [`04978bd`](https://github.com/browserbase/stagehand/commit/04978bdd30d2edcbc69eb9fd91358a16975ea2eb)]:
  - @browserbasehq/stagehand@2.4.2

## 1.0.5

### Patch Changes

- Updated dependencies [[`8a43c5a`](https://github.com/browserbase/stagehand/commit/8a43c5a86d4da40cfaedd9cf2e42186928bdf946), [`890ffcc`](https://github.com/browserbase/stagehand/commit/890ffccac5e0a60ade64a46eb550c981ffb3e84a), [`64c1072`](https://github.com/browserbase/stagehand/commit/64c10727bda50470483a3eb175c02842db0923a1), [`b077d3f`](https://github.com/browserbase/stagehand/commit/b077d3f48a97f47a71ccc79ae39b41e7f07f9c04), [`8bcb5d7`](https://github.com/browserbase/stagehand/commit/8bcb5d77debf6bf7601fd5c090efd7fde75c5d5e), [`7bf10c5`](https://github.com/browserbase/stagehand/commit/7bf10c55b267078fe847c1d7f7a60d604f9c7c94)]:
  - @browserbasehq/stagehand@2.4.1

## 1.0.4

### Patch Changes

- [#831](https://github.com/browserbase/stagehand/pull/831) [`5812b02`](https://github.com/browserbase/stagehand/commit/5812b027e4919d005321cc00626b057e6e04074b) Thanks [@seanmcguire12](https://github.com/seanmcguire12)! - added -man & -h commands for explaining how to run evals

- Updated dependencies [[`124e0d3`](https://github.com/browserbase/stagehand/commit/124e0d3bb54ddb6738ede6d7aa99a945ef1cacd1), [`6a18c1e`](https://github.com/browserbase/stagehand/commit/6a18c1ee1e46d55c6e90c4d5572e17ed8daa140c), [`1660751`](https://github.com/browserbase/stagehand/commit/1660751cd14cb5b27d44f8167216afb8d1c3c45c), [`cadac9d`](https://github.com/browserbase/stagehand/commit/cadac9da09123d12e5d496a0e8b12660964c1b33), [`759da55`](https://github.com/browserbase/stagehand/commit/759da55775eb2df81d56ae18c0f386fd9b02a9f0), [`a175a51`](https://github.com/browserbase/stagehand/commit/a175a519b8c14300db6f1ed30709e113d18e99db), [`8527a80`](https://github.com/browserbase/stagehand/commit/8527a80522c3eedb9516a6caa1a0e4e4be981a3d), [`55fca2f`](https://github.com/browserbase/stagehand/commit/55fca2f7da63cc0ef6e27b45a33f63c666cdce7e)]:
  - @browserbasehq/stagehand@2.4.0

## 1.0.3

### Patch Changes

- Updated dependencies [[`12a99b3`](https://github.com/browserbase/stagehand/commit/12a99b398d8a4c3eea3ca69a3cf793faaaf4aea3), [`2451797`](https://github.com/browserbase/stagehand/commit/2451797f64c0efa4a72fd70265110003c8d0a6cd), [`1d631a5`](https://github.com/browserbase/stagehand/commit/1d631a57a197390f672b718ae5199991ab27cfb1), [`9c398bb`](https://github.com/browserbase/stagehand/commit/9c398bb9ec2d10bdb53ad5aa7e3b58cce24fdb2b), [`c19ad7f`](https://github.com/browserbase/stagehand/commit/c19ad7f1e082e91fdeaa9c2ef63767a5a2b3a195)]:
  - @browserbasehq/stagehand@2.3.1

## 1.0.2

### Patch Changes

- Updated dependencies [[`5680d25`](https://github.com/browserbase/stagehand/commit/5680d2509352c383ad502c9f4fabde01fa638833), [`4de92a8`](https://github.com/browserbase/stagehand/commit/4de92a8af461fc95063faf39feee1d49259f58ba), [`6ef6073`](https://github.com/browserbase/stagehand/commit/6ef60730cab0ad9025f44b6eeb2c83751d1dcd35)]:
  - @browserbasehq/stagehand@2.3.0

## 1.0.1

### Patch Changes

- Updated dependencies [[`be8652e`](https://github.com/browserbase/stagehand/commit/be8652e770b57fdb3299fa0b2efa4eb0e816434e), [`6b413b7`](https://github.com/browserbase/stagehand/commit/6b413b7ad00b13ca0bd53ee2e7393023821408b6), [`7eafbd9`](https://github.com/browserbase/stagehand/commit/7eafbd9b1a73b37effa444929767df7c592caf02), [`1b50aa6`](https://github.com/browserbase/stagehand/commit/1b50aa61cf0a429dd6cb2760a08f7f698a50454b), [`f2b7f1f`](https://github.com/browserbase/stagehand/commit/f2b7f1f284eef1f96753319b66c7d0b273a6f8cd), [`c8d672f`](https://github.com/browserbase/stagehand/commit/c8d672f7c410c256defbc2e87ead99239837aa28), [`bebf204`](https://github.com/browserbase/stagehand/commit/bebf2044502333c694743078c5b0c9deae11fb79), [`37d6810`](https://github.com/browserbase/stagehand/commit/37d6810a704773d0383a86f98f5f17c7d5b21975)]:
  - @browserbasehq/stagehand@2.2.1


================================================
FILE: packages/evals/README.md
================================================
# Stagehand Evals CLI

A powerful command-line interface for running Stagehand evaluation suites and benchmarks.

## Installation

```bash
# From the stagehand root directory
pnpm install
pnpm run build:cli
```

## Usage

The evals CLI provides a clean, intuitive interface for running evaluations:

```bash
pnpm evals <command> <target> [options]
```

## Commands

### `run` - Execute evaluations

Run custom evals or external benchmarks.

```bash
# Run all custom evals
pnpm evals run all

# Run specific category
pnpm evals run act
pnpm evals run extract
pnpm evals run observe

# Run specific eval by name
pnpm evals run extract/extract_text

# Run external benchmarks
pnpm evals run benchmark:gaia
```

### `list` - View available evals

List all available evaluations and benchmarks.

```bash
# List all categories and benchmarks
pnpm evals list

# Show detailed task list
pnpm evals list --detailed
```

### `config` - Manage defaults

Configure default settings for all eval runs.

```bash
# View current configuration
pnpm evals config

# Set default values
pnpm evals config set env browserbase
pnpm evals config set trials 5
pnpm evals config set concurrency 10

# Reset to defaults
pnpm evals config reset
pnpm evals config reset trials  # Reset specific key
```

### `help` - Show help

```bash
pnpm evals help
```

## Options

### Core Options

- `-e, --env` - Environment: `local` or `browserbase` (default: local)
- `-t, --trials` - Number of trials per eval (default: 3)
- `-c, --concurrency` - Max parallel sessions (default: 3)
- `-m, --model` - Model override (e.g., gpt-4o, claude-3.5)
- `-p, --provider` - Provider override (openai, anthropic, etc.)
- `--api` - Use Stagehand API instead of SDK

### Benchmark-Specific Options

- `-l, --limit` - Max tasks to run (default: 25)
- `-s, --sample` - Random sample before limit
- `-f, --filter` - Benchmark-specific filters (key=value)

## Examples

### Running Custom Evals

```bash
# Run with custom settings
pnpm evals run act -e browserbase -t 5 -c 10

# Run with specific model
pnpm evals run observe -m gpt-4o -p openai

# Run using API
pnpm evals run extract --api
```

### Running Benchmarks

```bash
# WebBench with filters
pnpm evals run b:webbench -l 10 -f difficulty=easy -f category=READ

# GAIA with sampling
pnpm evals run b:gaia -s 100 -l 25 -f level=1

# WebVoyager with limit
pnpm evals run b:webvoyager -l 50
```

## Available Benchmarks

### OnlineMind2Web (`b:onlineMind2Web`)

Real-world web interaction tasks for evaluating web agents.

### GAIA (`b:gaia`)

General AI Assistant benchmark for complex reasoning.

**Filters:**

- `level`: 1, 2, 3 (difficulty levels)

### WebVoyager (`b:webvoyager`)

Web navigation and task completion benchmark.

### WebBench (`b:webbench`)

Real-world web automation tasks across live websites.

**Filters:**

- `difficulty`: easy, hard
- `category`: READ, CREATE, UPDATE, DELETE, FILE_MANIPULATION
- `use_hitl`: true/false

### OSWorld (`b:osworld`)

Chrome browser automation tasks from the OSWorld benchmark.

**Filters:**

- `source`: Mind2Web, test_task_1, etc.
- `evaluation_type`: url_match, string_match, dom_state, custom

## Configuration

The CLI uses a configuration file at `packages/evals/evals.config.json`, which contains:

- **defaults**: Default values for CLI options
- **benchmarks**: Metadata for external benchmarks
- **tasks**: Registry of all evaluation tasks

You can modify defaults either through the `config` command or by editing the file directly.

## Environment Variables

While the CLI reduces the need for environment variables, some are still supported for CI/CD:

- `EVAL_ENV` - Override environment setting
- `EVAL_TRIAL_COUNT` - Override trial count
- `EVAL_MAX_CONCURRENCY` - Override concurrency
- `EVAL_PROVIDER` - Override LLM provider
- `USE_API` - Use Stagehand API

## Development

### Adding New Evals

1. Create your eval file in `evals/tasks/<category>/`
2. Add it to `evals.config.json` under the `tasks` array
3. Run with: `pnpm evals run <category>/<eval_name>`

## Troubleshooting

### Command not found

If the `evals` command is not found, make sure you have:

1. Run `pnpm install` from the project root
2. Run `pnpm run build:cli` to compile the CLI

### Build errors

If you encounter build errors:

```bash
# Clean and rebuild
rm -rf packages/evals/dist/cli
pnpm run build:cli
```

### Permission errors

If you get permission errors:

```bash
chmod +x packages/evals/dist/cli/cli.js
```

## Contributing

When adding new features to the CLI:

1. Update the command in `packages/evals/cli.ts`
2. Add new options to the help text
3. Update this README with examples
4. Test with various flag combinations


================================================
FILE: packages/evals/args.ts
================================================
import process from "process";
import { EvalCategorySchema } from "./types/evals.js";
import chalk from "chalk";
import { dedent } from "./utils.js";

/** Matches a help request: `h` or `help`, optionally prefixed by `-` or `--` (case-insensitive). */
const HELP_REGEX = /^(?:--?)?(?:h|help)$/i;
/** Matches a manual request: `man`, optionally prefixed by `-` or `--` (case-insensitive). */
const MAN_REGEX = /^(?:--?)?man$/i;

/** Command-line arguments with the node executable and script path removed. */
const rawArgs = process.argv.slice(2);

/**
 * Result of parsing `key=value` style arguments.
 * Arguments that match no known key are collected, in order, in `leftover`.
 */
const parsedArgs: {
  evalName?: string;
  env?: string;
  api?: string;
  trials?: number;
  concurrency?: number;
  provider?: string;
  dataset?: string;
  max_k?: number;
  leftover: string[];
} = {
  leftover: [],
};

/**
 * Returns everything after the FIRST "=" in `arg`.
 *
 * Splitting on every "=" and taking index 1 would silently truncate values
 * that themselves contain "=" (e.g. `name=a=b` would yield `a`).
 */
function valueAfterEquals(arg: string): string {
  return arg.slice(arg.indexOf("=") + 1);
}

for (const arg of rawArgs) {
  if (arg.startsWith("env=")) {
    parsedArgs.env = valueAfterEquals(arg).toLowerCase();
  } else if (arg.startsWith("api=")) {
    parsedArgs.api = valueAfterEquals(arg).toLowerCase();
  } else if (arg.startsWith("name=")) {
    // Eval names are kept case-sensitive.
    parsedArgs.evalName = valueAfterEquals(arg);
  } else if (arg.startsWith("trials=")) {
    // Non-numeric values are ignored rather than treated as an error.
    const val = parseInt(valueAfterEquals(arg), 10);
    if (!isNaN(val)) {
      parsedArgs.trials = val;
    }
  } else if (arg.startsWith("concurrency=")) {
    const val = parseInt(valueAfterEquals(arg), 10);
    if (!isNaN(val)) {
      parsedArgs.concurrency = val;
    }
  } else if (arg.startsWith("provider=")) {
    parsedArgs.provider = valueAfterEquals(arg).toLowerCase();
  } else if (arg.startsWith("--dataset=")) {
    parsedArgs.dataset = valueAfterEquals(arg).toLowerCase();
  } else if (arg.startsWith("max_k=")) {
    const val = parseInt(valueAfterEquals(arg), 10);
    if (!isNaN(val)) {
      parsedArgs.max_k = val;
    }
  } else {
    // Positional arguments (e.g. `category act`) are resolved later.
    parsedArgs.leftover.push(arg);
  }
}

/**
 * Mirror recognised CLI overrides into the environment variables that the
 * rest of the eval runner reads. Unrecognised `env`/`api` values are ignored.
 */
switch (parsedArgs.env) {
  case "browserbase":
    process.env.EVAL_ENV = "BROWSERBASE";
    break;
  case "local":
    process.env.EVAL_ENV = "LOCAL";
    break;
  default:
    break;
}

// Only the literal strings "true" and "false" are forwarded.
if (parsedArgs.api === "true" || parsedArgs.api === "false") {
  process.env.USE_API = parsedArgs.api;
}

// Numeric overrides are stringified because environment values are strings.
for (const [envVar, override] of [
  ["EVAL_TRIAL_COUNT", parsedArgs.trials],
  ["EVAL_MAX_CONCURRENCY", parsedArgs.concurrency],
  ["EVAL_MAX_K", parsedArgs.max_k],
] as const) {
  if (override !== undefined) {
    process.env[envVar] = String(override);
  }
}

if (parsedArgs.dataset !== undefined) {
  process.env.EVAL_DATASET = parsedArgs.dataset;
}

/**
 * Categories offered by the runner. A non-empty `EVAL_CATEGORIES` environment
 * variable (comma-separated) replaces the built-in list entirely.
 */
const DEFAULT_EVAL_CATEGORIES: string[] = (() => {
  const override = process.env.EVAL_CATEGORIES;
  if (override) {
    return override.split(",");
  }
  return [
    "observe",
    "act",
    "combination",
    "extract",
    "experimental",
    "targeted_extract",
    "regression_llm_providers",
    "regression",
    "llm_clients",
    "agent",
    "external_agent_benchmarks",
  ];
})();

/** Provider taken from `EVAL_PROVIDER` at load time; `undefined` when unset. */
const providerDefault: string | undefined = process.env.EVAL_PROVIDER;

/**
 * Builds the usage text printed for help/man requests.
 *
 * @param detailed - When `false` (the default) only the header, the synopsis
 *   and a pointer to the `-man` page are returned. When `true` the full manual
 *   is returned: keys, positional filters, examples, external benchmark notes
 *   and global environment variables.
 * @returns The formatted (chalk-coloured) usage string.
 *
 * Note: the keys and examples sections are built before the `detailed` check,
 * so they are computed even when only the short form is returned.
 */
function buildUsage(detailed = false): string {
  const header = chalk.blue.bold("Stagehand • Eval Runner");
  const synopsis = chalk.cyan(
    `pnpm run evals [key=value]… [category <name>] | name=<evalName>`,
  );

  // Plain template literal (not passed through dedent): indentation is emitted as written.
  const examplesSection = `
      ${chalk.magenta.underline("Examples")}

      ${chalk.dim("# Run every evaluation locally with default settings")}
      ${chalk.green("pnpm run evals")}

      ${chalk.dim("# Same as above but in Browserbase with three trials")}  
      ${chalk.green("pnpm run evals")} ${chalk.cyan("env=")}${chalk.yellow("browserbase")} ${chalk.cyan("trials=")}${chalk.yellow("3")}

      ${chalk.dim("# Run evals using the Stagehand API")}
      ${chalk.green("pnpm run evals")} ${chalk.cyan("env=")}${chalk.yellow("browserbase")} ${chalk.cyan("api=")}${chalk.yellow("true")}

      ${chalk.dim("# Run evals from only the 'act' category with a max of 4 running at any given time")}
      ${chalk.green("pnpm run evals")} ${chalk.cyan("category")} ${chalk.yellow("act")} ${chalk.cyan("concurrency=")}${chalk.yellow("4")}

      ${chalk.dim("# Execute a specific eval by filename")}
      ${chalk.green("pnpm run evals")} ${chalk.cyan("name=")}${chalk.yellow("my_eval_name")}
  `;

  // Key reference plus the category list, rendered in rows of five categories.
  const body = dedent`
    ${chalk.magenta.underline("Keys\n")}
  ${chalk.cyan("env".padEnd(12))} ${"target environment".padEnd(24)}
    (default ${chalk.dim("LOCAL")})                [${chalk.yellow("browserbase")}, ${chalk.yellow("local")}]

  ${chalk.cyan("api".padEnd(12))} ${"use the Stagehand API".padEnd(24)}
    (default ${chalk.dim("false")})                [${chalk.yellow("true")}, ${chalk.yellow("false")}]

  ${chalk.cyan("trials".padEnd(12))} ${"number of trials per task".padEnd(24)}
    (default ${chalk.dim("3")})

  ${chalk.cyan("concurrency".padEnd(12))} ${"max parallel sessions".padEnd(24)}
    (default ${chalk.dim("3")})

  ${chalk.cyan("provider".padEnd(12))} ${"override LLM provider".padEnd(24)}
    (default ${chalk.dim(providerDefault || "varies by model")})        [${chalk.yellow("openai")}, ${chalk.yellow("anthropic")}, ${chalk.yellow("google")}, ${chalk.yellow("together")}, ${chalk.yellow("groq")}, ${chalk.yellow("cerebras")}]

  ${chalk.cyan("max_k".padEnd(12))} ${"max test cases per dataset".padEnd(24)}
    (default ${chalk.dim("25")})

  ${chalk.cyan("--dataset".padEnd(12))} ${"filter to specific benchmark".padEnd(24)}
    (optional)              [${chalk.yellow("gaia")}, ${chalk.yellow("webvoyager")}, ${chalk.yellow("webbench")}, ${chalk.yellow("osworld")}, ${chalk.yellow("onlineMind2Web")}]


    ${chalk.magenta.underline("Positional filters\n")}
      
      category <category_name>   
      
        ${chalk.gray("Available categories:")}
        ${DEFAULT_EVAL_CATEGORIES.slice(0, 5)
          .map((c) => chalk.yellow(c))
          .join(", ")},
        ${DEFAULT_EVAL_CATEGORIES.slice(5, 10)
          .map((c) => chalk.yellow(c))
          .join(", ")}${DEFAULT_EVAL_CATEGORIES.slice(10).length > 0 ? "," : ""}
        ${DEFAULT_EVAL_CATEGORIES.slice(10)
          .map((c) => chalk.yellow(c))
          .join(", ")}
  `;

  // Short form: header, synopsis and a hint to use -man for the full manual.
  if (!detailed)
    return `${header}\n\n${synopsis}\n\nFor more details: ${chalk.bold(
      "pnpm run evals -man\n",
    )}`;

  // Per-benchmark run instructions and their benchmark-specific environment variables.
  const externalBenchmarksSection = dedent`
    ${chalk.magenta.underline("\nExternal Benchmarks\n")}
    
    ${chalk.cyan.bold("WebBench")} - 5,607 real-world web automation tasks across 452 live websites
    
      ${chalk.dim("Run:")} ${chalk.green("pnpm run evals")} ${chalk.cyan("name=")}${chalk.yellow("agent/webbench")}
      
      ${chalk.dim("Or:")}  ${chalk.green("EVAL_DATASET=webbench pnpm run evals")}
      
      ${chalk.gray("Environment Variables:")}
      
      EVAL_WEBBENCH_LIMIT       max tasks to run (default: 25)
      EVAL_WEBBENCH_SAMPLE      random sample count before limit
      EVAL_WEBBENCH_DIFFICULTY  filter: [${chalk.yellow("easy")}, ${chalk.yellow("hard")}] (254 easy, 61 hard tasks)
      EVAL_WEBBENCH_CATEGORY    filter: [${chalk.yellow("READ")}, ${chalk.yellow("CREATE")}, ${chalk.yellow("UPDATE")}, ${chalk.yellow("DELETE")}, ${chalk.yellow("FILE_MANIPULATION")}]
      EVAL_WEBBENCH_USE_HITL    use only HITL dataset with difficulty ratings (true/false)
      
      ${chalk.dim("Examples:")}
      
      ${chalk.green("EVAL_WEBBENCH_DIFFICULTY=easy EVAL_WEBBENCH_LIMIT=10 pnpm run evals name=agent/webbench")}
      
      ${chalk.green("EVAL_DATASET=webbench EVAL_WEBBENCH_CATEGORY=READ pnpm run evals")}
    
    
    ${chalk.cyan.bold("GAIA")} - General AI Assistant benchmark for complex reasoning
    
      ${chalk.dim("Run:")} ${chalk.green("pnpm run evals")} ${chalk.cyan("name=")}${chalk.yellow("agent/gaia")}
      
      ${chalk.dim("Or:")}  ${chalk.green("EVAL_DATASET=gaia pnpm run evals")}
      
      ${chalk.gray("Environment Variables:")}
      
      EVAL_GAIA_LIMIT           max tasks to run (default: 25)
      EVAL_GAIA_SAMPLE          random sample count before limit
      EVAL_GAIA_LEVEL           filter by difficulty level [${chalk.yellow("1")}, ${chalk.yellow("2")}, ${chalk.yellow("3")}]
      
      ${chalk.dim("Example:")}
      
      ${chalk.green("EVAL_GAIA_LEVEL=1 EVAL_GAIA_LIMIT=10 pnpm run evals name=agent/gaia")}
    
    
    ${chalk.cyan.bold("WebVoyager")} - Web navigation and task completion benchmark
    
      ${chalk.dim("Run:")} ${chalk.green("pnpm run evals")} ${chalk.cyan("name=")}${chalk.yellow("agent/webvoyager")}
      
      ${chalk.dim("Or:")}  ${chalk.green("EVAL_DATASET=webvoyager pnpm run evals")}
      
      ${chalk.gray("Environment Variables:")}
      
      EVAL_WEBVOYAGER_LIMIT     max tasks to run (default: 25)
      EVAL_WEBVOYAGER_SAMPLE    random sample count before limit
      
      ${chalk.gray("Ground Truth Evaluation:")}
      
      WebVoyager uses ground truth answers for improved accuracy:
      • Checks agent's "Final Answer:" against reference answers
      • Supports golden (ideal) and possible (acceptable) answers
      • Falls back to screenshot evaluation when uncertain
      • Reference data: evals/datasets/webvoyager/reference-answers.json
      
      ${chalk.dim("Example:")}
      
      ${chalk.green("EVAL_WEBVOYAGER_SAMPLE=50 EVAL_WEBVOYAGER_LIMIT=10 pnpm run evals name=agent/webvoyager")}
    
    
    ${chalk.cyan.bold("OSWorld")} - Chrome browser automation tasks from the OSWorld benchmark
    
      ${chalk.dim("Run:")} ${chalk.green("pnpm run evals")} ${chalk.cyan("name=")}${chalk.yellow("agent/osworld")}
      
      ${chalk.dim("Or:")}  ${chalk.green("EVAL_DATASET=osworld pnpm run evals")}
      
      ${chalk.gray("Environment Variables:")}
      
      EVAL_OSWORLD_LIMIT           max tasks to run (default: 25)
      EVAL_OSWORLD_SAMPLE          random sample count before limit
      EVAL_OSWORLD_SOURCE          filter by source: [${chalk.yellow("Mind2Web")}, ${chalk.yellow("test_task_1")}, ...]
      EVAL_OSWORLD_EVALUATION_TYPE filter by eval type: [${chalk.yellow("url_match")}, ${chalk.yellow("string_match")}, ${chalk.yellow("dom_state")}, ${chalk.yellow("custom")}]
      EVAL_OSWORLD_TIMEOUT         timeout per task in milliseconds (default: 60000)
      
      ${chalk.dim("Examples:")}
      
      ${chalk.green("EVAL_OSWORLD_SOURCE=Mind2Web EVAL_OSWORLD_LIMIT=10 pnpm run evals name=agent/osworld")}
      
      ${chalk.green("EVAL_DATASET=osworld EVAL_OSWORLD_EVALUATION_TYPE=url_match pnpm run evals")}
    
    
    ${chalk.cyan.bold("Mind2Web")} - Real-world web interaction tasks for evaluating web agents
    
      ${chalk.dim("Run:")} ${chalk.green("pnpm run evals")} ${chalk.cyan("name=")}${chalk.yellow("agent/onlineMind2Web")}
      
      ${chalk.dim("Or:")}  ${chalk.green("EVAL_DATASET=onlineMind2Web pnpm run evals")}
      
      ${chalk.gray("Environment Variables:")}
      
      EVAL_ONLINEMIND2WEB_LIMIT     max tasks to run (default: 25)
      EVAL_ONLINEMIND2WEB_SAMPLE    random sample count before limit
      
      ${chalk.dim("Example:")}
      
      ${chalk.green("EVAL_ONLINEMIND2WEB_SAMPLE=50 EVAL_ONLINEMIND2WEB_LIMIT=10 pnpm run evals name=agent/onlineMind2Web")}
  `;

  // Environment variables that apply to every run, with the CLI key that overrides each.
  const envSection = dedent`
    ${chalk.magenta.underline("\nGlobal Environment Variables\n")}
      
      EVAL_ENV              target environment, overridable via ${chalk.cyan("env=")}
      
      EVAL_TRIAL_COUNT      number of trials, overridable via ${chalk.cyan("trials=")}
      
      EVAL_MAX_CONCURRENCY  parallel sessions, overridable via ${chalk.cyan("concurrency=")}
      
      EVAL_PROVIDER         LLM provider, overridable via ${chalk.cyan("provider=")}
      
      EVAL_MAX_K            global limit for all benchmarks (overrides individual limits)
      
      EVAL_DATASET          filter to specific benchmark, overridable via ${chalk.cyan("--dataset=")}
      
      USE_API               use Stagehand API, overridable via ${chalk.cyan("api=")}
      
      EVAL_MODELS           comma-separated list of models to use
      
      AGENT_EVAL_MAX_STEPS  max steps for agent tasks (default: 50)
  `;

  // Full manual: every section, in display order.
  return `${header}\n\n${synopsis}\n\n${body}\n${examplesSection}\n${externalBenchmarksSection}\n${envSection}\n`;
}

// A help or man flag anywhere on the command line short-circuits the run:
// print the usage text (the full manual only when a man flag is present) and
// exit successfully.
const wantsHelp = rawArgs.filter((arg) => HELP_REGEX.test(arg)).length > 0;
const wantsMan = rawArgs.filter((arg) => MAN_REGEX.test(arg)).length > 0;

if (wantsMan || wantsHelp) {
  const usageText = buildUsage(wantsMan);
  console.log(usageText);
  process.exit(0);
}

/** Category selected via `category <name>`, or `null` when no category filter applies. */
let filterByCategory: string | null = null;
/** Eval selected via `name=<eval>` or a bare positional argument, or `null`. */
let filterByEvalName: string | null = parsedArgs.evalName || null;

// An explicit name= takes precedence; positional arguments are consulted only
// when no eval name was given.
if (filterByEvalName === null && parsedArgs.leftover.length > 0) {
  const [keyword, categoryName] = parsedArgs.leftover;

  if (keyword.toLowerCase() !== "category") {
    // Any other first positional argument is treated as a task/eval name.
    filterByEvalName = keyword;
  } else {
    filterByCategory = categoryName;
    if (!filterByCategory) {
      console.error(chalk.red("Error: Category name not specified."));
      process.exit(1);
    }

    try {
      EvalCategorySchema.parse(filterByCategory);
    } catch {
      const validList = DEFAULT_EVAL_CATEGORIES.join(", ");
      console.error(
        chalk.red(
          `Error: Invalid category "${filterByCategory}". Valid categories are: ${validList}`,
        ),
      );
      process.exit(1);
    }
  }
}

// The provider override is exported to the environment only after the
// help/validation paths above have had a chance to exit.
if (parsedArgs.provider !== undefined) {
  process.env.EVAL_PROVIDER = parsedArgs.provider;
}

export {
  filterByCategory,
  filterByEvalName,
  DEFAULT_EVAL_CATEGORIES,
  parsedArgs,
};


================================================
FILE: packages/evals/assets/cart.html
================================================
<!doctype html>
<html lang="en">
  <head>
    <meta charset="UTF-8" />
    <meta name="viewport" content="width=device-width, initial-scale=1.0" />
    <title>Document</title>
  </head>
  <body>
    <script>
      // Returns the value of the query-string parameter `param` from the
      // current page URL (URLSearchParams.get yields null when it is absent).
      function getQueryParam(param) {
        const urlParams = new URLSearchParams(window.location.search);
        return urlParams.get(param);
      }
      // Read once while the script runs, before the DOM is ready.
      const item = getQueryParam("item");
      // Wait for the DOM so that #cartItem (declared after this script) exists,
      // then show the confirmation text. textContent is used, so the value is
      // inserted as plain text rather than parsed as HTML.
      document.addEventListener("DOMContentLoaded", function () {
        document.getElementById("cartItem").textContent =
          `Congratulations, you have 1 ${item} in your cart`;
      });
    </script>
    <div id="cartItem"></div>
  </body>
</html>


================================================
FILE: packages/evals/assets/peeler.html
================================================
<!doctype html>
<html lang="en">
  <head>
    <meta charset="UTF-8" />
    <meta name="viewport" content="width=device-width, initial-scale=1.0" />
    <title>Document</title>
  </head>
  <body>
    <h1>Welcome to Our Page</h1>

    <div class="product-card">
      <div class="product-info">
        <h2>Knife Set</h2>
        <p>
          High-quality stainless steel knives for all your cooking needs.<a
            >my stuff</a
          >
          more stuff
        </p>
      </div>
      <button onclick="location.href='cart.html?item=B'">Add to cart</button>
    </div>
    <div class="product-card">
      <div class="product-info">
        <h2>Peeler</h2>
        <p>The ultimate tool for peeling fruits and vegetables.</p>
      </div>
      <button onclick="location.href='cart.html?item=A'">Add to cart</button>
    </div>
    <a href="cart.html" aria-role="button">
      <div>hi world</div>
    </a>
    <p>
      Baseball evolved from older
      <a href="/wiki/Bat-and-ball_games" title="Bat-and-ball games"
        >bat-and-ball games</a
      >
      already being played in England by the mid-18th century. This game was
      brought by immigrants to North America,
      <a
        href="/wiki/History_of_baseball_in_the_United_States"
        title="History of baseball in the United States"
        >where the modern version developed</a
      >.
    </p>
  </body>
</html>


================================================
FILE: packages/evals/browserbaseCleanup.ts
================================================
import type { V3 } from "@browserbasehq/stagehand";

/** Upper bound, in milliseconds, on how long session cleanup waits for the close command. */
const CLOSE_TIMEOUT_MS = 5_000;

/**
 * Waits until `promise` settles (fulfilled or rejected) or `timeoutMs`
 * elapses, whichever happens first. Never rejects: a rejection of `promise`
 * is swallowed. The timer is always cleared before returning.
 *
 * @param promise - The operation to wait for.
 * @param timeoutMs - Maximum time to wait, in milliseconds.
 */
async function settleWithTimeout(
  promise: Promise<unknown>,
  timeoutMs: number,
): Promise<void> {
  let timer: ReturnType<typeof setTimeout> | undefined;

  const deadline = new Promise<void>((expire) => {
    timer = setTimeout(expire, timeoutMs);
  });
  // Map both outcomes to a plain resolution so the race cannot reject.
  const settled = promise.then(
    () => undefined,
    () => undefined,
  );

  try {
    await Promise.race([settled, deadline]);
  } finally {
    if (timer !== undefined) {
      clearTimeout(timer);
    }
  }
}

/**
 * Best-effort shutdown of a Browserbase-backed session.
 *
 * Does nothing when no instance is given, when the instance is not running on
 * Browserbase, or when `USE_API` is "true" (case-insensitive). Otherwise it
 * sends `Browser.close` over the instance's connection and waits at most
 * `CLOSE_TIMEOUT_MS` for it to settle. Failures are ignored.
 *
 * @param v3 - The Stagehand instance to clean up; may be `null` or omitted.
 */
export async function endBrowserbaseSession(v3?: V3 | null): Promise<void> {
  const usingApi = (process.env.USE_API ?? "").toLowerCase() === "true";
  if (!v3?.isBrowserbase || usingApi) {
    return;
  }

  try {
    const closing = v3.context.conn.send("Browser.close");
    await settleWithTimeout(closing, CLOSE_TIMEOUT_MS);
  } catch {
    // best-effort cleanup: errors while closing are intentionally ignored
  }
}


================================================
FILE: packages/evals/cli.ts
================================================
import process from "process";
import chalk from "chalk";
import fs from "fs";
import path from "path";
import { spawn } from "child_process";
import { getCurrentDirPath } from "./runtimePaths.js";

// Directory reported by getCurrentDirPath() (presumably this module's own
// directory at runtime — confirm in runtimePaths).
const moduleDir = getCurrentDirPath();
// Location of the evals configuration file, resolved next to moduleDir.
const CONFIG_PATH = path.join(moduleDir, "evals.config.json");

/** Shape of the JSON document stored at CONFIG_PATH. */
interface Config {
  /** Default values for the CLI options, editable through `config set`. */
  defaults: {
    /** Target environment name (the CLI help lists `local|browserbase`). */
    env: string;
    /** Number of trials per eval. */
    trials: number;
    /** Maximum number of parallel sessions. */
    concurrency: number;
    /** Provider override; `null` when not set. */
    provider: string | null;
    /** Model override; `null` when not set. */
    model: string | null;
    /** Whether to use the Stagehand API. */
    api: boolean;
  };
  /** Per-benchmark settings, keyed by a benchmark identifier. */
  benchmarks: Record<
    string,
    {
      /** Maximum number of tasks to run. */
      limit: number;
      // NOTE(review): presumably the filter keys the benchmark accepts — confirm.
      filters?: string[];
      // NOTE(review): units are not visible here (likely milliseconds) — confirm.
      timeout?: number;
    }
  >;
  /** Registry of eval tasks, each with the categories it belongs to. */
  tasks: Array<{ name: string; categories: string[] }>;
}

/**
 * Reads the config file at CONFIG_PATH synchronously and parses it as JSON.
 * The parsed value is returned as-is; its shape is not validated.
 *
 * @returns The parsed configuration.
 * @throws If the file cannot be read or does not contain valid JSON.
 */
function loadConfig(): Config {
  const rawJson = fs.readFileSync(CONFIG_PATH, "utf-8");
  const config: Config = JSON.parse(rawJson);
  return config;
}

/**
 * Serialises `config` as JSON with two-space indentation and synchronously
 * overwrites the file at CONFIG_PATH with it.
 *
 * @param config - The configuration to persist.
 */
function saveConfig(config: Config): void {
  const serialized = JSON.stringify(config, null, 2);
  fs.writeFileSync(CONFIG_PATH, serialized);
}

/**
 * Prints the CLI help screen to stdout: banner, synopsis, command list,
 * usage examples and the supported options.
 */
function printHelp(): void {
  const banner = `⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⢠⡾⠻⣶⡀⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⢠⡶⠛⢳⡆⠀⠀⠀⠀⢸⡇⠀⢸⡇⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⢸⡇⠀⢸⣷⠶⣦⣴⠶⣾⡇⠀⢸⡇⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⢸⡇⠀⢸⡇⠀⢸⡇⠀⢸⡇⠀⢸⡇⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⢸⡇⠀⠘⠷⣤⢾⡏⠉⠉⠉⠙⣾⡇⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⢸⡇⠀⠀⠀⠀⠈⣻⡿⠟⠂⠀⣿⠃⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠈⣷⠀⠀⠀⠀⢰⡏⠀⠀⠀⢀⣿⠀⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠙⣷⡀⠀⠀⠀⠀⠀⠀⢀⡾⠁⠀⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠈⠙⠷⣦⣤⣤⣴⠾⠋⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀
⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀⠀`;

  // Small formatters so each section below reads as data.
  const sectionTitle = (title: string): string =>
    chalk.magenta.underline(title);
  const note = (text: string): string => chalk.dim(text);
  const command = (text: string): string => chalk.green(text);
  // Flags are padded to a 20-character column before the description.
  const optionRow = (flags: string, summary: string): string =>
    chalk.cyan(flags.padEnd(20)) + summary;

  console.log(chalk.yellow(banner));
  console.log(chalk.yellow.bold("\nStagehand Evals CLI"));
  console.log(chalk.cyan("\nevals <command> <target> [options]\n"));

  console.log(sectionTitle("Commands"));
  const commandLines = [
    "  run       Execute evals or benchmarks",
    "  list      List available evals/benchmarks",
    "  config    Get/set default configuration",
    "  help      Show this help message\n",
  ];
  for (const line of commandLines) {
    console.log(line);
  }

  console.log(sectionTitle("Examples"));
  console.log(note("  # Run all custom evals"));
  console.log(command("  evals run all\n"));

  console.log(note("  # Run specific category"));
  console.log(command("  evals run act") + chalk.cyan(" -e browserbase -t 5\n"));

  console.log(note("  # Run specific eval"));
  console.log(command("  evals run login\n"));

  console.log(note("  # Run benchmark"));
  console.log(
    command("  evals run benchmark:onlineMind2Web") +
      chalk.cyan(" -l 10 -f difficulty=easy\n"),
  );

  console.log(note("  # Configure defaults"));
  console.log(command("  evals config set env browserbase"));
  console.log(command("  evals config set trials 5\n"));

  console.log(sectionTitle("Options"));
  const coreOptions: Array<[string, string]> = [
    ["  -e, --env", "Environment: local|browserbase"],
    ["  -t, --trials", "Number of trials per eval"],
    ["  -c, --concurrency", "Max parallel sessions"],
    ["  -m, --model", "Model override"],
    ["  -p, --provider", "Provider override"],
    ["  --api", "Use Stagehand API\n"],
  ];
  for (const [flags, summary] of coreOptions) {
    console.log(optionRow(flags, summary));
  }

  console.log(note("  Benchmark-specific:"));
  const benchmarkOptions: Array<[string, string]> = [
    ["  -l, --limit", "Max tasks to run"],
    ["  -s, --sample", "Random sample before limit"],
    ["  -f, --filter", "Benchmark filters (key=value)\n"],
  ];
  for (const [flags, summary] of benchmarkOptions) {
    console.log(optionRow(flags, summary));
  }
}

/**
 * Handles `evals config ...`: shows, updates, or resets the persisted defaults.
 *
 * Supported forms:
 * - no arguments: print the current defaults
 * - `set <key> <value>`: validate the value and persist it
 * - `reset [key]`: restore one key, or every key, to the built-in defaults
 * - `path`: print the config file location
 *
 * Exits the process with code 1 on an unknown key, an invalid value, or an
 * unrecognized subcommand.
 *
 * @param args - Arguments that followed the `config` command.
 */
function handleConfig(args: string[]): void {
  const config = loadConfig();

  // The `in` operator also matches inherited names such as "toString", which
  // would be reported as successfully set without changing anything. Only own
  // properties of the defaults object are real settings.
  const isConfigKey = (candidate: string): boolean =>
    Object.prototype.hasOwnProperty.call(config.defaults, candidate);

  if (args.length === 0) {
    // Show current config
    console.log(chalk.blue.bold("\nCurrent Configuration"));
    console.log(chalk.cyan("\nDefaults:"));
    Object.entries(config.defaults).forEach(([key, value]) => {
      console.log(`  ${key}: ${chalk.yellow(value ?? "not set")}`);
    });
    return;
  }

  if (args[0] === "set" && args.length >= 3) {
    const [, key, ...valueParts] = args;
    const value = valueParts.join(" ");

    if (!isConfigKey(key)) {
      console.error(chalk.red(`Error: Unknown config key "${key}"`));
      console.log(
        chalk.dim(`Valid keys: ${Object.keys(config.defaults).join(", ")}`),
      );
      process.exit(1);
    }

    // Validate and assign per key so each field only ever receives a value of
    // its own type.
    let parsedValue: string | number | boolean | null = value;
    if (key === "env") {
      // The runner compares env against the lowercase literal "browserbase",
      // so normalize case and reject anything it would not recognize
      // (including "null"/"none", which env cannot hold).
      const normalizedEnv = value.trim().toLowerCase();
      if (normalizedEnv !== "local" && normalizedEnv !== "browserbase") {
        console.error(
          chalk.red('Error: env must be "local" or "browserbase"'),
        );
        process.exit(1);
      }
      parsedValue = normalizedEnv;
      config.defaults.env = normalizedEnv;
    } else if (key === "trials" || key === "concurrency") {
      const count = parseInt(value, 10);
      if (isNaN(count)) {
        console.error(chalk.red(`Error: ${key} must be a number`));
        process.exit(1);
      }
      parsedValue = count;
      if (key === "trials") {
        config.defaults.trials = count;
      } else {
        config.defaults.concurrency = count;
      }
    } else if (key === "api") {
      // Previously any value other than "true" was silently stored as false.
      if (value !== "true" && value !== "false") {
        console.error(chalk.red('Error: api must be "true" or "false"'));
        process.exit(1);
      }
      const enabled = value === "true";
      parsedValue = enabled;
      config.defaults.api = enabled;
    } else if (key === "provider" || key === "model") {
      // "null" / "none" clear the override.
      const override = value === "null" || value === "none" ? null : value;
      parsedValue = override;
      if (key === "provider") {
        config.defaults.provider = override;
      } else {
        config.defaults.model = override;
      }
    }

    saveConfig(config);
    console.log(chalk.green(`✓ Set ${key} to ${parsedValue}`));
  } else if (args[0] === "reset") {
    const defaultConfig: Config["defaults"] = {
      env: "local",
      trials: 3,
      concurrency: 3,
      provider: null,
      model: null,
      api: false,
    };

    if (args[1] && isConfigKey(args[1])) {
      const key = args[1];
      // Type-safe reset by key
      if (key === "env") {
        config.defaults.env = defaultConfig.env;
      } else if (key === "trials") {
        config.defaults.trials = defaultConfig.trials;
      } else if (key === "concurrency") {
        config.defaults.concurrency = defaultConfig.concurrency;
      } else if (key === "provider") {
        config.defaults.provider = defaultConfig.provider;
      } else if (key === "model") {
        config.defaults.model = defaultConfig.model;
      } else if (key === "api") {
        config.defaults.api = defaultConfig.api;
      }
      saveConfig(config);
      console.log(chalk.green(`✓ Reset ${args[1]} to default`));
    } else if (!args[1]) {
      config.defaults = defaultConfig;
      saveConfig(config);
      console.log(chalk.green("✓ Reset all settings to defaults"));
    } else {
      console.error(chalk.red(`Error: Unknown config key "${args[1]}"`));
      process.exit(1);
    }
  } else if (args[0] === "path") {
    console.log(CONFIG_PATH);
  } else {
    console.error(chalk.red("Error: Invalid config command"));
    console.log(
      chalk.dim("Usage: evals config [set <key> <value> | reset [key] | path]"),
    );
    process.exit(1);
  }
}

/**
 * Handles `evals list`: prints the custom eval categories with their task
 * counts, then the configured benchmarks with their `b:` shorthand.
 *
 * With `--detailed` / `-d` every task name is listed under its category;
 * otherwise a tip about that flag is printed. Categories whose name contains
 * "external_agent_benchmarks" are left out of the category listings.
 *
 * @param args - Arguments that followed the `list` command.
 */
function handleList(args: string[]): void {
  const config = loadConfig();
  const isBenchmarkCategory = (name: string): boolean =>
    name.includes("external_agent_benchmarks");

  console.log(chalk.blue.bold("\nAvailable Evals\n"));

  // Bucket task names under every category they belong to, keeping the order
  // in which categories are first encountered.
  const tasksByCategory = new Map<string, string[]>();
  for (const task of config.tasks) {
    for (const cat of task.categories) {
      const bucket = tasksByCategory.get(cat);
      if (bucket === undefined) {
        tasksByCategory.set(cat, [task.name]);
      } else {
        bucket.push(task.name);
      }
    }
  }

  // Summary of custom eval categories
  console.log(chalk.magenta.underline("Custom Eval Categories"));
  for (const [category, names] of tasksByCategory) {
    if (isBenchmarkCategory(category)) {
      continue;
    }
    const label = chalk.cyan(category);
    const count = chalk.dim(`(${names.length} evals)`);
    console.log(`  ${label} ${count}`);
  }

  console.log(chalk.magenta.underline("\nBenchmarks"));
  for (const name of Object.keys(config.benchmarks)) {
    const shorthand = chalk.cyan(`b:${name}`.padEnd(20));
    const longForm = chalk.dim(`benchmark:${name}`);
    console.log(`  ${shorthand} ${longForm}`);
  }

  const wantsDetails = args.includes("--detailed") || args.includes("-d");
  if (!wantsDetails) {
    console.log(
      chalk.yellow(
        "\n💡 Tip: Use 'evals list --detailed' to see all individual tasks",
      ),
    );
    return;
  }

  console.log(chalk.magenta.underline("\n\nDetailed Task List"));
  for (const [category, names] of tasksByCategory) {
    if (isBenchmarkCategory(category)) {
      continue;
    }
    console.log(chalk.cyan(`\n${category}:`));
    for (const name of names) {
      console.log(`  - ${name}`);
    }
  }
}

/**
 * Parses the arguments of `evals run` into options, a target, and benchmark
 * filters.
 *
 * - Short flags (`-e`, `-t`, `-c`, `-m`, `-p`, `-l`, `-s`, `-f`) are expanded to
 *   their long names; any other flag is kept under its own name.
 * - `--api` is a boolean switch and takes no value.
 * - `trials`, `concurrency`, `limit` and `sample` are parsed as base-10
 *   integers; a value that is not a number is ignored instead of being stored
 *   as `NaN`.
 * - `-f/--filter key=value` may be repeated. Only the first `=` separates key
 *   from value, so values may themselves contain `=`.
 * - The first argument that is neither a flag nor a flag's value becomes the
 *   target; later positional arguments are ignored.
 *
 * A flag that expects a value but is followed by another flag (or by nothing)
 * is skipped without consuming the following argument.
 *
 * @param rawArgs - Arguments that followed the `run` command.
 * @returns The parsed options, the optional target, and the filter pairs in
 *   the order they were given.
 */
function parseArgs(rawArgs: string[]): {
  options: Record<string, string | number | boolean>;
  target?: string;
  filters: Array<[string, string]>;
} {
  // Short flag -> long option name. A Map avoids accidental hits on
  // Object.prototype members (e.g. a flag literally named "constructor").
  const shortFlags = new Map<string, string>([
    ["e", "env"],
    ["t", "trials"],
    ["c", "concurrency"],
    ["m", "model"],
    ["p", "provider"],
    ["l", "limit"],
    ["s", "sample"],
    ["f", "filter"],
  ]);
  const numericOptions = new Set(["trials", "concurrency", "limit", "sample"]);

  const options: Record<string, string | number | boolean> = {};
  const filters: Array<[string, string]> = [];
  let target: string | undefined;

  for (let i = 0; i < rawArgs.length; i++) {
    const arg = rawArgs[i];

    if (!arg.startsWith("-")) {
      if (!target) {
        target = arg;
      }
      continue;
    }

    const flagName = arg.replace(/^--?/, "");
    const optionName = shortFlags.get(flagName) ?? flagName;

    if (optionName === "api") {
      options.api = true;
      continue;
    }

    // Peek before consuming: if the value is missing, the next argument is
    // another flag and must still be processed on the next iteration.
    const value = rawArgs[i + 1];
    if (value === undefined || value.startsWith("-")) {
      continue;
    }
    i++;

    if (optionName === "filter") {
      // Split on the first "=" only, so "url=https://x?a=b" keeps its value
      // intact. Entries without a key are dropped.
      const separator = value.indexOf("=");
      if (separator > 0) {
        filters.push([value.slice(0, separator), value.slice(separator + 1)]);
      }
    } else if (numericOptions.has(optionName)) {
      const parsed = parseInt(value, 10);
      if (!Number.isNaN(parsed)) {
        options[optionName] = parsed;
      }
    } else if (value) {
      options[optionName] = value;
    }
  }

  return { options, target, filters };
}

/**
 * Handles `evals run <target> [options]`.
 *
 * Merges command-line options with the configured defaults, translates them
 * into the `EVAL_*` / `USE_API` environment variables, resolves the target
 * (benchmark, `all`, pattern, category, or single eval name) into legacy
 * runner arguments, runs `pnpm run build`, and then spawns the eval runner
 * with that environment.
 *
 * The process exits with the build's exit code if the build fails, otherwise
 * with the runner's exit code. A runner terminated by a signal yields a
 * non-zero exit code (130 for SIGINT, 143 for SIGTERM, 1 otherwise).
 *
 * @param args - Arguments that followed the `run` command.
 */
function handleRun(args: string[]): void {
  const config = loadConfig();
  const { options, target, filters } = parseArgs(args);

  // Merge with defaults. Precedence for env: explicit -e/--env, then
  // STAGEHAND_BROWSER_TARGET (when it is "local" or "browserbase"), then the
  // configured default.
  const stagehandTarget = (process.env.STAGEHAND_BROWSER_TARGET ?? "")
    .toLowerCase()
    .trim();
  if (
    !options.env &&
    (stagehandTarget === "local" || stagehandTarget === "browserbase")
  ) {
    options.env = stagehandTarget;
  }
  const finalOptions = { ...config.defaults, ...options };

  // Build environment variables
  const env = { ...process.env };

  // Set core environment variables; anything other than "browserbase" runs locally.
  if (finalOptions.env === "browserbase") {
    env.EVAL_ENV = "BROWSERBASE";
  } else {
    env.EVAL_ENV = "LOCAL";
  }

  if (finalOptions.api) {
    env.USE_API = "true";
  }

  if (finalOptions.trials) {
    env.EVAL_TRIAL_COUNT = String(finalOptions.trials);
  }

  if (finalOptions.concurrency) {
    env.EVAL_MAX_CONCURRENCY = String(finalOptions.concurrency);
  }

  if (finalOptions.provider) {
    env.EVAL_PROVIDER = finalOptions.provider;
  }

  if (finalOptions.model) {
    env.EVAL_MODEL_OVERRIDE = finalOptions.model;
  }

  // Handle benchmark-specific options
  let evalName: string | undefined;
  let categoryFilter: string | undefined;

  if (target) {
    if (target.startsWith("b:") || target.startsWith("benchmark:")) {
      // Running a benchmark
      const benchmarkName = target.replace(/^(b:|benchmark:)/, "");

      if (!config.benchmarks[benchmarkName]) {
        console.error(chalk.red(`Error: Unknown benchmark "${benchmarkName}"`));
        console.log(
          chalk.dim(
            `Available benchmarks: ${Object.keys(config.benchmarks).join(", ")}`,
          ),
        );
        process.exit(1);
      }

      // Map to the actual eval name.
      // NOTE(review): a benchmark present in config.benchmarks but missing
      // from this map leaves evalName undefined, so no name filter is passed
      // to the runner — confirm the two lists are kept in sync.
      const benchmarkMap: Record<string, string> = {
        webbench: "agent/webbench",
        gaia: "agent/gaia",
        webvoyager: "agent/webvoyager",
        osworld: "agent/osworld",
        onlineMind2Web: "agent/onlineMind2Web",
        webtailbench: "agent/webtailbench",
      };

      evalName = benchmarkMap[benchmarkName];
      env.EVAL_DATASET = benchmarkName;

      // Set benchmark-specific options
      if (options.limit) {
        env.EVAL_MAX_K = String(options.limit);
        env[`EVAL_${benchmarkName.toUpperCase()}_LIMIT`] = String(
          options.limit,
        );
      }

      if (options.sample) {
        env[`EVAL_${benchmarkName.toUpperCase()}_SAMPLE`] = String(
          options.sample,
        );
      }

      // Apply filters as EVAL_<BENCHMARK>_<KEY>=<value>
      filters.forEach(([key, value]) => {
        const envKey = `EVAL_${benchmarkName.toUpperCase()}_${key.toUpperCase()}`;
        env[envKey] = value;
      });
    } else if (target === "all") {
      // Run all evals (no filter)
    } else if (target.includes("/") || target.includes("*")) {
      // Pattern matching - treat as eval name
      evalName = target;
    } else {
      // Check if it's a category
      const categories = new Set<string>();
      config.tasks.forEach((task) => {
        task.categories.forEach((cat) => categories.add(cat));
      });

      if (categories.has(target)) {
        categoryFilter = target;
      } else {
        // Assume it's a specific eval name
        evalName = target;
      }
    }
  }

  // Build the legacy command
  const legacyArgs: string[] = [];

  if (evalName) {
    legacyArgs.push(`name=${evalName}`);
  } else if (categoryFilter) {
    legacyArgs.push("category", categoryFilter);
  }

  // Run the existing eval system with our environment
  console.log(chalk.blue.bold("\nRunning evals...\n"));

  // Build first if needed. The shell is kept here because the arguments are
  // static and `pnpm` may be a shell shim.
  const buildChild = spawn("pnpm", ["run", "build"], {
    stdio: "inherit",
    shell: true,
  });

  buildChild.on("exit", (buildCode) => {
    if (buildCode !== 0) {
      process.exit(buildCode || 1);
    }

    const compiledEvalPath = path.resolve(
      moduleDir,
      "..",
      "esm",
      "index.eval.js",
    );
    // When built to packages/evals/dist/cli/cli.js, moduleDir is packages/evals/dist/cli/
    // Source is at packages/evals/index.eval.ts from repo root
    const sourceEvalPath = path.resolve(
      moduleDir,
      "..",
      "..",
      "packages",
      "evals",
      "index.eval.ts",
    );

    // Starts the eval runner: the compiled entry if it exists, otherwise the
    // TypeScript source through tsx.
    const launchEval = () => {
      if (fs.existsSync(compiledEvalPath)) {
        // No shell: process.execPath is an absolute binary path, and in shell
        // mode arguments are joined unquoted, which breaks paths containing
        // spaces and exposes pattern targets such as "agent/*" to expansion.
        return spawn(process.execPath, [compiledEvalPath, ...legacyArgs], {
          env,
          stdio: "inherit",
        });
      }

      let tsxCliPath: string | undefined;
      try {
        // Resolve the local tsx CLI entry within this package installation
        // This avoids requiring a globally installed tsx binary
        tsxCliPath = require.resolve("tsx/dist/cli.js");
      } catch {
        // no-op; will fall back to a PATH-resolved "tsx" if not found
      }

      const tsxArgs = [sourceEvalPath, ...legacyArgs];

      if (tsxCliPath) {
        return spawn(process.execPath, [tsxCliPath, ...tsxArgs], {
          env,
          stdio: "inherit",
        });
      }

      // A bare "tsx" is looked up on PATH. Only Windows needs a shell for
      // that, because the binary is installed there as a .cmd shim.
      return spawn("tsx", tsxArgs, {
        env,
        stdio: "inherit",
        shell: process.platform === "win32",
      });
    };

    const child = launchEval();

    // Without a shell a missing executable surfaces as an "error" event
    // instead of a shell exit status, so report it explicitly.
    child.on("error", (err: Error) => {
      console.error(
        chalk.red(`Error: Failed to start eval process: ${err.message}`),
      );
      process.exit(1);
    });

    child.on("exit", (code, signal) => {
      if (code !== null) {
        process.exit(code);
      }
      // code is null when the child was terminated by a signal; that must not
      // be reported as success.
      process.exit(signal === "SIGINT" ? 130 : signal === "SIGTERM" ? 143 : 1);
    });

    // Forward SIGINT (Ctrl+C) and SIGTERM to child process, then force-kill
    // and exit if it has not gone away after one second.
    process.on("SIGINT", () => {
      console.log("\n\nReceived SIGINT, killing child process...");
      child.kill("SIGINT");
      setTimeout(() => {
        child.kill("SIGKILL");
        process.exit(130);
      }, 1000);
    });

    process.on("SIGTERM", () => {
      console.log("\n\nReceived SIGTERM, killing child process...");
      child.kill("SIGTERM");
      setTimeout(() => {
        child.kill("SIGKILL");
        process.exit(143);
      }, 1000);
    });
  });
}

/**
 * CLI entry point: reads the command from `process.argv` and dispatches to
 * the matching handler.
 *
 * - `run`, `list`, `config` receive the arguments that follow the command.
 * - `help`, `--help`, `-h` print the usage text.
 * - No command at all, or an unknown flag, prints an error plus the usage
 *   text and exits with code 1.
 * - Any other word is treated as a run target for backward compatibility, so
 *   `evals act -t 5` behaves like `evals run act -t 5`.
 */
function main(): void {
  const args = process.argv.slice(2);
  const [command, ...commandArgs] = args;

  if (command === undefined) {
    console.error(chalk.red("Error: No command specified"));
    printHelp();
    process.exit(1);
  } else if (command === "run") {
    handleRun(commandArgs);
  } else if (command === "list") {
    handleList(commandArgs);
  } else if (command === "config") {
    handleConfig(commandArgs);
  } else if (command === "help" || command === "--help" || command === "-h") {
    printHelp();
  } else if (command.startsWith("-")) {
    console.error(chalk.red(`Error: Unknown command "${command}"`));
    printHelp();
    process.exit(1);
  } else {
    // Direct target (backward compatibility): the command itself is the
    // target, so the full argument list is handed to the run handler.
    handleRun(args);
  }
}

// Run the CLI: main() is invoked at module top level, so command dispatch
// happens as soon as this file is executed.
main();


================================================
FILE: packages/evals/datasets/gaia/GAIA_web.jsonl
================================================
{"task_id": "e1fc63a2-da7a-432f-be78-7c4a95598703", "Level": 1, "Final answer": "17", "id": "level1-0", "web": "https://www.google.com/", "ques": "If Eliud Kipchoge could maintain his record-making marathon pace indefinitely, how many thousand hours would it take him to run the distance between the Earth and the Moon its closest approach? Please use the minimum perigee value on the Wikipedia page for the Moon when carrying out your calculation. Round your result to the nearest 1000 hours and do not use any comma separators if necessary."}
{"task_id": "8e867cd7-cff9-4e6c-867a-ff5ddc2550be", "Level": 1, "Final answer": "3", "id": "level1-1", "web": "https://www.google.com/", "ques": "How many studio albums were published by Mercedes Sosa between 2000 and 2009 (included)? You can use the latest 2022 version of english wikipedia."}
{"task_id": "5d0080cb-90d7-4712-bc33-848150e917d3", "Level": 1, "Final answer": "0.1777", "id": "level1-2", "web": "https://www.google.com/", "ques": "What was the volume in m^3 of the fish bag that was calculated in the University of Leicester paper \"Can Hiccup Supply Enough Fish to Maintain a Dragon\u2019s Diet?\""}
{"task_id": "a1e91b78-d3d8-4675-bb8d-62741b4b68a6", "Level": 1, "Final answer": "3", "id": "level1-3", "web": "https://www.google.com/", "ques": "In the video https://www.youtube.com/watch?v=L1vXCYZAYYM, what is the highest number of bird species to be on camera simultaneously?"}
{"task_id": "46719c30-f4c3-4cad-be07-d5cb21eee6bb", "Level": 1, "Final answer": "Mapping Human Oriented Information to Software Agents for Online Systems Usage", "id": "level1-4", "web": "https://www.google.com/", "ques": "Of the authors (First M. Last) that worked on the paper \"Pie Menus or Linear Menus, Which Is Better?\" in 2015, what was the title of the first paper authored by the one that had authored prior papers?"}
{"task_id": "4b6bb5f7-f634-410e-815d-e673ab7f8632", "Level": 1, "Final answer": "THE CASTLE", "id": "level1-5", "web": "https://www.google.com/", "ques": "In Series 9, Episode 11 of Doctor Who, the Doctor is trapped inside an ever-shifting maze. What is this location called in the official script for the episode? Give the setting exactly as it appears in the first scene heading."}
{"task_id": "b816bfce-3d80-4913-a07d-69b752ce6377", "Level": 1, "Final answer": "fluffy", "id": "level1-6", "web": "https://www.google.com/", "ques": "In Emily Midkiff's June 2014 article in a journal named for the one of Hreidmar's sons that guarded his house, what word was quoted from two different authors in distaste for the nature of dragon depictions?"}
{"task_id": "72e110e7-464c-453c-a309-90a95aed6538", "Level": 1, "Final answer": "Guatemala", "id": "level1-7", "web": "https://www.google.com/", "ques": "Under DDC 633 on Bielefeld University Library's BASE, as of 2020, from what country was the unknown language article with a flag unique from the others?"}
{"task_id": "b415aba4-4b68-4fc6-9b89-2c812e55a3e1", "Level": 1, "Final answer": "diamond", "id": "level1-8", "web": "https://www.google.com/", "ques": "In Nature journal's Scientific Reports conference proceedings from 2012, in the article that did not mention plasmons or plasmonics, what nano-compound is studied? Don't use the prefix nano in your answer if there is one."}
{"task_id": "935e2cff-ae78-4218-b3f5-115589b19dae", "Level": 1, "Final answer": "research", "id": "level1-9", "web": "https://www.google.com/", "ques": "In the year 2022, and before December, what does \"R\" stand for in the three core policies of the type of content that was violated in the public logs on the Legume Wikipedia page?"}
{"task_id": "4fc2f1ae-8625-45b5-ab34-ad4433bc21f8", "Level": 1, "Final answer": "FunkMonk", "id": "level1-10", "web": "https://www.google.com/", "ques": "Who nominated the only Featured Article on English Wikipedia about a dinosaur that was promoted in November 2016?"}
{"task_id": "5188369a-3bbe-43d8-8b94-11558f909a08", "Level": 1, "Final answer": "Annie Levin", "id": "level1-11", "web": "https://www.google.com/", "ques": "What writer is quoted by Merriam-Webster for the Word of the Day from June 27, 2022?"}
{"task_id": "9d191bce-651d-4746-be2d-7ef8ecadb9c2", "Level": 1, "Final answer": "Extremely", "id": "level1-12", "web": "https://www.google.com/", "ques": "Examine the video at https://www.youtube.com/watch?v=1htKBjuUWec.\n\nWhat does Teal'c say in response to the question \"Isn't that hot?\""}
{"task_id": "cabe07ed-9eca-40ea-8ead-410ef5e83f91", "Level": 1, "Final answer": "Louvrier", "id": "level1-13", "web": "https://www.google.com/", "ques": "What is the surname of the equine veterinarian mentioned in 1.E Exercises from the chemistry materials licensed by Marisa Alviar-Agnew & Henry Agnew under the CK-12 license in LibreText's Introductory Chemistry materials as compiled 08/21/2023?"}
{"task_id": "d0633230-7067-47a9-9dbf-ee11e0a2cdd6", "Level": 1, "Final answer": "BaseLabelPropagation", "id": "level1-14", "web": "https://www.google.com/", "ques": "In the Scikit-Learn July 2017 changelog, what other predictor base command received a bug fix? Just give the name, not a path."}
{"task_id": "0383a3ee-47a7-41a4-b493-519bdefe0488", "Level": 1, "Final answer": "Rockhopper penguin", "id": "level1-15", "web": "https://www.google.com/", "ques": "On the BBC Earth YouTube video of the Top 5 Silliest Animal Moments, what species of bird is featured?"}
{"task_id": "11af4e1a-5f45-467d-9aeb-46f4bb0bf034", "Level": 1, "Final answer": "6", "id": "level1-16", "web": "https://www.google.com/", "ques": "How many more blocks (also denoted as layers) in BERT base encoder than the encoder from the architecture proposed in Attention is All You Need?"}
{"task_id": "7673d772-ef80-4f0f-a602-1bf4485c9b43", "Level": 1, "Final answer": "inference", "id": "level1-17", "web": "https://www.google.com/", "ques": "On Cornell Law School website's legal information institute, under the fifth section of federal rules alphabetically, what word was deleted in the last amendment to the first rule in the article that has \"witnesses\" in the most titles as of 2021?"}
{"task_id": "c365c1c7-a3db-4d5e-a9a1-66f56eae7865", "Level": 1, "Final answer": "Braintree, Honolulu", "id": "level1-18", "web": "https://www.google.com/", "ques": "Of the cities within the United States where U.S. presidents were born, which two are the farthest apart from the westernmost to the easternmost going east, giving the city names only? Give them to me in alphabetical order, in a comma-separated list"}
{"task_id": "7d4a7d1d-cac6-44a8-96e8-ea9584a70825", "Level": 1, "Final answer": "22", "id": "level1-19", "web": "https://www.google.com/", "ques": "According to Girls Who Code, how long did it take in years for the percentage of computer scientists that were women to change by 13% from a starting point of 37%?"}
{"task_id": "dc22a632-937f-4e6a-b72f-ba0ff3f5ff97", "Level": 1, "Final answer": "Five Hundred Things To Eat Before It's Too Late: and the Very Best Places to Eat Them", "id": "level1-20", "web": "https://www.google.com/", "ques": "What was the complete title of the book in which two James Beard Award winners recommended the restaurant where Ali Khan enjoyed a New Mexican staple in his cost-conscious TV show that started in 2015? Write the numbers in plain text if there are some in the title."}
{"task_id": "3f57289b-8c60-48be-bd80-01f8099ca449", "Level": 1, "Final answer": "519", "id": "level1-21", "web": "https://www.google.com/", "ques": "How many at bats did the Yankee with the most walks in the 1977 regular season have that same season?"}
{"task_id": "23dd907f-1261-4488-b21c-e9185af91d5e", "Level": 1, "Final answer": "2", "id": "level1-22", "web": "https://www.google.com/", "ques": "In Audre Lorde\u2019s poem \u201cFather Son and Holy Ghost\u201d, what is the number of the stanza in which some lines are indented?"}
{"task_id": "840bfca7-4f7b-481a-8794-c560c340185d", "Level": 1, "Final answer": "80GSFC21M0002", "id": "level1-23", "web": "https://www.google.com/", "ques": "On June 6, 2023, an article by Carolyn Collins Petersen was published in Universe Today. This article mentions a team that produced a paper about their observations, linked at the bottom of the article. Find this paper. Under what NASA award number was the work performed by R. G. Arendt supported by?"}
{"task_id": "a0068077-79f4-461a-adfe-75c1a4148545", "Level": 1, "Final answer": "90", "id": "level1-24", "web": "https://www.google.com/", "ques": "What was the actual enrollment count of the clinical trial on H. pylori in acne vulgaris patients from Jan-May 2018 as listed on the NIH website?"}
{"task_id": "bda648d7-d618-4883-88f4-3466eabd860e", "Level": 1, "Final answer": "Saint Petersburg", "id": "level1-25", "web": "https://www.google.com/", "ques": "Where were the Vietnamese specimens described by Kuznetzov in Nedoshivina's 2010 paper eventually deposited? Just give me the city name without abbreviations."}
{"task_id": "c61d22de-5f6c-4958-a7f6-5e9707bd3466", "Level": 2, "Final answer": "egalitarian", "id": "level2-0", "web": "https://www.google.com/", "ques": "A paper about AI regulation that was originally submitted to arXiv.org in June 2022 shows a figure with three axes, where each axis has a label word at both ends. Which of these words is used to describe a type of society in a Physics and Society article submitted to arXiv.org on August 11, 2016?"}
{"task_id": "17b5a6a3-bc87-42e8-b0fb-6ab0781ef2cc", "Level": 2, "Final answer": "34689", "id": "level2-1", "web": "https://www.google.com/", "ques": "I\u2019m researching species that became invasive after people who kept them as pets released them. There\u2019s a certain species of fish that was popularized as a pet by being the main character of the movie Finding Nemo. According to the USGS, where was this fish found as a nonnative species, before the year 2020? I need the answer formatted as the five-digit zip codes of the places the species was found, separated by commas if there is more than one place."}
{"task_id": "04a04a9b-226c-43fd-b319-d5e89743676f", "Level": 2, "Final answer": "41", "id": "level2-2", "web": "https://www.google.com/", "ques": "If we assume all articles published by Nature in 2020 (articles, only, not book reviews/columns, etc) relied on statistical significance to justify their findings and they on average came to a p-value of 0.04, how many papers would be incorrect as to their claims of statistical significance? Round the value up to the next integer."}
{"task_id": "14569e28-c88c-43e4-8c32-097d35b9a67d", "Level": 2, "Final answer": "backtick", "id": "level2-3", "web": "https://www.google.com/", "ques": "In Unlambda, what exact charcter or text needs to be added to correct the following code to output \"For penguins\"? If what is needed is a character, answer with the name of the character. If there are different names for the character, use the shortest. The text location is not needed. Code:\n\n`r```````````.F.o.r. .p.e.n.g.u.i.n.si"}
{"task_id": "3627a8be-a77f-41bb-b807-7e1bd4c0ebdf", "Level": 2, "Final answer": "142", "id": "level2-4", "web": "https://www.google.com/", "ques": "The object in the British Museum's collection with a museum number of 2012,5015.17 is the shell of a particular mollusk species. According to the abstract of a research article published in Science Advances in 2021, beads made from the shells of this species were found that are at least how many thousands of years old?"}
{"task_id": "7619a514-5fa8-43ef-9143-83b66a43d7a4", "Level": 2, "Final answer": "04/15/18", "id": "level2-5", "web": "https://www.google.com/", "ques": "According to github, when was Regression added to the oldest closed numpy.polynomial issue that has the Regression label in MM/DD/YY?"}
{"task_id": "2a649bb1-795f-4a01-b3be-9a01868dae73", "Level": 2, "Final answer": "3.1.3.1; 1.11.1.7", "id": "level2-6", "web": "https://www.google.com/", "ques": "What are the EC numbers of the two most commonly used chemicals for the virus testing method in the paper about SPFMV and SPCSV in the Pearl Of Africa from 2016? Return the semicolon-separated numbers in the order of the alphabetized chemicals."}
{"task_id": "87c610df-bef7-4932-b950-1d83ef4e282b", "Level": 2, "Final answer": "Morarji Desai", "id": "level2-7", "web": "https://www.google.com/", "ques": "In April of 1977, who was the Prime Minister of the first place mentioned by name in the Book of Esther (in the New International Version)?"}
{"task_id": "624cbf11-6a41-4692-af9c-36b3e5ca3130", "Level": 2, "Final answer": "So we had to let it die.", "id": "level2-8", "web": "https://www.google.com/", "ques": "What's the last line of the rhyme under the flavor name on the headstone visible in the background of the photo of the oldest flavor's headstone in the Ben & Jerry's online flavor graveyard as of the end of 2022?"}
{"task_id": "dd3c7503-f62a-4bd0-9f67-1b63b94194cc", "Level": 2, "Final answer": "6", "id": "level2-9", "web": "https://www.google.com/", "ques": "Use density measures from the chemistry materials licensed by Marisa Alviar-Agnew & Henry Agnew under the CK-12 license in LibreText's Introductory Chemistry materials as compiled 08/21/2023.\n\nI have a gallon of honey and a gallon of mayonnaise at 25C. I remove one cup of honey at a time from the gallon of honey. How many times will I need to remove a cup to have the honey weigh less than the mayonaise? Assume the containers themselves weigh the same."}
{"task_id": "f0f46385-fc03-4599-b5d3-f56496c3e69f", "Level": 2, "Final answer": "Indonesia, Myanmar", "id": "level2-10", "web": "https://www.google.com/", "ques": "In terms of geographical distance between capital cities, which 2 countries are the furthest from each other within the ASEAN bloc according to wikipedia? Answer using a comma separated list, ordering the countries by alphabetical order."}
{"task_id": "e4e91f1c-1dcd-439e-9fdd-cb976f5293fd", "Level": 2, "Final answer": "cloak", "id": "level2-11", "web": "https://www.google.com/", "ques": "I need to fact-check a citation. This is the citation from the bibliography:\n\nGreetham, David. \"Uncoupled: OR, How I Lost My Author(s).\" Textual Cultures: Texts, Contexts, Interpretation, vol. 3 no. 1, 2008, p. 45-46. Project MUSE, doi:10.2979/tex.2008.3.1.44.\n\nAnd this is the in-line citation:\n\nOur relationship with the authors of the works we read can often be \u201cobscured not by a \"cloak of print\" but by the veil of scribal confusion and mis-transmission\u201d (Greetham 45-46).\n\nDoes the quoted text match what is actually in the article? If Yes, answer Yes, otherwise, give me the word in my citation that does not match with the correct one (without any article)."}
{"task_id": "56137764-b4e0-45b8-9c52-1866420c3df5", "Level": 2, "Final answer": "Li Peng", "id": "level2-12", "web": "https://www.google.com/", "ques": "Which contributor to the version of OpenCV where support was added for the Mask-RCNN model has the same name as a former Chinese head of government when the names are transliterated to the Latin alphabet?"}
{"task_id": "8b3379c0-0981-4f5b-8407-6444610cb212", "Level": 2, "Final answer": "1.8", "id": "level2-13", "web": "https://www.google.com/", "ques": "What is the maximum length in meters of #9 in the first National Geographic short on YouTube that was ever released according to the Monterey Bay Aquarium website? Just give the number."}
{"task_id": "0ff53813-3367-4f43-bcbd-3fd725c1bf4b", "Level": 2, "Final answer": "beta geometric", "id": "level2-14", "web": "https://www.google.com/", "ques": "What two-word type of model did Manash Pratim Kashyap's and PS Fader's studies in customer retention studies published during 2018-2019 have in common (no punctuation)?"}
{"task_id": "a7feb290-76bb-4cb7-8800-7edaf7954f2f", "Level": 2, "Final answer": "31", "id": "level2-15", "web": "https://www.google.com/", "ques": "How many High Energy Physics - Lattice articles listed in January 2020 on Arxiv had ps versions available?"}
{"task_id": "b4cc024b-3f5e-480e-b96a-6656493255b5", "Level": 2, "Final answer": "Russian-German Legion", "id": "level2-16", "web": "https://www.google.com/", "ques": "The photograph in the Whitney Museum of American Art's collection with accession number 2022.128 shows a person holding a book. Which military unit did the author of this book join in 1813? Answer without using articles."}
{"task_id": "33d8ea3b-6c6b-4ff1-803d-7e270dea8a57", "Level": 2, "Final answer": "2", "id": "level2-17", "web": "https://www.google.com/", "ques": "What is the minimum number of page links a person must click on to go from the english Wikipedia page on The Lord of the Rings (the book) to the english Wikipedia page on A Song of Ice and Fire (the book series)? In your count, include each link you would click on to get to the page. Use the pages as they appeared at the end of the day on July 3, 2023."}
{"task_id": "e8cb5b03-41e0-4086-99e5-f6806cd97211", "Level": 2, "Final answer": "shrimp", "id": "level2-18", "web": "https://www.google.com/", "ques": "I went to Virtue restaurant & bar in Chicago for my birthday on March 22, 2021 and the main course I had was delicious!  Unfortunately, when I went back about a month later on April 21, it was no longer on the dinner menu.  Using the Wayback Machine, can you help me figure out which main course was on the dinner menu for Virtue on March 22, 2021 but not April 21, 2021? Answer using the singular form, without articles."}
{"task_id": "f46b4380-207e-4434-820b-f32ce04ae2a4", "Level": 2, "Final answer": "Harbinger, Tidal", "id": "level2-19", "web": "https://www.google.com/", "ques": "It is 1999. Before you party like it is 1999, please assist me in settling a bet.\n\nFiona Apple and Paula Cole released albums prior to 1999. Of these albums, which didn't receive a letter grade from Robert Christgau? Provide your answer as a comma delimited list of album titles, sorted alphabetically."}
{"task_id": "05407167-39ec-4d3a-a234-73a9120c325d", "Level": 2, "Final answer": "Format Document", "id": "level2-20", "web": "https://www.google.com/", "ques": "In the 2018 VSCode blog post on replit.com, what was the command they clicked on in the last video to remove extra lines?"}
{"task_id": "b9763138-c053-4832-9f55-86200cb1f99c", "Level": 2, "Final answer": "3", "id": "level2-21", "web": "https://www.google.com/", "ques": "Compute the check digit the Tropicos ID for the Order Helotiales would have if it were an ISBN-10 number."}
{"task_id": "16d825ff-1623-4176-a5b5-42e0f5c2b0ac", "Level": 2, "Final answer": "6:41 PM", "id": "level2-22", "web": "https://www.google.com/", "ques": "What time was the Tri-Rail train that carried the most passengers on May 27, 2019 scheduled to arrive in Pompano Beach? Express your answer in the 12-hour digital clock format without leading zero if any, and include whether it is AM or PM."}
{"task_id": "544b7f0c-173a-4377-8d56-57b36eb26ddf", "Level": 2, "Final answer": "A Nightmare on Elm Street", "id": "level2-23", "web": "https://www.google.com/", "ques": "In Valentina Re\u2019s contribution to the 2017 book \u201cWorld Building: Transmedia, Fans, Industries\u201d, what horror movie does the author cite as having popularized metalepsis between a dream world and reality? Use the complete name with article if any."}
{"task_id": "6b078778-0b90-464d-83f6-59511c811b01", "Level": 2, "Final answer": "Alfonso Visconti", "id": "level2-24", "web": "https://www.google.com/", "ques": "The Metropolitan Museum of Art has a portrait in its collection with an accession number of 29.100.5. Of the consecrators and co-consecrators of this portrait's subject as a bishop, what is the name of the one who never became pope?"}
{"task_id": "08cae58d-4084-4616-b6dd-dd6534e4825b", "Level": 2, "Final answer": "2018", "id": "level2-25", "web": "https://www.google.com/", "ques": "According to Google Finance, when was the first year the Apple stock went above $50 (without adjusting for stock split)?"}
{"task_id": "2dfc4c37-fec1-4518-84a7-10095d30ad75", "Level": 2, "Final answer": "6", "id": "level2-26", "web": "https://www.google.com/", "ques": "According to Box Office Mojo's 2020 Worldwide Box Office list, how many of the top 10 highest-grossing worldwide movies are also on the top 10 highest-grossing domestic movies? Your answer should be a numerical integer value."}
{"task_id": "9f41b083-683e-4dcf-9185-ccfeaa88fa45", "Level": 2, "Final answer": "0", "id": "level2-27", "web": "https://www.google.com/", "ques": "How many pages if the 2023 IPCC report (85 pages version) mentions nuclear energy?"}
{"task_id": "ecbc4f94-95a3-4cc7-b255-6741a458a625", "Level": 2, "Final answer": "13", "id": "level2-28", "web": "https://www.google.com/", "ques": "How many images are there in the latest 2022 Lego english wikipedia article?"}
{"task_id": "71345b0a-9c7d-4b50-b2bf-937ec5879845", "Level": 2, "Final answer": "Here be dragons", "id": "level2-29", "web": "https://www.google.com/", "ques": "On a leap day before the year 2008, a joke was removed from the Wikipedia page for \u201cDragon\u201d. What was the phrase that was removed? Give the phrase as it appeared on the page, but without punctuation."}
{"task_id": "7b5377b0-3f38-4103-8ad2-90fe89864c04", "Level": 2, "Final answer": "563.9", "id": "level2-30", "web": "https://www.google.com/", "ques": "Find the value of x to the nearest tenth: Lx = (d/dx * (A * x-squared)) + 4-thousand'n'ninety-7 minus C\nWhere L is the last two digits of the year of the Venezuelan Declaration of Independence,\nA is the number of colors in the TikTok logo as of July 2023, excluding black and white,\nand C is the height of the average woman in the Philippines according to a July 2023 Business Insider article, rounded to the nearest whole centimeter"}
{"task_id": "114d5fd0-e2ae-4b6d-a65a-870da2d19c08", "Level": 2, "Final answer": "4", "id": "level2-31", "web": "https://www.google.com/", "ques": "In the endnote found in the second-to-last paragraph of page 11 of the book with the doi 10.2307/j.ctv9b2xdv, what date in November was the Wikipedia article accessed? Just give the day of the month."}
{"task_id": "ad37a656-079a-49f9-a493-7b739c9167d1", "Level": 2, "Final answer": "Bravo", "id": "level2-32", "web": "https://www.google.com/", "ques": "On July 15, 2008, Phys.org published an article about a catastrophe. Find the explosive force of this catastrophe according to Encyclopedia Britannica, then find the name of the US nuclear test that had the same yield. Your answer should only be the last word of the name of the test."}
{"task_id": "f3917a3d-1d17-4ee2-90c5-683b072218fe", "Level": 2, "Final answer": "2732", "id": "level2-33", "web": "https://www.google.com/", "ques": "How many edits were made to the Wikipedia page on Antidisestablishmentarianism from its inception until June of 2023?"}
{"task_id": "48eb8242-1099-4c26-95d4-ef22b002457a", "Level": 2, "Final answer": "6", "id": "level2-34", "web": "https://www.google.com/", "ques": "How many nonindigenous crocodiles were found in Florida from the year 2000 through 2020? You can get the data from the USGS Nonindigenous Aquatic Species database."}
{"task_id": "c8b7e059-c60d-472e-ad64-3b04ae1166dc", "Level": 2, "Final answer": "8", "id": "level2-35", "web": "https://www.google.com/", "ques": "The work referenced in footnote 397 of Federico Lauria's 2014 dissertation is also the source for the titles of two paintings in the Smithsonian American Art Museum's collection, as of August 2023. What is the absolute difference between the chapter numbers of the chapters that the titles of these two paintings quote?"}
{"task_id": "d1af70ea-a9a4-421a-b9cc-94b5e02f1788", "Level": 2, "Final answer": "736455", "id": "level2-36", "web": "https://www.google.com/", "ques": "As of the 2020 census, what was the population difference between the largest county seat and smallest county seat, by land area of the county seat, in Washington state? For population figures, please use the official data from data.census.gov. Please report the integer difference."}
{"task_id": "ded28325-3447-4c56-860f-e497d6fb3577", "Level": 2, "Final answer": "Picnic is in Polybius Plaza.", "id": "level2-37", "web": "https://www.google.com/", "ques": "This is a secret message my friend gave me. It says where we should meet for our picnic on Friday. The only problem is, it\u2019s encrypted in the Caesar cipher, so I can\u2019t read it. Can you tell me what it says? This is the message:\n\nZsmxsm sc sx Zyvilsec Zvkjk."}
{"task_id": "d700d50d-c707-4dca-90dc-4528cddd0c80", "Level": 2, "Final answer": "Roger Miller", "id": "level2-38", "web": "https://www.google.com/", "ques": "Who composed the song that was performed by a rooster and a hamster in separate animated videos at separate tempos with different lyrics? Answer using the format First name Last name."}
{"task_id": "0a3cd321-3e76-4622-911b-0fda2e5d6b1a", "Level": 2, "Final answer": "Brunei, China, Morocco, Singapore", "id": "level2-39", "web": "https://www.google.com/", "ques": "According to the World Bank, which countries had gross savings of over 35% of GDP for every year in the period 2001-2010? Give your answer as a comma-separated list of countries in alphabetical order. Use the countries most common names in english when answering."}
{"task_id": "f2feb6a4-363c-4c09-a804-0db564eafd68", "Level": 2, "Final answer": "900000", "id": "level2-40", "web": "https://www.google.com/", "ques": "I\u2019m thinking about selling my home, so I want to learn more about how homes in my area sold recently. I live in Pearl City, Hawaii, which is on the island of Oahu. I know two homes near me that sold in 2022 were 2072 Akaikai Loop, and 2017 Komo Mai Drive. Find which of those homes sold for more in 2022, and tell me how much it sold for. Don\u2019t put commas or decimal places in the answer."}
{"task_id": "0b260a57-3f3a-4405-9f29-6d7a1012dbfb", "Level": 2, "Final answer": "0.269", "id": "level2-41", "web": "https://www.google.com/", "ques": "On ScienceDirect, what is the difference to 3 decimal places in the sample standard deviations of the number of Reference Works in each Life Science domain compared to Health Sciences as of 2022?"}
{"task_id": "ed58682d-bc52-4baa-9eb0-4eb81e1edacc", "Level": 2, "Final answer": "stare", "id": "level2-42", "web": "https://www.google.com/", "ques": "What is the last word before the second chorus of the King of Pop's fifth single from his sixth studio album?"}
{"task_id": "023e9d44-96ae-4eed-b912-244ee8c3b994", "Level": 2, "Final answer": "8", "id": "level2-43", "web": "https://www.google.com/", "ques": "It's May 2023, and I'm about to drive across the U.S. from California to Maine. I always recycle my water bottles at the end of a trip, and I drink 5 12-ounce water bottles for every 100 miles I travel, rounded to the nearest 100. Assuming I follow I-40 from Los Angeles to Cincinnati, then take I-90 from Cincinnati to Augusta, how many dollars will I get back according to Wikipedia?"}
{"task_id": "0e9e85b8-52b9-4de4-b402-5f635ab9631f", "Level": 2, "Final answer": "1927", "id": "level2-44", "web": "https://www.google.com/", "ques": "What is the latest chronological year date written in the image on the webpage found when following the first citation reference link on the latest version of Carl Nebel's Wikipedia page as of August 2023?"}
{"task_id": "20194330-9976-4043-8632-f8485c6c71b2", "Level": 2, "Final answer": "4", "id": "level2-45", "web": "https://www.google.com/", "ques": "The YouTube channel Game Grumps began a Let\u2019s Play of the game Sonic the Hedgehog (2006) in the year 2012. Thirty seconds into the first episode, a phrase is shown on the screen in white letters on a red background. How many times does the letter \"E\" appear in this phrase?"}
{"task_id": "65638e28-7f37-4fa7-b7b9-8c19bb609879", "Level": 2, "Final answer": "Kleinpaul", "id": "level2-46", "web": "https://www.google.com/", "ques": "The book with the doi 10.1353/book.24372 concerns a certain neurologist. According to chapter 2 of the book, what author influenced this neurologist\u2019s belief in \u201cendopsychic myths\u201d? Give the last name only."}
{"task_id": "3ff6b7a9-a5bd-4412-ad92-0cd0d45c0fee", "Level": 2, "Final answer": "56000", "id": "level2-47", "web": "https://www.google.com/", "ques": "The longest-lived vertebrate is named after an island.  According to Wikipedia as of January 1, 2021, what is the 2020 estimated population of that island, to the nearest thousand?"}
{"task_id": "708b99c5-e4a7-49cb-a5cf-933c8d46470d", "Level": 2, "Final answer": "Citations", "id": "level2-48", "web": "https://www.google.com/", "ques": "On the DeepFruits fruit detection graph on Connected Papers from 2016, what feature caused the largest bubble to be the size it is?"}
{"task_id": "0a65cb96-cb6e-4a6a-8aae-c1084f613456", "Level": 2, "Final answer": "Holabird", "id": "level2-49", "web": "https://www.google.com/", "ques": "During the first week of August 2015, one of the NASA Astronomy Pictures of the Day shows the lights of a city on the horizon. The namesake of this city also has a landmark building in Chicago named after him. What is the name of the architectural firm that designed this landmark building? Give the first name appearing in the name of the firm as of June 2023."}
{"task_id": "65da0822-a48a-4a68-bbad-8ed1b835a834", "Level": 2, "Final answer": "Santa Clara, Boston", "id": "level2-50", "web": "https://www.google.com/", "ques": "All of the individuals who formally held the position of United States secretary of homeland security prior to April 2019, excluding those who held the position in an acting capacity, have a bachelor's degree. Of the universities that these bachelor's degrees were from, which is the westernmost university and which is the easternmost university? Give them to me as a comma-separated list, I only want the name of the cities where the universities are located, with the westernmost city listed first."}
{"task_id": "73c1b9fe-ee1d-4cf4-96ca-35c08f97b054", "Level": 2, "Final answer": "1954", "id": "level2-51", "web": "https://www.google.com/", "ques": "According to the USGS, in what year was the American Alligator first found west of Texas (not including Texas)?"}
{"task_id": "e2d69698-bc99-4e85-9880-67eaccd66e6c", "Level": 2, "Final answer": "Michele Fitzgerald", "id": "level2-52", "web": "https://www.google.com/", "ques": "As of August 2023, who is the only winner of the US version of Survivor to be born in the month of May?"}
{"task_id": "a56f1527-3abf-41d6-91f8-7296d6336c3f", "Level": 2, "Final answer": "185", "id": "level2-53", "web": "https://www.google.com/", "ques": "The cover of the August 2021 issue of Vogue shows a famous landmark in the background behind some trees. How tall is this monument in yards, rounded to the nearest yard? Give the number only."}
{"task_id": "42d4198c-5895-4f0a-b0c0-424a66465d83", "Level": 2, "Final answer": "60", "id": "level2-54", "web": "https://www.google.com/", "ques": "I'm curious about how much information is available for popular video games before their release. Find the Wikipedia page for the 2019 game that won the British Academy Games Awards. How many revisions did that page have before the month listed as the game's release date on that Wikipedia page (as of the most recent entry from 2022)?"}
{"task_id": "a26649c6-1cb2-470a-871e-6910c64c3e53", "Level": 2, "Final answer": "116", "id": "level2-55", "web": "https://www.google.com/", "ques": "What is the absolute difference in tens of thousands between the population of chinstrap penguins on the Wikipedia page for penguin species populations as of the end of 2018 and the population recorded in the Nature.com \"global population assessment of the Chinstrap penguin\" article from 2020, assuming two penguins per breeding pair?"}
{"task_id": "d5141ca5-e7a0-469f-bf3e-e773507c86e2", "Level": 2, "Final answer": "19/02/2009", "id": "level2-56", "web": "https://www.google.com/", "ques": "When was a picture of St. Thomas Aquinas first added to the Wikipedia page on the Principle of double effect? Answer using the format DD/MM/YYYY."}
{"task_id": "1dcc160f-c187-48c2-b68e-319bd4354f3d", "Level": 2, "Final answer": "3", "id": "level2-57", "web": "https://www.google.com/", "ques": "According to Openreview.net, at the NeurIPS 2022 Conference, how many papers by an author named Yuri were accepted with a \"certain\" recommendation?"}
{"task_id": "e0c10771-d627-4fd7-9694-05348e54ee36", "Level": 2, "Final answer": "234.9", "id": "level2-58", "web": "https://www.google.com/", "ques": "Take the gender split from the 2011 Bulgarian census about those who have completed tertiary education. Subtract the smaller number from the larger number, then return the difference in thousands of women. So if there were 30.1 thousand more men, you'd give \"30.1\""}
{"task_id": "e29834fd-413a-455c-a33e-c3915b07401c", "Level": 2, "Final answer": "21", "id": "level2-59", "web": "https://www.google.com/", "ques": "I'd like to learn more about some popular reality television competition shows. As of the end of the 44th season of the American version of Survivor, how many more unique winners have there been compared to the number of winners of American Idol?"}
{"task_id": "08c0b6e9-1b43-4c2e-ae55-4e3fce2c2715", "Level": 2, "Final answer": "orange, white", "id": "level2-60", "web": "https://www.google.com/", "ques": "In the film Goldfinger, what color was the object that James Bond concealed himself and his companion Pussy Galore at the end of the film? If there are multiple colors, put them in a comma-separated list in alphabetical order."}
{"task_id": "db4fd70a-2d37-40ea-873f-9433dc5e301f", "Level": 2, "Final answer": "10", "id": "level2-61", "web": "https://www.google.com/", "ques": "As of May 2023, how many stops are between South Station and Windsor Gardens on MBTA\u2019s Franklin-Foxboro line (not included)?"}
{"task_id": "853c8244-429e-46ca-89f2-addf40dfb2bd", "Level": 2, "Final answer": "11", "id": "level2-62", "web": "https://www.google.com/", "ques": "In the 2015 Metropolitan Museum of Art exhibition titled after the Chinese zodiac animal of 2015, how many of the \"twelve animals of the Chinese zodiac\" have a hand visible?"}
{"task_id": "7a4a336d-dcfa-45a0-b014-824c7619e8de", "Level": 2, "Final answer": "1:41.614", "id": "level2-63", "web": "https://www.google.com/", "ques": "At the two-minute mark in the YouTube video uploaded by the channel \u201cGameGrumps\u201d on May 14, 2017 as part of their playthrough of the game Mario Kart 8 Deluxe, the shows\u2019 hosts are competing on one of the game\u2019s racetracks. What was the world record time for that track in the game\u2019s 150cc mode as of June 7, 2023? Express your answer in minutes and seconds, rounding the seconds to the nearest hundredth, e.g. 1:01.001."}


================================================
FILE: packages/evals/datasets/onlineMind2Web/onlineMind2Web.jsonl
================================================
{"task_id": "b7258ee05d75e6c50673a59914db412e", "confirmed_task": "Find the store location and hours of the closest Gamestop to zip code 90028 and set it as the home store on Gamestop.", "website": "https://www.gamestop.com/", "reference_length": 8, "level": "medium"}
{"task_id": "ade4c09ad3fdb1607209750924cd232f", "confirmed_task": "Compare available plans for the AeroAPI on Flightaware.", "website": "https://www.flightaware.com/", "reference_length": 4, "level": "easy"}
{"task_id": "fb7b4f784cfde003e2548fdf4e8d6b4f", "confirmed_task": "Open the page with an overview of the submission of releases on Discogs.", "website": "https://www.discogs.com/", "reference_length": 6, "level": "medium"}
{"task_id": "824eb7bb0ef1ce40bfd49c12182d9428", "confirmed_task": "Get the lowest priced women's plus size one piece swimsuit in color black with a customer rating of at least 5 on Kohls.", "website": "https://www.kohls.com/", "reference_length": 13, "level": "hard"}
{"task_id": "046138801a05ddf56ad94e8672942496", "confirmed_task": "Find discussions of the community and open one with the most replies on Flightaware.", "website": "https://www.flightaware.com/", "reference_length": 6, "level": "medium"}
{"task_id": "92a3d4236f167af4afdc08876a902ba6", "confirmed_task": "Find a 2022 Tesla Model 3 on CarMax.", "website": "https://www.carmax.com/", "reference_length": 10, "level": "medium"}
{"task_id": "48c73f3f53e2611c4a1052457c1033db", "confirmed_task": "Get the report from the final environmental impact statement for the Jamaica Bus Depot expansion on new.mta.info.", "website": "https://new.mta.info/", "reference_length": 10, "level": "medium"}
{"task_id": "8f2611047de227a2ca8bda13f6e2e5fb", "confirmed_task": "Find the used 2012-2013 Honda Crosstour with the lowest mileage for under $25,000 near zip code 49102 on CarGurus.", "website": "https://www.cargurus.com/", "reference_length": 17, "level": "hard"}
{"task_id": "b320c68bffc1f3c7f2a8dc9d5478fb27", "confirmed_task": "Find a walkthrough for the game \"The Legend of Zelda: Breath of the Wild\" on ign.", "website": "https://www.ign.com/", "reference_length": 6, "level": "medium"}
{"task_id": "aa4b5cb7114fcc138ade82b4b9716d24", "confirmed_task": "Find an editor's choice review with a score of 10 in the boardgame category on ign.", "website": "https://www.ign.com/", "reference_length": 8, "level": "medium"}
{"task_id": "005be9dd91c95669d6ddde9ae667125c", "confirmed_task": "Find the weight of baggage allowance for economy class on Qatar Airways.", "website": "https://www.qatarairways.com/", "reference_length": 4, "level": "easy"}
{"task_id": "323bd85e3559655d89e5496b951a25e8", "confirmed_task": "Tell me information about what identification I need to bring on my trip on Amtrak.", "website": "https://www.amtrak.com/", "reference_length": 6, "level": "medium"}
{"task_id": "123e8c2fc453f55fadd1d0b9aaf94df4", "confirmed_task": "Browse used Audi cars made before 2015 and sort by lowest price on KBB.", "website": "https://www.kbb.com/", "reference_length": 8, "level": "medium"}
{"task_id": "56f8890a837c49f7df766b9c981646f3", "confirmed_task": "Show crazy credits for the movie \" Prometheus\" on IMDb.", "website": "https://www.imdb.com/", "reference_length": 6, "level": "medium"}
{"task_id": "644a856c3897665e475e0dce50bf217d", "confirmed_task": "Find a pair of wireless headphones on Amazon with active noise canceling for $100 or less and add them to the cart.", "website": "https://www.amazon.com/", "reference_length": 8, "level": "medium"}
{"task_id": "62f1626ce249c31098854f8b38bdd6cf", "confirmed_task": "Find Playstation 5 digital edition on gamestop.", "website": "https://www.gamestop.com/", "reference_length": 6, "level": "medium"}
{"task_id": "561693d6eec7bbfba3fefe9e4b26decb", "confirmed_task": "Browse Marriott Bonvoy credit cards on Marriott.", "website": "https://www.marriott.com/", "reference_length": 4, "level": "easy"}
{"task_id": "b7a9a6b5d451164c09bbd27b670bc2ae", "confirmed_task": "Show me the list of Men's Blazers, Black, Size M on Uniqlo.", "website": "https://www.uniqlo.com/", "reference_length": 11, "level": "hard"}
{"task_id": "bfa2de159be6978acf2702be31a2eeeb", "confirmed_task": "Show me the options for a roundtrip leaving from Las Vegas on flexible dates on the interactive map on united.", "website": "https://www.united.com/", "reference_length": 12, "level": "hard"}
{"task_id": "4091bdd3fa64a5b0d912bc08eaf9c824", "confirmed_task": "Find the list of neighborhood maps for Brooklyn on new.mta.info.", "website": "https://new.mta.info/", "reference_length": 5, "level": "easy"}
{"task_id": "79f0bd7df6e685f30f20025cc6755c0a", "confirmed_task": "Find me the cheapest external Hard Drive for an Xbox One on GameStop.", "website": "https://www.gamestop.com/", "reference_length": 13, "level": "hard"}
{"task_id": "6ebde509dca8f15c0fa1bd74f071e8d6", "confirmed_task": "Search for a job in Miami, Florida, in Human Resources on target.", "website": "https://www.target.com/", "reference_length": 14, "level": "hard"}
{"task_id": "34ccd15a8ea8fd3895af83f5ccf62369", "confirmed_task": "Find out what to do when I lose an item on a bus on us.megabus.", "website": "https://us.megabus.com/", "reference_length": 3, "level": "easy"}
{"task_id": "c698ff3fc0f6cbce39947c597ab5749b", "confirmed_task": "Browse the page with event planning tips on Eventbrite.", "website": "https://www.eventbrite.com/", "reference_length": 5, "level": "easy"}
{"task_id": "b6d10e9bd19b4009a02dea0e98f4e1ae", "confirmed_task": "Check the current standings for MLS on Fox Sports.", "website": "https://www.foxsports.com/", "reference_length": 4, "level": "easy"}
{"task_id": "d71be72aa25c3eab8eea47a0e60382e2", "confirmed_task": "Find technical specs for the latest Macbook Air on Apple.", "website": "https://www.apple.com/", "reference_length": 4, "level": "easy"}
{"task_id": "0b51b4fa0295ae80ccd176ebdad6fff6", "confirmed_task": "Search for a red Toyota Corolla from model years 2018 to 2023 on CarMax.", "website": "https://www.carmax.com/", "reference_length": 13, "level": "hard"}
{"task_id": "3f312ae3efc3c3e90ababe050dd4e7ae", "confirmed_task": "Find the current NFL standings for the AFC East division on NFL.com and go to the page on which team is in first place.", "website": "https://www.nfl.com/", "reference_length": 4, "level": "easy"}
{"task_id": "95cad96f2e43f3c0d8efad1331c77c8c", "confirmed_task": "View the list of the Most Popular TV on rotten tomatoes.", "website": "https://www.rottentomatoes.com/", "reference_length": 3, "level": "easy"}
{"task_id": "bf3b311cc8dce16d3de844f4b5875dfd", "confirmed_task": "Compare Apple watches and  learn more about the ultra version on apple.", "website": "https://www.apple.com/", "reference_length": 4, "level": "easy"}
{"task_id": "b64f938af842f6a1b4489d0e49a785a7", "confirmed_task": "Get the frozen vegan cheese pizza between 5 to 10 USD on Target.", "website": "https://www.target.com/", "reference_length": 17, "level": "hard"}
{"task_id": "5e1b8254c123c80178cc28e0afdb14f0", "confirmed_task": "Find a help page about buying tickets on seatgeek.", "website": "https://seatgeek.com/", "reference_length": 4, "level": "easy"}
{"task_id": "f27c0a7b8b0bb33d37698dff227fc8d7", "confirmed_task": "Browse used Mercedes-Benz cars from model years 2004 to 2012 on KBB and sort by highest price.", "website": "https://www.kbb.com/", "reference_length": 11, "level": "hard"}
{"task_id": "8fdec8eeffd3491e6526cc78c028120b", "confirmed_task": "See Nissan and Honda cars for sale near Kentwood, MI 49512 on CarMax.", "website": "https://www.carmax.com/", "reference_length": 12, "level": "hard"}
{"task_id": "7b182a5087347d494b48a29dbc0f1d3e", "confirmed_task": "Find a shelter or rescue group near zip code 90011.", "website": "https://www.adoptapet.com/", "reference_length": 4, "level": "easy"}
{"task_id": "828c2d98616a9478d5864d847d5a1b28", "confirmed_task": "Browse the list of Civil Division forms.", "website": "https://www.justice.gov/", "reference_length": 4, "level": "easy"}
{"task_id": "608c595eec271fa5dc03506923519994", "confirmed_task": "Calculate a FedEx Ground shipping rate for a 3-pound package from zip code 10019 to zip code 90028.", "website": "https://www.fedex.com/en-us/home.html", "reference_length": 9, "level": "medium"}
{"task_id": "a7a73c8fa75441fc76df9746c327bdd6", "confirmed_task": "Estimate the cost of a photographer in 07055 for a 4-hour project.", "website": "https://www.thumbtack.com/", "reference_length": 8, "level": "medium"}
{"task_id": "cfafe3771369d1d261e9f7ecd44c296d", "confirmed_task": "Find the highest-rated dealer for Cadillac with a rating above 4 stars within 20 miles of zip 60606.", "website": "https://www.cars.com/", "reference_length": 6, "level": "medium"}
{"task_id": "bbbc243b4f18a7a897f0bc84e11d293f", "confirmed_task": "Find out how many assists Chris Paul has been averaging in the current season.", "website": "https://www.nba.com/", "reference_length": 4, "level": "easy"}
{"task_id": "816851ff92ff0219acf4364dcc2c4692", "confirmed_task": "Search for boys' infant pajamas below $40.", "website": "https://www.macys.com/", "reference_length": 10, "level": "medium"}
{"task_id": "8244409b2c82043f966cad05f9afe132", "confirmed_task": "Find the best Audiologist within 50 miles of New York, NY, with a rating of 4 and above.", "website": "https://doctor.webmd.com/", "reference_length": 13, "level": "hard"}
{"task_id": "e7301bb694871429bf2eb36c3a72186c", "confirmed_task": "Find baby shoes priced under $20 with a 5-star rating.", "website": "https://www.macys.com/", "reference_length": 6, "level": "medium"}
{"task_id": "905cb53061c33aa2d77e485fe1fca516", "confirmed_task": "Browse dermatologists within 10 miles of zip code 10019 and filter by only those who accept Blue Medicare Advantage.", "website": "https://www.healthgrades.com/", "reference_length": 11, "level": "hard"}
{"task_id": "fcf4952d2a1d80ea505c555c3c3b54e7", "confirmed_task": "Find the cheapest used  8-cylinder bmw made between 2005-2015 and priced from 25,000 to  50,000 dollars with mileage less than 50,000 miles or less.", "website": "https://www.cars.com/", "reference_length": 11, "level": "hard"}
{"task_id": "3c1ffc3f494e423b3c434c79e35da8f3", "confirmed_task": "Find 12 Monkeys community and view the latest posts mentioning James Cole.", "website": "https://www.reddit.com/", "reference_length": 6, "level": "medium"}
{"task_id": "26a0e5c21c145dd8448aa92f35bec5ea", "confirmed_task": "Browse optometrists who offer telehealth services in Columbus, OH.", "website": "https://www.healthgrades.com/", "reference_length": 3, "level": "easy"}
{"task_id": "070c907d34a4ce71dfdbea38f9c5d4d8", "confirmed_task": "Find a dentist who specializes in pediatric dentistry and is located near zip code 90210 (within 5-mile distance).", "website": "https://www.healthgrades.com/", "reference_length": 7, "level": "medium"}
{"task_id": "43a1ca251f11c6b0bdd0379766cc49e6", "confirmed_task": "Find a neurosurgeon who is over 50 years old and has an appointment available tomorrow.", "website": "https://www.healthgrades.com/", "reference_length": 8, "level": "medium"}
{"task_id": "b3f8bd9198d9d157e0848109563c4b23", "confirmed_task": "Find a permanent job in Logistics within 20 miles of New York, zip 11005, in the middle-income range for a high school diploma holder.", "website": "https://ohiomeansjobs.ohio.gov/", "reference_length": 15, "level": "hard"}
{"task_id": "20a460a8fe1971b84411c5b1e6ac4186", "confirmed_task": "Show theatre events for Las Vegas and select one.", "website": "https://www.stubhub.com/", "reference_length": 3, "level": "easy"}
{"task_id": "db1ffb5e60578597d1c3aa3c389ac7b1", "confirmed_task": "Search for smart TVs with a screen size of 55 to 65 inches and filter the results to show only those that have an LED display.", "website": "https://www.google.com/shopping?udm=28", "reference_length": 5, "level": "easy"}
{"task_id": "7be8cd8dba885cddd9af5320f49bc41b", "confirmed_task": "Find roofing contractors within 5 miles of zip code 10002.", "website": "https://www.bbb.org/", "reference_length": 9, "level": "medium"}
{"task_id": "239a29bde438fe44fe17fe1390ef1634", "confirmed_task": "Find me a gluten-free diet to lose weight for a pregnant woman.", "website": "https://www.healthline.com/", "reference_length": 8, "level": "medium"}
{"task_id": "9f1cba613830ca1c6a58f9498c06e679", "confirmed_task": "Find a premier real estate agent in St Augustine, FL.", "website": "https://www.redfin.com/", "reference_length": 4, "level": "easy"}
{"task_id": "75146b7b67388b9244e0f21a1527c022", "confirmed_task": "Find a male senior boxer near zip code 90028.", "website": "https://www.adoptapet.com/", "reference_length": 10, "level": "medium"}
{"task_id": "59b7b990b4828bc305ab0d7ed6071b55", "confirmed_task": "Get owner-financing homesite land for sale in New Mexico, Luna County,  listed in the last 30 days, and contact the cheapest per acre land seller.", "website": "https://www.landwatch.com/", "reference_length": 9, "level": "medium"}
{"task_id": "9c97bab9c2abfb90a426cbe9addae8d0", "confirmed_task": "Check the details of order 12345 with email 12345@gmail.com.", "website": "https://www.macys.com/", "reference_length": 4, "level": "easy"}
{"task_id": "871e7771cecb989972f138ecc373107b", "confirmed_task": "Find the weather for Vancouver, British Columbia for the next seven days.", "website": "https://www.theweathernetwork.com/", "reference_length": 3, "level": "easy"}
{"task_id": "b69eb4de621e9e265676daac44938f3f", "confirmed_task": "Find an adult husky near zip code 10019.", "website": "https://www.adoptapet.com/", "reference_length": 8, "level": "medium"}
{"task_id": "9bb63ad0e38d5691a618932a8b31c05a", "confirmed_task": "Look for reviews of a Nest Hello Video Doorbell and filter by 1-star ratings.", "website": "https://www.google.com/shopping?udm=28", "reference_length": 5, "level": "easy"}
{"task_id": "8ae510355d978424f490798f900bfa2c", "confirmed_task": "Show me the shared rooms in any university in Melbourne that has a private bathroom wifi, and gas included in the bills.", "website": "https://www.student.com/", "reference_length": 9, "level": "medium"}
{"task_id": "4c186c6ed888d0c8d4cf4adb39443080", "confirmed_task": "Find a medium Devin Booker jersey and add it to the shopping cart.", "website": "https://www.nba.com/", "reference_length": 6, "level": "medium"}
{"task_id": "2fc51dd3febd447f0fdcdabca8d944ce", "confirmed_task": "Locate a self-storage unit near zip code 60538 that can fit about a dorm room full of items and is climate-controlled.", "website": "https://www.extraspace.com/", "reference_length": 9, "level": "medium"}
{"task_id": "eb323dc584156d0eb3a2b90bb8c4b791", "confirmed_task": "Find the latest 2 bed and 1.5+ bath apartment listing for rent in New York.", "website": "https://www.redfin.com/", "reference_length": 12, "level": "hard"}
{"task_id": "87f4c5128e36cdb9366a138a7b61bb00", "confirmed_task": "View the speakers that are bluetooth and wireless and filter the results to only show models that are on sale and cost less than $50.", "website": "https://www.bestbuy.com/", "reference_length": 6, "level": "medium"}
{"task_id": "354b4ddf048815f8fd4163d0d7e1aaa3", "confirmed_task": "Browse marketing jobs and filter by Bachelor's Degree education level.", "website": "https://ohiomeansjobs.ohio.gov/", "reference_length": 6, "level": "medium"}
{"task_id": "e4e097222d13a2560db6f6892612dab6", "confirmed_task": "Search for a young spayed male dog cared for by a private owner within 50 miles of zip 33109.", "website": "https://www.adoptapet.com/", "reference_length": 6, "level": "medium"}
{"task_id": "f389398d2eeb29e5571e00439c57eb76", "confirmed_task": "Find the latest climate news.", "website": "https://www.theweathernetwork.com/", "reference_length": 3, "level": "easy"}
{"task_id": "8ea6c3a2ea3f59150619935261a76d19", "confirmed_task": "Find a staffed FedEx location near zip code 10019 to return a package.", "website": "https://www.fedex.com/en-us/home.html", "reference_length": 7, "level": "medium"}
{"task_id": "c1d6ea6f2196d25782cc3646ff3090db", "confirmed_task": "Create a list of drip coffee makers that are on sale and within $25-60 and have a black finish.", "website": "https://www.google.com/shopping?udm=28", "reference_length": 7, "level": "medium"}
{"task_id": "2dd41b1d0e8f389d0683f4a4627abfe6", "confirmed_task": "Show houses for sale in Maryland with a maximum price of $60,000.", "website": "https://www.landwatch.com/", "reference_length": 7, "level": "medium"}
{"task_id": "f2097f92a10d42a842c14179f422311e", "confirmed_task": "Add a $50 Uber gift card to the cart.", "website": "https://www.bestbuy.com/", "reference_length": 4, "level": "easy"}
{"task_id": "85b284c18d7e78c9b5a9e074e7aa3b98", "confirmed_task": "View the cheapest apartment available for students at the University of Leeds with bills that include WIFI and cleaning services.", "website": "https://www.student.com/", "reference_length": 10, "level": "medium"}
{"task_id": "853afd530c72f4b00ffc32ae854efaf8", "confirmed_task": "Show me the wind flow map for Belo Horizonte.", "website": "https://www.accuweather.com/", "reference_length": 5, "level": "easy"}
{"task_id": "c09721cc937d4dcfb391a0bc2c574b28", "confirmed_task": "Find the next available date for Albion Basin.", "website": "https://www.recreation.gov/", "reference_length": 3, "level": "easy"}
{"task_id": "4c572a627b53b0f9a734ab37f21819b8", "confirmed_task": "Browse apartments with at least 2 bedrooms and 2 bathrooms and a max price of $4000 per month.", "website": "https://craigslist.org/", "reference_length": 5, "level": "easy"}
{"task_id": "301f267f421b93045874726183e8f722", "confirmed_task": "Find healthy savory vegan snack recipes which can be cooked within 5 minutes and contain a high level of protein.", "website": "https://www.healthline.com/", "reference_length": 10, "level": "medium"}
{"task_id": "4f903626f632586fe4728d6664947bab", "confirmed_task": "Find press releases by the antitrust division in 2022.", "website": "https://www.justice.gov/", "reference_length": 4, "level": "easy"}
{"task_id": "3ec0f6138d37fadcb989347a6088ec45", "confirmed_task": "Open the page to learn more about how to get accredited.", "website": "https://www.bbb.org/", "reference_length": 2, "level": "easy"}
{"task_id": "2207bb4f21786690cfed20b37253fb8b", "confirmed_task": "Check the current wind speed in Calgary, Alberta.", "website": "https://www.theweathernetwork.com/", "reference_length": 2, "level": "easy"}
{"task_id": "9c04b71bb8db6cf8e743b2290cbc8797", "confirmed_task": "Find a UPS drop-off point near Miami Florida.", "website": "https://www.ups.com/", "reference_length": 6, "level": "medium"}
{"task_id": "4e0f5561a76478da87995dee00b09572", "confirmed_task": "Show me the monthly weather forecast for Florida City.", "website": "https://www.accuweather.com/", "reference_length": 3, "level": "easy"}
{"task_id": "7562d9b4e4829a44245aafce2e1f62db", "confirmed_task": "Find the nearest location to zip code 54620 that offers size 4 P.O. Boxes.", "website": "https://www.usps.com/", "reference_length": 8, "level": "medium"}
{"task_id": "bd1e3770b7181f6fce9c35e18caa9785", "confirmed_task": "Browse service listings for a solar panel installer and hide duplicates.", "website": "https://craigslist.org/", "reference_length": 3, "level": "easy"}
{"task_id": "330cd04c773ac498f51afa4665461ec8", "confirmed_task": "Browse couches for sale, sort by cheapest, and search in titles only.", "website": "https://craigslist.org/", "reference_length": 6, "level": "medium"}
{"task_id": "ec78d3a635e417bc2a80d03ca93d7165", "confirmed_task": "What are the benefits and financial support a single person living in England, over the state pension age, unemployed, with no health conditions, or caring for someone with one, can get?", "website": "https://www.gov.uk/", "reference_length": 16, "level": "hard"}
{"task_id": "a0a18ca6a3529f3e97c771aadd42d3a0", "confirmed_task": "Add a men's T-shirt that is in large size with a stripe pattern, short sleeve, and under the Best Sellers group to the cart.", "website": "https://www.macys.com/", "reference_length": 7, "level": "medium"}
{"task_id": "82eb3bfedd78456a0230b389f4e7a938", "confirmed_task": "Open the XRP yearly chart.", "website": "https://coinmarketcap.com/", "reference_length": 4, "level": "easy"}
{"task_id": "e7f6cca9a8875f98fee3b711ead3a444", "confirmed_task": "Find the comments made by the user Separate-Camp7202.", "website": "https://www.reddit.com/", "reference_length": 5, "level": "easy"}
{"task_id": "75a1b5dcd2c28508a971d98d51fe5767", "confirmed_task": "Open the reviews of a recipe with beef sirloin.", "website": "https://www.allrecipes.com/", "reference_length": 5, "level": "easy"}
{"task_id": "c03ee2be3d73556ab789c0ad1cbd3451", "confirmed_task": "Find a dog groomer for nail trimming within 100 miles of zip code 10005 and check the detailed service prices of the first one.", "website": "https://www.akc.org/", "reference_length": 11, "level": "hard"}
{"task_id": "05483c50cc9b04c8ac44c574758fb2bd", "confirmed_task": "Look for the best rated BBB accredited charity near 12023.", "website": "https://www.bbb.org/", "reference_length": 8, "level": "medium"}
{"task_id": "a172a5d9ffaf5ef02bd550ec4fe24e6d", "confirmed_task": "Browse the natural products database.", "website": "https://www.drugs.com/", "reference_length": 2, "level": "easy"}
{"task_id": "7e1047f4803237f319c004f7a7f6bccb", "confirmed_task": "Discover the trade-in value of my Intel 7th generation i3 Windows 10, HP laptop in fair condition,  which has 8 GB memory and can be powered on, proceed for the in-store trade-in.", "website": "https://www.bestbuy.com/", "reference_length": 13, "level": "hard"}
{"task_id": "f2be37a9a60fbc25b6b11cf622d17352", "confirmed_task": "Find obedience trials in state of New York during the month of May.", "website": "https://www.akc.org/", "reference_length": 14, "level": "hard"}
{"task_id": "e24662008c3be5d56f986f232fcec447", "confirmed_task": "Find the stock price for WWE over the last month.", "website": "https://www.google.com/finance/", "reference_length": 4, "level": "easy"}
{"task_id": "0170ca95038b05fa58d463fe627ac605", "confirmed_task": "Check if a visa is required to work in the UK for longer than 6 months in Healthcare as an American citizen.", "website": "https://www.gov.uk/", "reference_length": 12, "level": "hard"}
{"task_id": "b3a7da968de13bbdcaed12ffe4993df6", "confirmed_task": "Compare the breeds Afghan Hound, Akita and Azawakh.", "website": "https://www.akc.org/", "reference_length": 9, "level": "medium"}
{"task_id": "515f2e5811cfdd5e0e669e40f17886d8", "confirmed_task": "Search for a new internal M2 Samsung SSD drive between $25 and $200.", "website": "https://www.bestbuy.com/", "reference_length": 8, "level": "medium"}
{"task_id": "4d3157aab34b54e5f0c4b965dfe930f3", "confirmed_task": "Show me community posts about pregnancy fever from the past 30 days.", "website": "https://www.babycenter.com/", "reference_length": 8, "level": "medium"}
{"task_id": "e4e19e04286f644d747d8c5a79d17fac", "confirmed_task": "Find the Drug Interaction Report for Viagra and alcohol.", "website": "https://www.drugs.com/", "reference_length": 6, "level": "medium"}
{"task_id": "cad62d2be0c53f08a416457486b3db23", "confirmed_task": "Search for adoptable dogs near 21122 zip code.", "website": "https://www.adoptapet.com/", "reference_length": 5, "level": "easy"}
{"task_id": "9ef1a8972f375db59c0e6329e11b7939", "confirmed_task": "Find Farms land in Wilkes County, NC with the lowest price.", "website": "https://www.landwatch.com/", "reference_length": 5, "level": "easy"}
{"task_id": "a11ecdff735b51372d536c866011af6f", "confirmed_task": "Explore courses related to Psychology.", "website": "https://www.coursera.org/", "reference_length": 4, "level": "easy"}
{"task_id": "7fff82864f21ddeccf4104a220892824", "confirmed_task": "Find the lowest 27\"-32\" Samsung or LG computer monitors nearby which have 4k, IPS display.", "website": "https://www.google.com/shopping?udm=28", "reference_length": 10, "level": "medium"}
{"task_id": "50d91eabde542906937ab4c5b6f8f23a", "confirmed_task": "Calculate Pregnancy Weight Gain for a 5-week pregnancy with a 169lb weight before pregnancy and a 175lb after pregnancy with a 5.6ft height.", "website": "https://www.babycenter.com/", "reference_length": 9, "level": "medium"}
{"task_id": "dcd26e662a616d373ddd339747c6ce5b", "confirmed_task": "Take a weight management quiz to find a motivating article for a non-exercising, mostly eating out and can't control portions and cravings, and who has a strong support system, enjoys traveling, loves family time and cooking.", "website": "https://www.healthline.com/", "reference_length": 22, "level": "hard"}
{"task_id": "eb2db4b769c145dbe6ba4f74f3e0de98", "confirmed_task": "Find an energetic hairless dog with medium barking.", "website": "https://www.akc.org/", "reference_length": 10, "level": "medium"}
{"task_id": "c0fa2c0e622971955cabf5bcf7b777e8", "confirmed_task": "Search for rentals in Corning, CA with a maximum price of $1500.", "website": "https://www.apartments.com/", "reference_length": 6, "level": "medium"}
{"task_id": "ce616721ce9aeda69890fbccb29677a6", "confirmed_task": "Calculate the price to ship a large flat-rate box from 77449 to 77084 at the first available date and time.", "website": "https://www.usps.com/", "reference_length": 8, "level": "medium"}
{"task_id": "9d09bc948462db032bac98968b11b008", "confirmed_task": "Find NHL events occurring in Boston.", "website": "https://www.stubhub.com/", "reference_length": 7, "level": "medium"}
{"task_id": "29526b17a32485742b5ab63507e99417", "confirmed_task": "Browse Humira dosage information.", "website": "https://www.drugs.com/", "reference_length": 3, "level": "easy"}
{"task_id": "d7c955b47af68e01766fa86d0bee08a7", "confirmed_task": "Add Elevate at Chicago, IL, to favorites and show a virtual tour.", "website": "https://www.apartments.com/", "reference_length": 4, "level": "easy"}
{"task_id": "9d090a15c214eb070d9caa8a034d03c1", "confirmed_task": "Find the lowest-priced Student housing near Liverpool International College which has been priced between 100 to 300 pounds and has a private bathroom.", "website": "https://www.student.com/", "reference_length": 14, "level": "hard"}
{"task_id": "5916018d1cad999881018cac1216a692", "confirmed_task": "Find a personal trainer service at 10040 for a 25-year-old client aiming to build muscle.", "website": "https://www.thumbtack.com/", "reference_length": 6, "level": "medium"}
{"task_id": "0059adc6b12a3822305deb68929b2de8", "confirmed_task": "Find support services jobs in Bentonville, in the state of Arkansas.", "website": "https://careers.walmart.com/", "reference_length": 8, "level": "medium"}
{"task_id": "07bdc595306729a028ba06cc7451a80a", "confirmed_task": "Select a high speed train ticket with a departure time before 23:00  from Shanghai to Beijing.", "website": "https://us.trip.com/", "reference_length": 7, "level": "medium"}
{"task_id": "64b76158720a69e4a5c31a55d54928bf", "confirmed_task": "Compare two pescatarian diets for eating healthier.", "website": "https://www.healthline.com/", "reference_length": 10, "level": "medium"}
{"task_id": "e3ab665e01e7632ce33ac1aeca14aff6", "confirmed_task": "Find the next available dates for Alley Creek Camp.", "website": "https://www.recreation.gov/", "reference_length": 3, "level": "easy"}
{"task_id": "2d5a7f95f951a26838289dfd629ae850", "confirmed_task": "Find a list of houses for sale in zip code 85747 with a private pool.", "website": "https://www.redfin.com/", "reference_length": 8, "level": "medium"}
{"task_id": "26810ed9c123a62992e3eed31db3c5ee", "confirmed_task": "Show daily weather for New York City.", "website": "https://www.accuweather.com/", "reference_length": 4, "level": "easy"}
{"task_id": "c181f903ec1107b850032c17cad88393", "confirmed_task": "Help me identify a pink round pill with 150 written on it.", "website": "https://www.webmd.com/", "reference_length": 7, "level": "medium"}
{"task_id": "ef289e34a2f59a707cb07e2a6229ff03", "confirmed_task": "Compare the Acura CL 2003 with the ILX 2022.", "website": "https://www.cars.com/", "reference_length": 9, "level": "medium"}
{"task_id": "84f806c7fc15576673915f195efa72df", "confirmed_task": "Find a nationwide nearest animal shelter for birds around zip 10012.", "website": "https://www.adoptapet.com/", "reference_length": 8, "level": "medium"}
{"task_id": "be9e7dca1222714571ef3d7d59d2a41c", "confirmed_task": "Find out the cold and flu forecast and today's air quality in Champaign, IL.", "website": "https://weather.com/", "reference_length": 6, "level": "medium"}
{"task_id": "11abb668c751dd56bb41f296a8bb3a13", "confirmed_task": "Find a store near zip 30010 that provides authorized Apple services for imacs and make this one my store.", "website": "https://www.bestbuy.com/", "reference_length": 10, "level": "medium"}
{"task_id": "207e933d1bba815bcb58664b5d82c085", "confirmed_task": "Find Ohio City apartments with parking, a fitness center, and an elevator.", "website": "https://www.apartments.com/", "reference_length": 6, "level": "medium"}
{"task_id": "29b7372d5a3884a2ba831af2d117af3c", "confirmed_task": "Browse the first top news of Microsoft stock on Google Finance.", "website": "https://www.google.com/finance/", "reference_length": 3, "level": "easy"}
{"task_id": "5c00e9561eae94789443f405525a5869", "confirmed_task": "Find the recommended dosage for Vivitrol.", "website": "https://www.healthline.com/", "reference_length": 5, "level": "easy"}
{"task_id": "2532fd402d3c741b79894e6ff2269f53", "confirmed_task": "find electricians near 10203.", "website": "https://www.thumbtack.com/", "reference_length": 3, "level": "easy"}
{"task_id": "9829f3087ab1f9c8eba6b6dd2b831d25", "confirmed_task": "Play the latest video from NBA TV.", "website": "https://www.nba.com/", "reference_length": 3, "level": "easy"}
{"task_id": "783ce6a3499fa7cf25bc12f8f0ecbbbb", "confirmed_task": "Find Florida internship programs in the Mayo Clinic College of Medicine and Science.", "website": "https://www.mayoclinic.org/", "reference_length": 5, "level": "easy"}
{"task_id": "6db4a0e346976f2729ba9afcd3208941", "confirmed_task": "Look up tracking information for shipment #3023858502.", "website": "https://www.fedex.com/en-us/home.html", "reference_length": 2, "level": "easy"}
{"task_id": "1fc28d91d25ccd1c6ba268101326a654", "confirmed_task": "Find the 5-day price chart for Bitcoin.", "website": "https://www.google.com/finance/", "reference_length": 3, "level": "easy"}
{"task_id": "255bf27c43fd3f9254d6b81a5f36d3a9", "confirmed_task": "Look for the largest hunting land for auction in Kansas high plain region with mineral rights posted in the last seven days.", "website": "https://www.landwatch.com/", "reference_length": 9, "level": "medium"}
{"task_id": "a8b9edd598561d2de901864d5f40fe67", "confirmed_task": "Calculate the shipping cost for 4 pound package from Texas to New York.", "website": "https://www.fedex.com/en-us/home.html", "reference_length": 9, "level": "medium"}
{"task_id": "a6f0434ce6aff5f9b03681241b03ad82", "confirmed_task": "Find the closing stock price for Tesla on March 17, 2023.", "website": "https://finance.yahoo.com/", "reference_length": 3, "level": "easy"}
{"task_id": "415bf9da6f3db3a735ecbba3b0c76c15", "confirmed_task": "Find the nearest vet within 50 miles of zip 75228.", "website": "https://www.akc.org/", "reference_length": 9, "level": "medium"}
{"task_id": "8103786e0e5976ebf961bd062d5f39cd", "confirmed_task": "Find possible causes for the symptoms of chest pain which is sharp which is accompanied by anxiety.", "website": "https://www.mayoclinic.org/", "reference_length": 9, "level": "medium"}
{"task_id": "92160852a6bbbc165cee4e14ab0b1d59", "confirmed_task": "Find the shipping cost of a Common medium-sized box in flat-rate shipping and compare it with other parcel services.", "website": "https://www.ups.com/", "reference_length": 5, "level": "easy"}
{"task_id": "502e864440283214e0180645015f568b", "confirmed_task": "Check permit availability for a group of 4 in Brooks Camp, Katmai National Park on May 22.", "website": "https://www.recreation.gov/", "reference_length": 8, "level": "medium"}
{"task_id": "7680a920359cb1a508fbddb001b98167", "confirmed_task": "See the prediction about the girl child's height, whose current height at seven years is 4 feet and whose weight is 55 lbs, her mother is 5 feet 2, and her father is 5 feet 8.", "website": "https://www.babycenter.com/", "reference_length": 11, "level": "hard"}
{"task_id": "07ec4a12cba8090e2dc524d558ac7675", "confirmed_task": "Check drug interaction for melatonin and Folate Forte.", "website": "https://www.drugs.com/", "reference_length": 6, "level": "medium"}
{"task_id": "987bad7c6d4726d64232a8a1c3386888", "confirmed_task": "Find the seller info and seller's notes about the used car model 2011 BMW 135 with a max price of $30000.", "website": "https://www.cars.com/", "reference_length": 11, "level": "hard"}
{"task_id": "15be05973fba714e490cd9c884e4f072", "confirmed_task": "Find the procedure to get the license for Athletic Trainer.", "website": "https://ohio.gov/", "reference_length": 6, "level": "medium"}
{"task_id": "3adeea7627f4343069f38adae40f73d0", "confirmed_task": "Within 25 Miles of 96817, find a nursing home that accepts medicare.", "website": "https://health.usnews.com/", "reference_length": 7, "level": "medium"}
{"task_id": "c94551d2b18f9ad0ab31b0bd98ca42e3", "confirmed_task": "Find cats available for adoption within 10 miles of zip code 94587, Young or adult-age cats, sorted by Oldest Addition.", "website": "https://www.petfinder.com/", "reference_length": 10, "level": "medium"}
{"task_id": "4e801ba102dfaf22c7cf7a126b107609", "confirmed_task": "Find Linux platform software developers in 10080 who master the Python language and Java language with web interface project type.", "website": "https://www.thumbtack.com/", "reference_length": 8, "level": "medium"}
{"task_id": "39c388cdc468688c8139cc2bb5157c13", "confirmed_task": "Calculate the estimated car loan payment amount for an average credit-rated person for a 15,000-dollar car with a down payment of 2000 dollars and loan tenure of 48 months in zip 65215 and shop for the lowest-priced car.", "website": "https://www.cars.com/", "reference_length": 9, "level": "medium"}
{"task_id": "c8d7f2aa7eb5dd074c48c9f76f8659ad", "confirmed_task": "Show Teen Driver Safety program information.", "website": "https://www.dmv.virginia.gov/", "reference_length": 2, "level": "easy"}
{"task_id": "fd787623166785d84093565bf945fd24", "confirmed_task": "Check the interaction between Novolin N and Novolin R.", "website": "https://www.drugs.com/", "reference_length": 6, "level": "medium"}
{"task_id": "c3307a70bb12ebf56cc9ec926b368f15", "confirmed_task": "Find the interactions between Eulexin and hepatic dysfunction.", "website": "https://www.drugs.com/", "reference_length": 5, "level": "easy"}
{"task_id": "9586827ad04ee2362f4f0076bf0f0468", "confirmed_task": "Find the side effects of taking Montelukast.", "website": "https://www.drugs.com/", "reference_length": 6, "level": "medium"}
{"task_id": "34992feb69eb8e788faa06868b365c49", "confirmed_task": "Submit a request for vehicle registration renewal with title number X123456 and last 4 digits of VIN is 1234.", "website": "https://www.dmv.virginia.gov/", "reference_length": 5, "level": "easy"}
{"task_id": "47b93b9e649eadeb8d96a6e3df715c2d", "confirmed_task": "Show me Diagnoses & Treatment for Female infertility.", "website": "https://www.mayoclinic.org/", "reference_length": 4, "level": "easy"}
{"task_id": "3443e9c3151fef19a3c3a45eb2c13640", "confirmed_task": "Search for the ovulation calculator and enter Mar 1 as the first date of the period and calculate the date of ovulation and pregnancy test day.", "website": "https://www.webmd.com/", "reference_length": 12, "level": "hard"}
{"task_id": "6b5be1764692d1dc8f17dc4375b2daa8", "confirmed_task": "Show me historical data for EUR/USD.", "website": "https://finance.yahoo.com/", "reference_length": 4, "level": "easy"}
{"task_id": "16200f51d63f0a47a58fa17acd49e368", "confirmed_task": "Find a recipe that includes eggplant and mushrooms.", "website": "https://cookpad.com/", "reference_length": 3, "level": "easy"}
{"task_id": "c2153fc053112e89c2f103869c4d6890", "confirmed_task": "Find a house cleaning service in 10001 on a weekly basis.", "website": "https://www.thumbtack.com/", "reference_length": 5, "level": "easy"}
{"task_id": "5e4e89c9b6fdaee7a41aca5601b82e04", "confirmed_task": "Identify a pill with a pink color and oval shape with 894 5 number on it.", "website": "https://www.drugs.com/", "reference_length": 8, "level": "medium"}
{"task_id": "60cbbbd58eb9d28b053aef945f464228", "confirmed_task": "Look up if the phone number 555555555 is a scam.", "website": "https://www.bbb.org/", "reference_length": 6, "level": "medium"}
{"task_id": "8f80e64e44e1fada018997b2fe869683", "confirmed_task": "What are the top posts of all time on Reddit?", "website": "https://www.reddit.com/", "reference_length": 3, "level": "easy"}
{"task_id": "65c4030f22fb6eb101acfee4825f1318", "confirmed_task": "Find a female MD Cardiologist in Jacksonville, Florida.", "website": "https://www.mayoclinic.org/", "reference_length": 8, "level": "medium"}
{"task_id": "6ca20f1da01edeb49a7a42c816d8c6fe", "confirmed_task": "Find the Eligibility to get the child benefit and How it works and how to claim", "website": "https://www.gov.uk/", "reference_length": 8, "level": "medium"}
{"task_id": "2e4e21cf1449c6894b17d571c47b77ea", "confirmed_task": "Find an English bulldog near zip code 90028 that was cared for by a private owner.", "website": "https://www.adoptapet.com/", "reference_length": 8, "level": "medium"}
{"task_id": "1df24ec81137386d6476bcf343a79012", "confirmed_task": "Search for NordicTrack with the lowest price.", "website": "https://www.bestbuy.com/", "reference_length": 6, "level": "medium"}
{"task_id": "4639a54f3ab549864fd8d60b7398b1e1", "confirmed_task": "Find a white female kitten within 35 miles of zip 77494.", "website": "https://www.adoptapet.com/", "reference_length": 10, "level": "medium"}
{"task_id": "9af05e392cf3f5a8ff17aa764ba5bda6", "confirmed_task": "Get a quote from C and above-rated solar energy equipment company within 10 miles of Miami, Florida.", "website": "https://www.bbb.org/", "reference_length": 16, "level": "hard"}
{"task_id": "627f7a18d85f29a687234f1ade4585c2", "confirmed_task": "Find the current league leader in total blocked shots.", "website": "https://www.nba.com/", "reference_length": 5, "level": "easy"}
{"task_id": "0b838cd54f826c59c71f600c56b89a11", "confirmed_task": "Find all the locations for the second-best-rated used car dealer less than 5 miles from New York.", "website": "https://www.bbb.org/", "reference_length": 11, "level": "hard"}
{"task_id": "5dec0e6620849459f29e6465982c597e", "confirmed_task": "Search for 33 to 49inch Qled gaming monitor with a 240hz refresh rate that is within $1000 to $2000.", "website": "https://www.bestbuy.com/", "reference_length": 11, "level": "hard"}
{"task_id": "52efbab520734ef9bf7c09ba0f62cdc8", "confirmed_task": "Find the app for iOS.", "website": "https://www.recreation.gov/", "reference_length": 2, "level": "easy"}
{"task_id": "b1ce968a361e1088ce8d2ade6c2c9af0", "confirmed_task": "Find young cats in Seattle and show off the newest additions.", "website": "https://www.petfinder.com/", "reference_length": 6, "level": "medium"}
{"task_id": "23204728192da9f73197a613d9681c18", "confirmed_task": "What are the Symptoms and causes of fever?", "website": "https://www.mayoclinic.org/", "reference_length": 3, "level": "easy"}
{"task_id": "a69d2934fe54fef165490a5a2d95bf38", "confirmed_task": "Show me recipes for pancakes with wheat and without beetroot.", "website": "https://cookpad.com/", "reference_length": 6, "level": "medium"}
{"task_id": "e9f4dfc67e0e6aa37f05f7cc5aa7428c", "confirmed_task": "Browse pediatricians near zip code 90028 who specialize in Internal Medicine and have a rating of at least 4 stars.", "website": "https://www.healthgrades.com/", "reference_length": 9, "level": "medium"}
{"task_id": "2218042362d8fae73756eb309848c2b2", "confirmed_task": "Compare Audi A7 with Audi A6, both made in 2023, and hide similarities.", "website": "https://www.cars.com/", "reference_length": 9, "level": "medium"}
{"task_id": "ba2a469af584f16da93ce6a7430cf7e5", "confirmed_task": "Search for a beginner\u2019s course in computer science that includes advertisement skills.", "website": "https://www.coursera.org/", "reference_length": 7, "level": "medium"}
{"task_id": "26784156ae9859a0dd6c5920eb106f91", "confirmed_task": "calculate and search rent for a $6000 monthly income with 30% rent budget near 90012 area.", "website": "https://www.apartments.com/", "reference_length": 8, "level": "medium"}
{"task_id": "47e314cc452c540524ffb7cf520285a3", "confirmed_task": "Find the park that offers the cheapest paddling permits.", "website": "https://www.recreation.gov/", "reference_length": 6, "level": "medium"}
{"task_id": "271b36efd4346721b5542488ff997042", "confirmed_task": "Browse 8K Samsung TVs that are open box.", "website": "https://www.bestbuy.com/", "reference_length": 4, "level": "easy"}
{"task_id": "6b2cfae0ef25c73d1224b6ab74cb8b63", "confirmed_task": "Find Devin Booker's highest-scoring points per game playoff run.", "website": "https://www.nba.com/", "reference_length": 7, "level": "medium"}
{"task_id": "0a54069a0ef542e571d1fee7f39c93d5", "confirmed_task": "Browse senior spayed/neutered dogs near zip code 90028.", "website": "https://www.adoptapet.com/", "reference_length": 6, "level": "medium"}
{"task_id": "4e3f6a538cc1f7321cfc50260db9545d", "confirmed_task": "Look up the current temperature for zip code 10019.", "website": "https://www.theweathernetwork.com/", "reference_length": 2, "level": "easy"}
{"task_id": "f00e7accfb4a5e09680bdb326e6274ad", "confirmed_task": "Check the hourly forecast for Boston.", "website": "https://www.accuweather.com/", "reference_length": 3, "level": "easy"}
{"task_id": "6174e5ddd40cfbdc33ee1502f40bac39", "confirmed_task": "Find a day-use park that offers horseback riding near Nashville.", "website": "https://www.recreation.gov/", "reference_length": 6, "level": "medium"}
{"task_id": "547f5729c59d5d12a457a3ebb74c31c6", "confirmed_task": "Search for 3 bedroom condos with 2 bathrooms within $1500- $2500 range in NYC.", "website": "https://www.apartments.com/", "reference_length": 14, "level": "hard"}
{"task_id": "0b2623e9fa5cea997f76490bcbc5220f", "confirmed_task": "Find a list of shorthaired dogs available for adoption within 100 miles of zip code 94587 that are good with kids and cats, and have been on Petfinder for over 30 days.", "website": "https://www.petfinder.com/", "reference_length": 13, "level": "hard"}
{"task_id": "3ae28b3c440efe87dc700480b78ac608", "confirmed_task": "Find the closest 5-star rated dentist to zip code 98011.", "website": "https://www.healthgrades.com/", "reference_length": 9, "level": "medium"}
{"task_id": "0632e496d37badee0350dad358f047c5", "confirmed_task": "Browse recipes for gluten-free chocolate chip cookies that can be made without nuts.", "website": "https://cookpad.com/", "reference_length": 4, "level": "easy"}
{"task_id": "aafd1fddea1558466ac6133934d35156", "confirmed_task": "Find a Single-Family House for Rent in Houston, TX with 1 bed.", "website": "https://www.apartments.com/", "reference_length": 8, "level": "medium"}
{"task_id": "246d654fab7c31d9651007e39e75f74f", "confirmed_task": "Open the most helpful 5-star reviews of Alpine Ridge.", "website": "https://www.recreation.gov/", "reference_length": 5, "level": "easy"}
{"task_id": "690d7b4a285fdb1e9dabf973bf46ae4d", "confirmed_task": "Browse iPhone X for sale that is in good condition, has a max price of 400, and searches in titles only.", "website": "https://craigslist.org/", "reference_length": 8, "level": "medium"}
{"task_id": "c43a7dccf5c44f7b45a821e712dd1970", "confirmed_task": "Take a newsletter subscription with my email id (buckeye.foobar@gmail.com) for Allergies and asthma, Anxiety and depression, nutrition, diabetes, breast cancer, and migraine with email id.", "website": "https://www.healthline.com/", "reference_length": 8, "level": "medium"}
{"task_id": "d5c34bf39eb6096ae5d439325cde4d32", "confirmed_task": "Find a DMV center in Richmond.", "website": "https://www.dmv.virginia.gov/", "reference_length": 5, "level": "easy"}
{"task_id": "180ed2ec377ef3a4af9035a21522091a", "confirmed_task": "Find the way to give a gift to UM-Dearborn.", "website": "https://umich.edu/", "reference_length": 5, "level": "easy"}
{"task_id": "c521933dad9c0ef9f1dfa2f38b8e4405", "confirmed_task": "See the monthly forecast for Atlanta, GA.", "website": "https://www.accuweather.com/", "reference_length": 3, "level": "easy"}
{"task_id": "9b5dfe54a1c14c5c6336bae7374c3bb5", "confirmed_task": "Find a UPS Access Point near SPRING, TX and services provided by them.", "website": "https://www.ups.com/", "reference_length": 8, "level": "medium"}
{"task_id": "c073ac1bcf40f84c599affc97edbc396", "confirmed_task": "Search for the cheapest apartment in Detroit for a student.", "website": "https://www.apartments.com/", "reference_length": 9, "level": "medium"}
{"task_id": "73d08420706ae205a9c5be28b6d4e80f", "confirmed_task": "Show me the rules and cancellation for Alley Spring.", "website": "https://www.recreation.gov/", "reference_length": 3, "level": "easy"}
{"task_id": "0a0fa834ce41b5297c6474293383759d", "confirmed_task": "What are the onboard activities of the highest-rated Regent Seven Seas Cruise ship based on Costco member reviews?", "website": "https://www.costco.com/", "reference_length": 8, "level": "medium"}
{"task_id": "a13e4231a3d6a7000c622c56448d97ba", "confirmed_task": "Find an Airbnb in Cleveland for three nights. The check-in date is the day after tomorrow. We have 2 adults, 2 kids, and 1 pet. The budget is $100 to $300 per night. Essential amenities include free parking, a washer, and a gym.", "website": "https://www.airbnb.com/", "reference_length": 19, "level": "hard"}
{"task_id": "bb518416a786fdb9b9bbf0c78515595e", "confirmed_task": "Browse the class schedule of graduate-level computer science courses.", "website": "https://www.osu.edu/", "reference_length": 4, "level": "easy"}
{"task_id": "b99c02965196d51e80ac7539e33f335b", "confirmed_task": "Please find graduate-level computer science courses scheduled on Tuesdays starting time from 2:00 to 6:00 PM in the Fall 2023 semester.", "website": "https://www.berkeley.edu/", "reference_length": 9, "level": "medium"}
{"task_id": "27fa3ac20745d3d35e89fae157f63069", "confirmed_task": "Browse the class schedule of graduate-level chemistry courses on Monday afternoons in the winter of 2023.", "website": "https://www.stanford.edu/", "reference_length": 11, "level": "hard"}
{"task_id": "b4aa7315e31dfcdc52baf7771be260c9", "confirmed_task": "Find the HGX H100 driver for Ubuntu 22.04 on AMD64 CPU.", "website": "https://www.nvidia.com/", "reference_length": 11, "level": "hard"}
{"task_id": "442a450e696a96085257db6297891a4d", "confirmed_task": "Using a calculator to determine how much I can have in my 401(k) account at retirement, if I work from age 22 to 65, with an annual rate of return of 3%, annual employee contributions of $8,000, and annual employer contributions of $8,000.", "website": "https://www.chase.com/", "reference_length": 11, "level": "hard"}
{"task_id": "9ed3827266b3b804f485859c3d00401e", "confirmed_task": "If I'm 30, plan to retire at 65, and can save $300/month, with a 3% annual return, 13% current tax rate, and 24% retirement tax rate, show the comparison chart between Traditional and Roth IRA.", "website": "https://www.chase.com/", "reference_length": 12, "level": "hard"}
{"task_id": "c801d1c951f59297f526bab84fa86c6e", "confirmed_task": "Browse the latest negative reviews from players with over 100 hours of playtime for the game that won the 2023 VR Game of the Year Award.", "website": "https://store.steampowered.com/", "reference_length": 11, "level": "hard"}
{"task_id": "7c09c2c7c87cf6bb1138701eb54284ea", "confirmed_task": "Find the comments for the most popular news in the past month under the Quantum Physics topic.", "website": "https://phys.org/", "reference_length": 8, "level": "medium"}
{"task_id": "afcebfed28bea091d58f49ea6cb8194b", "confirmed_task": "Find the most reviewed gluten-free multivitamins from CVS Health Brand under $15.", "website": "https://www.cvs.com/", "reference_length": 12, "level": "hard"}
{"task_id": "64345c365f544375357c7b67917f08a0", "confirmed_task": "Look for the newest refrigerator that is 34-36 inches wide, priced between $1,000 and $2,000, and has a customer review rating of 4 stars or higher.", "website": "https://www.costco.com/", "reference_length": 8, "level": "medium"}
{"task_id": "ab6ee3b83aab6cd283320f5e01003cff", "confirmed_task": "Find the tech specs of the MacBook Pro 16-inch introduced in November 2023.", "website": "https://www.apple.com/", "reference_length": 7, "level": "medium"}
{"task_id": "33bd2cdcea4fcc42a09a8a1e4e5841c6", "confirmed_task": "Add a 5-piece Tenders Combo to my bag with Sweet Corn as the side, Sweet Tea as the drink, and both Honey BBQ and Honey Mustard sauces. Select the store closest to Zip code 10001 for pick-up tomorrow at 12:00 PM.", "website": "https://www.kfc.com/", "reference_length": 23, "level": "hard"}
{"task_id": "47186fac8e7c7277af01144644eb4e0b", "confirmed_task": "What is the ownership cost of the first car in the list \"top buys 2025\"?", "website": "https://www.parkers.co.uk/", "reference_length": 3, "level": "easy"}
{"task_id": "fa9adb815b85d259f943d81874a052e5", "confirmed_task": "Browse a user homepage that reposted the top song from the Top 50 Rock chart.", "website": "https://soundcloud.com/", "reference_length": 6, "level": "medium"}
{"task_id": "b922508886ded315c9835457a6eb43ea", "confirmed_task": "Browse tenured/tenure-track faculty positions in Computer Sciences & Technology in California.", "website": "https://jobs.chronicle.com", "reference_length": 6, "level": "medium"}
{"task_id": "5d542a7ec1fa142ba73cc87d970caf39", "confirmed_task": "Find the most cited publication at the 2022 CVPR main conference.", "website": "https://dblp.org/", "reference_length": 6, "level": "medium"}
{"task_id": "864244b6969e0f8733b0eb1ca06cd51f", "confirmed_task": "Find the race time for who wins the first place in the last race of the 2023 Formula 1 (F1).", "website": "https://www.espn.com/", "reference_length": 6, "level": "medium"}
{"task_id": "01abae9608f2d8752a83e08f136f720c", "confirmed_task": "Show me the code for the company that is the top mover in the Cboe Europe Technology Sector Index (BEPTEC) as of the latest market close.", "website": "https://www.cboe.com/", "reference_length": 6, "level": "medium"}
{"task_id": "da8f3823a827c7d3a492f383808e7912", "confirmed_task": "Find and open the earliest press release.", "website": "https://www.instructure.com/", "reference_length": 6, "level": "medium"}
{"task_id": "8689af4d33ce00bf2cdd8987d3bbfd86", "confirmed_task": "Add the cheapest certified refurbished iPad Air with 256GB of storage in any shade of blue to my bag.", "website": "https://www.apple.com/", "reference_length": 8, "level": "medium"}
{"task_id": "78f397336b6fd1cbba0127db7a8cd502", "confirmed_task": "Browse the upcoming SuperBike events taking place in Italy.", "website": "https://www.redbull.com/", "reference_length": 8, "level": "medium"}
{"task_id": "3dca7cbe7d086619d837ff9f5312cebc", "confirmed_task": "Can you show me products under the category path 'Automotive' -> 'Car Jack', with an additional filter for the color pink?", "website": "https://us.shein.com/", "reference_length": 4, "level": "easy"}
{"task_id": "b962927dfe03bf2274a54381127ed433", "confirmed_task": "Find the best-selling vinyl record by an artist from New York City in the classical music genre.", "website": "https://bandcamp.com/", "reference_length": 8, "level": "medium"}
{"task_id": "78baf9dbe7c3532f7d7ef4cc22a7f065", "confirmed_task": "Find the most popular digital trends report in the Finance & Insurance industry within the region of China.", "website": "https://www.statista.com/", "reference_length": 8, "level": "medium"}
{"task_id": "c7c07ec10c668625a21ba64165d719bb", "confirmed_task": "Find the total monthly price for four prepaid unlimited lines without autopay discounts.", "website": "https://www.verizon.com/", "reference_length": 8, "level": "medium"}
{"task_id": "512fd4deab099b8dc0dcfc0ec48a3c63", "confirmed_task": "Identify the open issue with the most comments in the first trending open-source repository this week.", "website": "https://github.com/", "reference_length": 8, "level": "medium"}
{"task_id": "d9d8b7d84a3f8d057e368254fe8d65e2", "confirmed_task": "Find the first commit submitted by NielsRogge to the official repository of the SAM2 model.", "website": "https://github.com/", "reference_length": 8, "level": "medium"}
{"task_id": "157f4a79d55e8fa3fd55ba772ba40fbc", "confirmed_task": "Find the most popular blue Lilo & Stitch toys.", "website": "https://www.disney.com/", "reference_length": 9, "level": "medium"}
{"task_id": "62c8d970b3d13891f355911e5a8f4030", "confirmed_task": "Find the top game listed in the Steam Deck's top-played list over the past year. Then, browse reviews for that game from players who have played over 100 hours and primarily use a Steam Deck.", "website": "https://store.steampowered.com/", "reference_length": 9, "level": "medium"}
{"task_id": "11857213ca01510f12813740afd59918", "confirmed_task": "Add the most top-selling Adidas men's basketball shoe in red, size 10 to my cart.", "website": "https://www.adidas.com/", "reference_length": 10, "level": "medium"}
{"task_id": "47bfe8a7e0e4e7efc837287b407fbe90", "confirmed_task": "Compare the first and second most popular smartphones manufactured by Xiaomi and show the comparison chart.", "website": "https://versus.com/", "reference_length": 10, "level": "medium"}
{"task_id": "bb314cb80f0f8489135cbf59074d11e2", "confirmed_task": "Open the page for the first Best Paper Award video recording of talks from ICLR 2016.", "website": "https://iclr.cc/", "reference_length": 4, "level": "easy"}
{"task_id": "1aeca99e6a60b0e3aefb3ef212bdce79", "confirmed_task": "Find full-time legal occupation jobs in San Diego County with a minimum salary of $4,000+ per month.", "website": "https://www.ca.gov/", "reference_length": 10, "level": "medium"}
{"task_id": "d730f4ff450da1bd60a836163736ef6a", "confirmed_task": "Find the best-selling GORE-TEX men's hiking shoe priced between $100.00 and $199.99 with a rating of 4 stars or higher, and show its most helpful comment.", "website": "https://www.rei.com/", "reference_length": 10, "level": "medium"}
{"task_id": "fe33894188d20d7469f37a9fd855e7ff", "confirmed_task": "Find me Python 3.9 packages on PyPI that are designed for the Web Environment, licensed under MIT, have a stable production status, and are intended for developers.", "website": "https://pypi.org/", "reference_length": 11, "level": "hard"}
{"task_id": "71f8de1834599fba443f40dbbfab8edd", "confirmed_task": "Search for papers related to reinforcement learning under the topics of computer science and mathematics on arxiv, with recent submission dates between September 2024 and January 2025.", "website": "https://arxiv.org/", "reference_length": 11, "level": "hard"}
{"task_id": "c8c1ff115879b3afd14280beb1559b13", "confirmed_task": "Find the latest Doraemon video in MP4 format that is over 20 minutes long and has a medium file size.", "website": "https://www.4shared.com/", "reference_length": 12, "level": "hard"}
{"task_id": "d4fb78b7e74508cd3b33f01cf9200997", "confirmed_task": "Show the figure comparing Occupational Fatalities Trends between Ohio and New York.", "website": "https://www.americashealthrankings.org/", "reference_length": 12, "level": "hard"}
{"task_id": "0e42c3a73f2aece1f854e0ba55b7c8b0", "confirmed_task": "Find a gas station in Manhattan, NY with a rating above 4.0, and sort the user reviews by the lowest rating.", "website": "https://www.google.com/maps/", "reference_length": 7, "level": "medium"}
{"task_id": "96afb3c51146b0c2a9c55f039a5ea6d6", "confirmed_task": "Find the most frequent word that rhymes with \"thought\" and has three syllables.", "website": "https://www.merriam-webster.com/", "reference_length": 5, "level": "easy"}
{"task_id": "59912927c1fddee6ded8a49986896bc2", "confirmed_task": "Look for the most useful reviews of the highest-rated anti-reflective TVs with screen sizes from 55\" to 64\" and prices ranging from $300 to $1500.", "website": "https://www.samsung.com/", "reference_length": 14, "level": "hard"}
{"task_id": "e43cbc8a0bf9e999884928d11006f894", "confirmed_task": "Browse the list of things to do in Miami that have a rating of 9+ (wonderful), last between 1 to 4 hours per session, cost under $100 per person, and are available for booking between next Monday and next Friday.", "website": "https://www.expedia.com/", "reference_length": 15, "level": "hard"}
{"task_id": "1b867afecf072cb877ebfa4069263746", "confirmed_task": "Display the figure comparing unemployment trends among women in Illinois and Michigan.", "website": "https://www.americashealthrankings.org/", "reference_length": 15, "level": "hard"}
{"task_id": "c3a333968fc3c43d7f2688f425a0d633", "confirmed_task": "Find the cheapest certified pre-owned Porsche 911 with a model year of 2019 or newer, within a 200-mile radius of ZIP code 97007.", "website": "https://www.porsche.com/", "reference_length": 15, "level": "hard"}
{"task_id": "bb5d90e6f2fbc0ae146f7c1998c2b4a1", "confirmed_task": "Find the most viewed TED talk on the topic of robots that lasts between 12 and 18 minutes.", "website": "https://www.ted.com/", "reference_length": 15, "level": "hard"}
{"task_id": "c577a14301a725e09ccd269a3e0b271e", "confirmed_task": "Return the page for the highest-rated red wine from Oregon under $40 that pairs well with either mushrooms or veal.", "website": "https://www.vivino.com/", "reference_length": 15, "level": "hard"}
{"task_id": "c6c9dc6079677cef594cec2fa6b16602", "confirmed_task": "Add the cheapest black sofa with at least three seats, a leather finish, and at least four stars to my cart.", "website": "https://www.ikea.com/", "reference_length": 16, "level": "hard"}
{"task_id": "c39d6c245f8243993e707d54d2f4acec", "confirmed_task": "Browse the final skin in the list for the champion Ahri.", "website": "https://www.leagueoflegends.com/", "reference_length": 18, "level": "hard"}
{"task_id": "b2f4fde2fce122a93c7b578086cb0585", "confirmed_task": "Find the cheapest hotel + flight + car package from New York to San Francisco, departing tomorrow and returning on the fourth day from departure, for two adults and a six-year-old child. The package should be one room with free breakfast and spa access.", "website": "https://www.booking.com/", "reference_length": 19, "level": "hard"}
{"task_id": "d02d236836924919f35f2438d9ed2374", "confirmed_task": "Browse the top 250 movies and find one movie that is available on AMC+.", "website": "https://www.imdb.com/", "reference_length": 22, "level": "hard"}
{"task_id": "3621b099326c7aebd2e2dac6be3b52d1", "confirmed_task": "Open the profile page of the leader of the Nvidia Learning and Perception Lab.", "website": "https://www.nvidia.com/", "reference_length": 5, "level": "easy"}
{"task_id": "f27b393bbd2082f92b566270c4b74fe6", "confirmed_task": "Find a large van for sale from the year 2024 or newer with up to 10,000 miles.", "website": "https://www.parkers.co.uk/", "reference_length": 7, "level": "medium"}
{"task_id": "ba01ea557b73f864c35ebba0dd6f3cb2", "confirmed_task": "Find the top-rated hotel in Manhattan, NY, suitable for 4 guests, and identify the fastest public transportation option from the hotel to LGA airport.", "website": "https://www.google.com/maps/", "reference_length": 14, "level": "hard"}
{"task_id": "662ae0f2d3ac851dbcdd245f908277e3", "confirmed_task": "What is the second stop among the best stops along the road trip from Yellowstone National Park to Las Vegas?", "website": "https://wanderlog.com/", "reference_length": 5, "level": "easy"}
{"task_id": "461ab9b0c7b20ac5f912704480979c65", "confirmed_task": "Find the NYSE Rule 605 Market Center Files data for July 2024.", "website": "https://www.nyse.com/", "reference_length": 5, "level": "easy"}
{"task_id": "a96fca87a17d792644e736d1d10d3cbe", "confirmed_task": "View the pricing plan for 'Business'. Specifically, we have 100 users. We need a 1PB storage quota and a 50 TB transfer quota.", "website": "https://mega.io/", "reference_length": 5, "level": "easy"}
{"task_id": "2c8ef01a92c71ba9ef2e59bb17eea2b3", "confirmed_task": "If there are any discounts on the Apple Mac Studio, add the one with the largest absolute discount to my cart; otherwise, add the cheapest one.", "website": "https://www.costco.com/", "reference_length": 6, "level": "medium"}
{"task_id": "3084bc225219fcb73dc1cb0f97276c1c", "confirmed_task": "Get quotes for a package weighing 10 lbs with dimensions of 2 inches in length, width, and height, being shipped from Long Beach, 90802 to Portland, 97201.", "website": "https://www.ups.com/", "reference_length": 7, "level": "medium"}
{"task_id": "949dc965a6c23a95663b3bc2ca2c3a8a", "confirmed_task": "Find UA or AA flights from London to New York that arrive between 8:00 PM and 11:00 PM on FlightAware.", "website": "https://www.flightaware.com/", "reference_length": 13, "level": "hard"}
{"task_id": "636b07af4dd97c1793733db1fd1b90b8", "confirmed_task": "Filter handbags to evening bags that are blue, and polyester and cost less than $100.", "website": "https://www.macys.com/", "reference_length": 9, "level": "medium"}
{"task_id": "38203be65401943aea2179c4c680059a", "confirmed_task": "Check the status of bus S92 for any disruptions on new.mta.info.", "website": "https://new.mta.info/", "reference_length": 6, "level": "medium"}
{"task_id": "cf757a775fa1224acfc7998489e199a8", "confirmed_task": "Find a flight from Dublin to anywhere under $100 tomorrow on Ryanair.", "website": "https://www.ryanair.com/", "reference_length": 13, "level": "hard"}
{"task_id": "d8e2a81fa621ce4737e5ea85671b630e", "confirmed_task": "Search for regular weekday jobs around 14810 that I can start within two weeks or three.", "website": "https://hiring.amazon.com/", "reference_length": 13, "level": "hard"}
{"task_id": "63d6866fc000fcb1f153e07604bd1395", "confirmed_task": "What are the Nearby Attractions from the most popular attraction in Hong Kong?", "website": "https://us.trip.com/", "reference_length": 8, "level": "medium"}
{"task_id": "199be0b54a436daee74247971fc684ee", "confirmed_task": "Add a Macy's Happy Birthday E-Gift Card worth $50 from Shak to my cart, with the birthday wish message \"Happy birthday, wish you many more years to come\", addressed to christene (christenson@gmail.com).", "website": "https://www.macys.com/", "reference_length": 11, "level": "hard"}
{"task_id": "c00437fd76a7a83b57f3dc4e5dbc41f8", "confirmed_task": "Check the most recent full-time medical health and safety jobs, requiring 1-3 years of industry experience available in the US.", "website": "https://www.amazon.jobs/", "reference_length": 8, "level": "medium"}
{"task_id": "fc53ddd3421411a41c1020a3fdc84ec4", "confirmed_task": "I want to purchase an open-box Samsung Galaxy S25 Plus in excellent condition and trade in a gray Galaxy S20 5G (Verizon), with a perfect screen, in good condition. How much would it cost?", "website": "https://www.bestbuy.com/", "reference_length": 17, "level": "hard"}
{"task_id": "9d46ccb915eff39ee1ae1e7328f5f20d", "confirmed_task": "Get a quote for the fastest shipping available for 5 lbs with dimensions of 4 inches in length, width, and height from New York, NY 10001, USA to Truckee, California 96162, USA.", "website": "https://www.ups.com/", "reference_length": 8, "level": "medium"}
{"task_id": "d1970c16271496cbbe166ecbecc0a1d8", "confirmed_task": "I'm 25 and located in Texas. Shop for 2020 made dry red wine made in United States priced between 15-20 dollars and add 5 bottles to the cart.", "website": "https://macyswineshop.com/", "reference_length": 13, "level": "hard"}
{"task_id": "7211af65d266402f99499053924262e9", "confirmed_task": "View the most recent job posting for a full-time pharmacy position in the US.", "website": "https://www.amazon.jobs/", "reference_length": 8, "level": "medium"}
{"task_id": "4464a8421f8bc8786524a499258dfad3", "confirmed_task": "Check the specifications of the best-selling HP FHD laptop with 16 GB RAM and core i7 running on Windows 11.", "website": "https://www.bestbuy.com/", "reference_length": 12, "level": "hard"}
{"task_id": "f707d765bca668830745d20807d7bee6", "confirmed_task": "Show me the list of young female English Spot rabbits available for adoption in Chicago, IL, within 50 miles.", "website": "https://www.petfinder.com/", "reference_length": 14, "level": "hard"}
{"task_id": "d392e154c1c6ffbb26e2331c3afafc67", "confirmed_task": "Add a $100 Best Buy gift card for a birthday to my cart.", "website": "https://www.bestbuy.com/", "reference_length": 6, "level": "medium"}
{"task_id": "a5c87cc1c94a090c9a8dc2c8b6a125d0", "confirmed_task": "Find the SO2 air quality over the past hour for Maine North, County Cork, Ireland.", "website": "https://www.accuweather.com/", "reference_length": 15, "level": "hard"}
{"task_id": "367d843c640637745e8fafa741cca13b", "confirmed_task": "Find a condo for rent in Houston, TX, with a monthly rent of no more than 30% of an income of $8000. The condo should have a minimum area of 600 square feet, and the move-in date is the 1st of next month.", "website": "https://www.apartments.com/", "reference_length": 15, "level": "hard"}
{"task_id": "84ef883a37af638c3bcf7561f28ce80a", "confirmed_task": "Find the cheapest used hatchback car listing in Madison which has black interiors with a heated seat option and premium sound system.", "website": "https://www.cars.com/", "reference_length": 12, "level": "hard"}
{"task_id": "d9a8689393effeed75ea0866e44e1def", "confirmed_task": "Find the address and phone of the Office of the Inspector General (OIG).", "website": "https://www.justice.gov/", "reference_length": 8, "level": "medium"}
{"task_id": "1bc154377120ec15b18dbabdba49c741", "confirmed_task": "Book 4 tickets in the upper for any Kevin Hart show in New York in the next three months and view ticket prices with estimated fees.", "website": "https://www.stubhub.com/", "reference_length": 12, "level": "hard"}
{"task_id": "28e7574e7bd6d14f36d2988a5ef2bd23", "confirmed_task": "Get a part-time job within 5 miles of Moscow, Idaho in the accommodation and food services industry, as a chef, and show jobs for corporate only.", "website": "https://ohiomeansjobs.ohio.gov/", "reference_length": 12, "level": "hard"}
{"task_id": "1c3b747ae12ccee895745f82e3f2ef8a", "confirmed_task": "Identify the ongoing competition that offers the highest prize and find the code that received the most votes in that competition.", "website": "https://www.kaggle.com/", "reference_length": 11, "level": "hard"}
{"task_id": "d1807551297ac60ecaaabbd2a2ed301a", "confirmed_task": "Find the No.1 children's hospital in the California that specializes in Neonatology.", "website": "https://health.usnews.com/", "reference_length": 8, "level": "medium"}
{"task_id": "7abdceee212151f187ee1a1744c57606", "confirmed_task": "Can you show me the page with the filing fee for a self-petitioned I-140 application?", "website": "https://www.uscis.gov/", "reference_length": 6, "level": "medium"}
{"task_id": "0e5536aaad9d3462b06cf725e6ed535a", "confirmed_task": "Show me the page with average wait times for U.S. citizens arriving at Raleigh-Durham International Airport on 2025-03-12.", "website": "https://www.cbp.gov/", "reference_length": 11, "level": "hard"}
{"task_id": "bc2ce7f206045dd2d322e5695a947219", "confirmed_task": "Estimate the federal income tax I would owe on $158,500 of taxable income in ZIP code 97007, filing as single.", "website": "https://smartasset.com/", "reference_length": 6, "level": "medium"}
{"task_id": "7e6993f2c5cd72c44809024f0bc85dc1", "confirmed_task": "Create a meme with a frog as the background and leave the only text with \"Enjoy your life\".", "website": "https://imgur.com/", "reference_length": 8, "level": "medium"}
{"task_id": "a48e2f1ee8d87eaeea56fe5e730427e6", "confirmed_task": "Pass the first trending chess puzzle.", "website": "https://www.chess.com/", "reference_length": 7, "level": "medium"}
{"task_id": "dd44c665cec1e9c929a4c5f074e7844a", "confirmed_task": "Find parking near the San Francisco Museum of Modern Art from June 18, 1:00 PM to 5:00 PM. I'm driving a Ford F-150 and need a garage that allows in-and-out privileges. If there are multiple options, show me the details of the one with the lowest price.", "website": "https://spothero.com/", "reference_length": 17, "level": "hard"}
{"task_id": "99daaed9a83c266341d28aa40067d376", "confirmed_task": "Find the most popular board game on the 'The Hotness' list that has a rating above 7.5 and is suitable for 2 players.", "website": "https://boardgamegeek.com/", "reference_length": 5, "level": "easy"}
{"task_id": "7072d09436972a5d5fe7476e3e9f1559", "confirmed_task": "Show me the comparison of the first two personal credit cards that do not charge foreign transaction fees.", "website": "https://www.americanexpress.com/", "reference_length": 10, "level": "medium"}
{"task_id": "2c20d87a046fadcb6ff07ee877bfbf37", "confirmed_task": "Open the form 8843 for tax year 2022.", "website": "https://www.irs.gov/", "reference_length": 8, "level": "medium"}
{"task_id": "753f372c189d3b306623cb0c65b50320", "confirmed_task": "Compare the U.S. ETP Odd Lot Rate (%) between Quartile 1 and Quartile 4, viewing quartiles by price, and display the chart with a logarithmic scale on the vertical axis.", "website": "https://www.sec.gov/", "reference_length": 9, "level": "medium"}
{"task_id": "733f1d8bf79d5bc2240c5357f928ffff", "confirmed_task": "Find the cheapest travel deal or discount to Thailand that lasts more than 10 days, departs in next month, and show the total price.", "website": "https://www.tourradar.com/", "reference_length": 10, "level": "medium"}
{"task_id": "f05e87c5b92d9869e08806103c1c15a1", "confirmed_task": "Find all startup companies from the 2022 and 2023 Y Combinator batches that are based in France and currently have job openings.", "website": "https://www.ycombinator.com/", "reference_length": 12, "level": "hard"}
{"task_id": "3ef64f34eae59c9fac7ee9a4f18b4a0c", "confirmed_task": "Find and open an animal learning course on YouTube Kids for my 6-year-old without login in. As a parent born in 1992, I would prefer not to enable search.", "website": "https://www.youtube.com/", "reference_length": 16, "level": "hard"}
{"task_id": "f158345f8489e0d1d91e28768c39bca1", "confirmed_task": "Estimate the total cost (with basic support) of using 5 million input tokens and 5 million output tokens each for GPT-4o and GPT-4o Mini, both deployed in the US/EU Data Zones under Standard (On-Demand) in the East US region.", "website": "https://azure.microsoft.com/", "reference_length": 13, "level": "hard"}
{"task_id": "1ab384fb3a791edfb410213cc6b82151", "confirmed_task": "Show me the result of a proton emission decay for a Beryllium nucleus with 6 protons and 4 neutrons in the simulation.", "website": "https://phet.colorado.edu/", "reference_length": 13, "level": "hard"}
{"task_id": "1223b07536a87e0170ff87cbbebd1d3c", "confirmed_task": "Complete a multiplication quiz on https://www.coolmath4kids.com/, covering multiplication facts for 11-12. The quiz should consist of 10 questions, with unlimited time allowed for each. The goal is to achieve a perfect score of 10 out of 10.", "website": "https://www.coolmath4kids.com/", "reference_length": 24, "level": "hard"}


================================================
FILE: packages/evals/datasets/webtailbench/WebTailBench_data.jsonl
================================================
{"id":"united_13","category":"flights","ques":"What is the price difference between economy and business class on United Airlines direct flights from Chicago to São Paulo from 11/24/2025 to 12/14/2025? If there are no available flights for those dates, please indicate that in your answer\r","web":""}
{"id":"ryanair_55","category":"flights","ques":"How many seats with extra legroom are available on Ryanair from Birmingham, UK to Porto, Portugal flying out 11/23/2025 and coming back 11/18/2025? If there are no available flights for those dates or this is not possible, please indicate that in your answer\r","web":""}
{"id":"westjet_47","category":"flights","ques":"What is the checked baggage allowance and any associated fees for WestJet flights from Waterloo, Ontario to Calgary, Alberta September 10, 2026 - September 27, 2026 round trip? If there are no available flights for those dates, please indicate that in your answer\r","web":""}
{"id":"airasia_88","category":"flights","ques":"How much does it cost to select a window seat on a direct AirAsia flight from Singapore to Langkawi from November 24 to November 27? If there are no available flights for those dates, please indicate that in your answer\r","web":""}
{"id":"jal_61","category":"flights","ques":"What meal options are available in premium economy on Japan Airlines from Dallas/Fort Worth to Singapore leaving on April 23 returning May 3? If there are no available flights for those dates, please indicate that in your answer\r","web":""}
{"id":"cathaypacific_59","category":"flights","ques":"How much would it cost to upgrade from economy to business class on Cathay Pacific from Manila to Hong Kong November 17 - December 12? If there are no available flights for those dates, please indicate that in your answer\r","web":""}
{"id":"alitalia_37","category":"flights","ques":"What are the flight duration and number of daily flights with ITA from Rome to Naples leaving on February 23 returning March 18? If there are no available flights for those dates, please indicate that in your answer\r","web":""}
{"id":"jetstar_22","category":"flights","ques":"What is the cancellation and change fee policy for Jetstar from Darwin to Adelaide in a month for a two week trip? If there are no available flights for those dates, please indicate that in your answer\r","web":""}
{"id":"alaskaair_6","category":"flights","ques":"How many exit row seats are still available on Alaska Airlines flights from Seattle, WA to Honolulu, HI 11/29/2025 - 12/03/2025? If there are no available flights for those dates, please indicate that in your answer\r","web":""}
{"id":"easyjet_87","category":"flights","ques":"What is the total cost including all fees and taxes for the cheapest EasyJet flight from Palma de Mallorca to Newcastle December 3 - December 23? If there are no available flights for those dates, please indicate that in your answer\r","web":""}
{"id":"jetstar_10","category":"flights","ques":"Does Jetstar offer any bundle deals or packages for flights from Adelaide to Sunshine Coast November 18 - November 25 round trip? If there are no available flights for those dates, please indicate that in your answer\r","web":""}
{"id":"singaporeair_9","category":"flights","ques":"Can you help me find just the flight numbers of a Singapore Airlines flight from London (LHR) to Sydney (SYD) via Singapore (SIN) leaving July 2 and coming back July 28? If there are no available flights for those dates, please indicate that in your answer\r","web":""}
{"id":"spirit_9","category":"flights","ques":"How much more expensive is a \"Big Front Seat\" compared to standard economy on Spirit Airlines from Houston to Los Angeles beginning March 5 till March 20? If there are no available flights for those dates, please indicate that in your answer\r","web":""}
{"id":"goindigo_52","category":"flights","ques":"How much are business class seats on IndiGo from Sharjah (SHJ) to Delhi (DEL) outbound on January 13 returning January 19, if available? If there are no available flights for those dates or business class is not available, please indicate that in your answer\r","web":""}
{"id":"thaiairways_13","category":"flights","ques":"Book a flight with Thai Airways from Bangkok, Thailand to Singapore. outbound on November 19 returning December 4. If there are no available flights for those dates or the booking is not possible, please indicate that in your answer\r","web":""}
{"id":"vueling_15","category":"flights","ques":"Book a flight with Vueling from Birmingham, UK to Barcelona, Spain departing November 28 and returning December 16. If there are no available flights for those dates or the booking is not possible, please indicate that in your answer\r","web":""}
{"id":"turkishairlines_11","category":"flights","ques":"Book a round-trip flight with Turkish Airlines from Istanbul Airport (IST) to John F. Kennedy International Airport (JFK) for a two week trip starting the upcoming Saturday. If there are no available flights for those dates or the booking is not possible, please indicate that in your answer\r","web":""}
{"id":"airasia_50","category":"flights","ques":"Book a flight with AirAsia from Hong Kong to Manila leaving December 2 and coming back December 8. If there are no available flights for those dates or the booking is not possible, please indicate that in your answer\r","web":""}
{"id":"britishairways_11","category":"flights","ques":"Book a round-trip flight with British Airways from Manchester Airport to London Heathrow from the upcoming Friday for four days. If there are no available flights for those dates or the booking is not possible, please indicate that in your answer\r","web":""}
{"id":"suncountry_2","category":"flights","ques":"Book a flight with Sun Country Airlines from Duluth, MN to Phoenix, AZ from January 17 to January 31. If there are no available flights for those dates or the booking is not possible, please indicate that in your answer\r","web":""}
{"id":"thaiairways_9","category":"flights","ques":"Book a flight with Thai Airways from Bangkok to London departing November 16 and returning November 26. If there are no available flights for those dates or the booking is not possible, please indicate that in your answer\r","web":""}
{"id":"lufthansa_39","category":"flights","ques":"Book a flight with Lufthansa from Frankfurt, Germany to Tel Aviv, Israel beginning November 18 till November 30. If there are no available flights for those dates or the booking is not possible, please indicate that in your answer\r","web":""}
{"id":"suncountry_9","category":"flights","ques":"Book a flight with Sun Country Airlines from Tampa, FL to Dallas, TX outbound on February 9 returning February 28. If there are no available flights for those dates or the booking is not possible, please indicate that in your answer\r","web":""}
{"id":"klm_9","category":"flights","ques":"Book a flight with KLM from Lagos, Nigeria to Frankfurt, Germany flying out 11/18/2025 → coming back 11/25/2025. If there are no available flights for those dates or the booking is not possible, please indicate that in your answer\r","web":""}
{"id":"jetstar_82","category":"flights","ques":"Book a flight with Jetstar from Brisbane to Perth from 03/20/2026 → 04/03/2026. If there are no available flights for those dates or the booking is not possible, please indicate that in your answer\r","web":""}
{"id":"aircanada_54","category":"flights","ques":"Book a flight with Air Canada from Vancouver to Penticton June 9 - July 4. If there are no available flights for those dates or the booking is not possible, please indicate that in your answer\r","web":""}
{"id":"southwest_18","category":"flights","ques":"Book a flight with Southwest Airlines from Portland, OR to Salt Lake City, UT flying out 05/15/2026 → coming back 05/17/2026. If there are no available flights for those dates or the booking is not possible, please indicate that in your answer\r","web":""}
{"id":"allegiantair_18","category":"flights","ques":"Book a flight with United Airlines from Houston to Newark, NJ February 11 - March 2. If there are no available flights for those dates or the booking is not possible, please indicate that in your answer\r","web":""}
{"id":"airasia_7","category":"flights","ques":"Book a round-trip flight with Delta from Boston, MA to San Francisco, CA outbound in the Saturday after next week. Make the round-trip be two weeks length. If there are no available flights for those dates or the booking is not possible, please indicate that in your answer\r","web":""}
{"id":"philippineairlines_45","category":"flights","ques":"Book a flight with Philippine Airlines from Manila to Singapore from November 16 to December 15. If there are no available flights for those dates or the booking is not possible, please indicate that in your answer\r","web":""}
{"id":"aircanada_27","category":"flights","ques":"Book a flight with Air Canada from Toronto, ON to New York City, NY leaving on December 10 returning January 7. If there are no available flights for those dates or the booking is not possible, please indicate that in your answer\r","web":""}
{"id":"singaporeair_41","category":"flights","ques":"Book a flight with Singapore Airlines from Singapore to Naha, Japan beginning February 10 till February 17. If there are no available flights for those dates or the booking is not possible, please indicate that in your answer\r","web":""}
{"id":"suncountry_12","category":"flights","ques":"Book a flight with Sun Country Airlines from San Francisco (SFO) to Minneapolis (MSP) December 18- January 3 round trip. If there are no available flights for those dates or the booking is not possible, please indicate that in your answer\r","web":""}
{"id":"lot_5","category":"flights","ques":"Book a flight with LOT Polish Airlines from Warsaw, Poland to New York City, USA March 25 - April 22 round trip. If there are no available flights for those dates or the booking is not possible, please indicate that in your answer\r","web":""}
{"id":"allegiantair_53","category":"flights","ques":"Book a flight with Allegiant Air from Asheville, NC to Boston, MA leaving on November 22 returning December 12. If there are no available flights for those dates or the booking is not possible, please indicate that in your answer\r","web":""}
{"id":"spirit_5","category":"flights","ques":"Book a Spirit Airlines flight from BWI airport to Newark Liberty International Airport (EWR) beginning May 2 till June 2. If there are no available flights for those dates or the booking is not possible, please indicate that in your answer\r","web":""}
{"id":"malaysiaairlines_95","category":"flights","ques":"Book a flight with Malaysia Airlines from Kuala Lumpur to Kathmandu outbound on March 4 returning March 21. If there are no available flights for those dates or the booking is not possible, please indicate that in your answer\r","web":""}
{"id":"swiss_48","category":"flights","ques":"Book a Swiss Airlines flight to Mumbai from Zurich outbound on November 22 returning December 12. If there are no available flights for those dates or the booking is not possible, please indicate that in your answer\r","web":""}
{"id":"iberia_41","category":"flights","ques":"Book a flight for two people with Iberia from Madrid, Spain to Santiago, Chile beginning July 17 till August 11. If there are no available flights for those dates or the booking is not possible, please indicate that in your answer\r","web":""}
{"id":"vueling_28","category":"flights","ques":"Book a flight with Vueling from London to Asturias Airport (OVD) from May 22 to  June 17. If there are no available flights for those dates or the booking is not possible, please indicate that in your answer\r","web":""}
{"id":"ana_22","category":"flights","ques":"Book a flight with ANA from Singapore to Fukuoka March 24 - March 27. If there are no available flights for those dates or the booking is not possible, please indicate that in your answer\r","web":""}
{"id":"thaiairways_11","category":"flights","ques":"Book a flight with Thai Airways from Thailand to Sydney, Australia from November 16 through December 11. If there are no available flights for those dates or the booking is not possible, please indicate that in your answer\r","web":""}
{"id":"wizzair_96","category":"flights","ques":"Book a flight with Wizz Air from Larnaca, Cyprus to Athens, Greece outbound on February 9 returning February 21. If there are no available flights for those dates or the booking is not possible, please indicate that in your answer\r","web":""}
{"id":"jetstar_66","category":"flights","ques":"Book a cheap flight with Jetstar from Sydney to Hobart outbound on December 20 returning January 6. If there are no available flights for those dates or the booking is not possible, please indicate that in your answer\r","web":""}
{"id":"klm_21","category":"flights","ques":"Book a flight with KLM from Geneva, Switzerland to Osaka, Japan from 11/22/2025 → 11/28/2025. If there are no available flights for those dates or the booking is not possible, please indicate that in your answer\r","web":""}
{"id":"iberia_27","category":"flights","ques":"Book a flight with Iberia from Alicante to Funchal leaving on March 11 returning March 25. If there are no available flights for those dates or the booking is not possible, please indicate that in your answer\r","web":""}
{"id":"koreanair_0","category":"flights","ques":"Book a cheap flight with Korean Air from Los Angeles, CA to Seoul, South Korea from November 30 to December 30. If there are no available flights for those dates or the booking is not possible, please indicate that in your answer\r","web":""}
{"id":"thaiairways_18","category":"flights","ques":"Book a VTL flight with Thai Airways from Bangkok to Singapore leaving on May 1 returning May 21. If there are no available flights for those dates or the booking is not possible, please indicate that in your answer\r","web":""}
{"id":"jetblue_48","category":"flights","ques":"Book a flight with JetBlue from Orlando, FL to Denver, CO from December 19 through January12. If there are no available flights for those dates or the booking is not possible, please indicate that in your answer\r","web":""}
{"id":"goindigo_24","category":"flights","ques":"Book a flight with IndiGo from Bhubaneswar (BBSR) to Delhi (DEL) from February 20 to March 3. If there are no available flights for those dates or the booking is not possible, please indicate that in your answer\r","web":""}
{"id":"aerlingus_93","category":"flights","ques":"Book a direct flight with Aer Lingus from Dublin to Orlando outbound on December 7 returning December 22. If there are no available flights for those dates or the booking is not possible, please indicate that in your answer\r","web":""}
{"id":"samsung_9702","category":"shopping_head","ques":"I want to buy the Samsung Galaxy Tab S11+ 256GB Wi-Fi from Samsung.\r","web":""}
{"id":"amazon_8235","category":"shopping_head","ques":"Can you help me purchase the Electrosport ESR 150 from Amazon?\r","web":""}
{"id":"amazon_9969","category":"shopping_head","ques":"I'm looking to buy Disney Grumpy stuffed plush toy from Amazon.\r","web":""}
{"id":"underarmour_6889","category":"shopping_head","ques":"I need to purchase Under Armour Men's Project Rock BSR size 8 training shoes from Under Armour.\r","web":""}
{"id":"publix_9146","category":"shopping_head","ques":"Could you help me order Febreze Air Freshener from publix for delivery (use 32204 zip code for the store)?\r","web":""}
{"id":"rockauto_4460","category":"shopping_head","ques":"I'd like to get an E450 parking brake rotor and brake pad kit from RockAuto.\r","web":""}
{"id":"underarmour_3963","category":"shopping_head","ques":"Can you order Under Armour kids' lunch boxes from Under Armour for me?\r","web":""}
{"id":"rockauto_6656","category":"shopping_head","ques":"Help me buy a radiator for a 1995 Ford F-350 Powerstroke 7.3 from RockAuto.\r","web":""}
{"id":"hobbylobby_351","category":"shopping_head","ques":"I'm trying to purchase 1/4-inch square hardwood dowels from Hobby Lobby.\r","web":""}
{"id":"overstock_8717","category":"shopping_head","ques":"I want to order a wall-hung bathroom sink (14\" x 12\") from Overstock.\r","web":""}
{"id":"publix_2256","category":"shopping_head","ques":"Can you help me buy a pack of organic broccoli florets from publix for delivery? (use 32204 zip code for the store)\r","web":""}
{"id":"amazon_1934","category":"shopping_head","ques":"I need to get The Witches movie (widescreen edition) from Amazon.\r","web":""}
{"id":"bestbuy_5569","category":"shopping_head","ques":"I'm looking for a refrigerator with a built-in water dispenser from Best Buy.\r","web":""}
{"id":"ebay_1007","category":"shopping_head","ques":"I'd like to purchase the Ninco BMW Amprex from eBay.\r","web":""}
{"id":"sears_4887","category":"shopping_head","ques":"Can you help me order a 30-inch Café induction cooktop on sale from Sears?\r","web":""}
{"id":"ebay_8268","category":"shopping_head","ques":"I want to buy a 1939 issue of Adventure magazine from eBay.\r","web":""}
{"id":"bestbuy_8406","category":"shopping_head","ques":"I need to order a 20-foot printer cable from Best Buy.\r","web":""}
{"id":"westelm_7538","category":"shopping_head","ques":"I'm looking to get a green rug of size 8'x10' or something close from West Elm.\r","web":""}
{"id":"amazon_7859","category":"shopping_head","ques":"Could you help me buy Storm Fury Book 1 from Amazon?\r","web":""}
{"id":"rei_4150","category":"shopping_head","ques":"I want to purchase the Currex Insole M size from REI.\r","web":""}
{"id":"ikea_4872","category":"shopping_head","ques":"I'm looking for the cheapest queen size mattress from Ikea\r","web":""}
{"id":"gap_3164","category":"shopping_head","ques":"I need to buy white Modern V-Neck T-Shirt m size from Gap\r","web":""}
{"id":"sears_6088","category":"shopping_head","ques":"Can you help me get the cheapest 18 cu ft freezer from Sears?\r","web":""}
{"id":"homedepot_7304","category":"shopping_head","ques":"Purchase the DeWalt Atomic Sawzall from Home Depot.\r","web":""}
{"id":"amazon_4045","category":"shopping_head","ques":"Purchase the book \"El vuelo de una abeja\" from Amazon.\r","web":""}
{"id":"amazon_970","category":"shopping_head","ques":"Purchase 20 disposable plastic bowls on amazon\r","web":""}
{"id":"hobbylobby_299","category":"shopping_head","ques":"Buy some metal cake stand from Hobby Lobby\r","web":""}
{"id":"zappos_9900","category":"shopping_head","ques":"Purchase navy Clarks shoes for women size 8 from Zappos.\r","web":""}
{"id":"publix_4839","category":"shopping_head","ques":"Buy a Jimmy Dean pork sausages from Publix for delivery (use 32204 zip code for the store).\r","web":""}
{"id":"overstock_9388","category":"shopping_head","ques":"Purchase Steve Madden tall women's boots 9 size\r","web":""}
{"id":"underarmour_7483","category":"shopping_head","ques":"Purchase the Under Armour mens beanie from Under Armour.\r","web":""}
{"id":"potterybarn_7344","category":"shopping_head","ques":"Purchase a light color around 90' long Chesterfield-style sectional sofa from Pottery Barn.\r","web":""}
{"id":"potterybarn_1237    ","category":"shopping_head","ques":"Help me purchase a rectangular drop leaf dining table from Pottery Barn that's at least 54\" long.\r","web":""}
{"id":"kohls_8946","category":"shopping_head","ques":"Purchase pink Skechers girls’ slip-on shoes size 13 from Kohl’s.\r","web":""}
{"id":"rockauto_1225","category":"shopping_head","ques":"Purchase intake coolant hoses (molded, silicone) from RockAuto.\r","web":""}
{"id":"wholefoodsmarket_5324","category":"shopping_head","ques":"Purchase 6 fcans of zero-sugar cola from Whole Foods Market.\r","web":""}
{"id":"overstock_9756","category":"shopping_head","ques":"Purchase ~20\" wide by ~30\" high medicine cabinets from Overstock.\r","web":""}
{"id":"amazon_1230","category":"shopping_head","ques":"Purchase configuration of RT81 Turntable with AT95E Cartridge (no more than 350$ configuration) from Amazon\r","web":""}
{"id":"lowes_8758","category":"shopping_head","ques":"Purchase a cotoneaster plant from Lowe's\r","web":""}
{"id":"ikea_2219","category":"shopping_head","ques":"Purchase a hammock chair with stand from IKEA.\r","web":""}
{"id":"westelm_19","category":"shopping_head","ques":"Purchase the Gemini Bed from West Elm.\r","web":""}
{"id":"target_4231","category":"shopping_head","ques":"Purchase 12 cups of Snack Pack sugar-free pudding from Target.\r","web":""}
{"id":"sears_4759","category":"shopping_head","ques":"Purchase Lush Decor Bohemian Stripe window curtains in turquoise and orange from Sears.\r","web":""}
{"id":"ulta_1473","category":"shopping_head","ques":"Purchase the Dashing Dive Glaze Starter Kit from Ulta.\r","web":""}
{"id":"overstock_2959","category":"shopping_head","ques":"Purchase a cheapest Costway dog bed from Overstock with shipping to Canada.\r","web":""}
{"id":"underarmour_784","category":"shopping_head","ques":"Purchase the Under Armour Men's UA Base 4 long sleeve M size from Under Armour.\r","web":""}
{"id":"wholefoodsmarket_4455","category":"shopping_head","ques":"Purchase 4 bottles of Belvoir Lemonade from Whole Foods.\r","web":""}
{"id":"lowes_6063","category":"shopping_head","ques":"Purchase 4 tier chrome shelving from Lowe’s approximately 35 inches width and 50 inches height.\r","web":""}
{"id":"target_6682","category":"shopping_head","ques":"Purchase Aveeno sunscreen lotion with 60 spf from Target.\r","web":""}
{"id":"michaels_2250","category":"shopping_head","ques":"Purchase baby fabric sold by the half yard from Michaels.\r","web":""}
{"id":"publix_8722","category":"shopping_head","ques":"Have Publix deliver Heinz Apple Cider Vinegar (use 32204 zip code for the store).\r","web":""}
{"id":"crateandbarrel_2072","category":"shopping_head","ques":"Purchase a ceramic photo frame from Crate & Barrel.\r","web":""}
{"id":"nordstrom_5374","category":"shopping_head","ques":"Purchase women's full-length leather coat S size less than 200$ from Nordstrom.\r","web":""}
{"id":"publix_3096","category":"shopping_head","ques":"Find prepared pasta salads from publix for delivery (use 32204 zip code for the store).\r","web":""}
{"id":"petsmart_5650","category":"shopping_head","ques":"Purchase a 20-gallon fish tank from PetSmart.\r","web":""}
{"id":"kohls_7716","category":"shopping_head","ques":"Purchase a Starter Pittsburgh Steelers hoodie from Kohl's.\r","web":""}
{"id":"eventbrite_tickets_book_93","category":"things_to_do","ques":"Submit a request form to book a tasting tour at St. Michaels Winery in maryland (but don't hit \"send\"). Then give me their phone number to confirm.\r","web":""}
{"id":"eventbrite_tickets_book_97","category":"things_to_do","ques":"Book tickets for the next murder mystery dinner event for me and my wife in Ocala, Florida and tell me the total price\r","web":""}
{"id":"eventbrite_tickets_book_110","category":"things_to_do","ques":"What is the next recreational event (like cherry blossom festival) coming up on the City of Monterey Park, California municipal calendar?\r","web":""}
{"id":"tripadvisor_find_128","category":"things_to_do","ques":"Find 2 ziplining places in Maryland, and provide their addresses. Which is closer to Baltimore?\r","web":""}
{"id":"tripadvisor_find_162","category":"things_to_do","ques":"Find a deep sea fishing tour option on Viator in Moorea, Society Islands and give me the total cost and start time of the tour\r","web":""}
{"id":"eventbrite_tickets_book_126","category":"things_to_do","ques":"Find the next board of commissioners meeting for the city of Covington, Kentucky and tell me where I can livestream it at\r","web":""}
{"id":"alltrails_plan_a_trip_13","category":"things_to_do","ques":"Buy a one day MONT BLANC MultiPass for hiking for the next available date and tell me the price, for one adult\r","web":""}
{"id":"alltrails_find_243","category":"things_to_do","ques":"What is the top rated hiking trail in Creekside Park, Salinas, California and provide details on the length and difficulty\r","web":""}
{"id":"eventbrite_tickets_book_92","category":"things_to_do","ques":"Register me for the turkey trot event coming up in Coppell, Texas, tell me how much it costs and when it is.\r","web":""}
{"id":"hipcamp_find_111","category":"things_to_do","ques":"I want to book a camping spot at Bridge Bay in Yellowstone for the next available slot; how much is the nightly rate?\r","web":""}
{"id":"tripadvisor_question_answering_148","category":"things_to_do","ques":"help me register for the new years day 5k in chesapeake city, MD on raceroster.com. Then tell me who is the event contact.\r","web":""}
{"id":"eventbrite_tickets_book_51","category":"things_to_do","ques":"help me plan a weekend going to events with my kids on discover baltimore county websites\r","web":""}
{"id":"tripadvisor_question_answering_185","category":"things_to_do","ques":"Write a review on tripadvisor giving the NCL excursion to Volcano Winery on the Island of Hawaii a 4 star review\r","web":""}
{"id":"sixflags_find_71","category":"things_to_do","ques":"What is the price of a military discount ticket for Six Flags at Darien Lake, New York and then try to book a ticket. Stop once I am asked to login to verify my military membership.\r","web":""}
{"id":"tripadvisor_recommend_158","category":"things_to_do","ques":"Reserve an airboat ride with more than 500 reviews in Kissimmee, Florida on tripadvisor\r","web":""}
{"id":"tripadvisor_general_activity_20","category":"things_to_do","ques":"Provide information on visiting historic sites in Camden, Maine, including one must-see landmark or site\r","web":""}
{"id":"disneyworld.disney.go_find_180","category":"things_to_do","ques":"Find out the opening hours and ticket prices for Disney's Animal Kingdom Theme Park in Orlando, Florida.\r","web":""}
{"id":"eventbrite_tickets_book_118","category":"things_to_do","ques":"book tickets for the next Greater Haitian-American Chamber of Commerce event near tampa, FL\r","web":""}
{"id":"alltrails_find_206","category":"things_to_do","ques":"What are the alerts, if any, for the petrified forest loop trail on alltrails.com\r","web":""}
{"id":"tripadvisor_recommend_9","category":"things_to_do","ques":"Submit a form to plan a safari trip in johannesburg  on jacadatravel.com for a family of 4 with 2 kids, including a private dinner with a budget of $15000\r","web":""}
{"id":"tripadvisor_find_153","category":"things_to_do","ques":"Buy tickets for the St. Petersburg Pirate Museum in Florida, and inform me of the visiting hours and total price for 2 adults.\r","web":""}
{"id":"metmuseum_find_24","category":"things_to_do","ques":"Buy tickets for the Met on the next available day, using 11201 as the zipcode for discounts and pay only the ticket price.\r","web":""}
{"id":"smithsonianmag_question_answering_24","category":"things_to_do","ques":"Find the oldest Nez Perce site on the Salmon River and then tell me what road I would take to get there from Cottonwood, ID\r","web":""}
{"id":"eventbrite_tickets_book_37","category":"things_to_do","ques":"Find and book a kayaking event in Winter Haven, Florida.\r","web":""}
{"id":"eventbrite_tickets_book_71","category":"things_to_do","ques":"what are the next three events happening at miami beach convention center\r","web":""}
{"id":"tripadvisor_find_286","category":"things_to_do","ques":"book tickets for the next dinner show at Pigeon Forge, Tennessee and tell me the price\r","web":""}
{"id":"eventbrite_tickets_book_109","category":"things_to_do","ques":"buy tickets for a sumo wrestling event in tokyo\r","web":""}
{"id":"eventbrite_tickets_book_66","category":"things_to_do","ques":"Book tickets for a murder mystery dinner in Chambersburg, Pennsylvania\r","web":""}
{"id":"sixflags_question_answering_79","category":"things_to_do","ques":"Find out operating hours and ticket prices for Six Flags New England\r","web":""}
{"id":"tripadvisor_general_activity_194","category":"things_to_do","ques":"Plan an airboat tour at Lake Trafford in Florida and check if alligator sightings are guaranteed\r","web":""}
{"id":"eventbrite_tickets_book_81","category":"things_to_do","ques":"tell me when daffodil day at the garden club of virginia is and add it to my calendar if you can\r","web":""}
{"id":"tripadvisor_find_250","category":"things_to_do","ques":"Locate and provide options for ziplining in Bavaria, Germany.\r","web":""}
{"id":"hipcamp_question_answering_4","category":"things_to_do","ques":"order a nonresident Annual Park Pass from new jersey state park service\r","web":""}
{"id":"alltrails_find_223","category":"things_to_do","ques":"Find the best hiking trails in Pendleton, Oregon and include details such as trail length and difficulty\r","web":""}
{"id":"eventbrite_tickets_book_102","category":"things_to_do","ques":"Find a cooking class in Bethesda, Maryland and book a session if available\r","web":""}
{"id":"eventbrite_tickets_book_174","category":"things_to_do","ques":"Find the price and availability for tours of Waverly Hills Sanatorium in Kentucky, and help me book tickets if possible.\r","web":""}
{"id":"disneyworld.disney.go_plan_a_trip_2","category":"things_to_do","ques":"Plan a visit to Disney World in Orlando, Florida, including ticket options and must-see attractions\r","web":""}
{"id":"sixflags_general_activity_11","category":"things_to_do","ques":"Check for opening hours and ticket prices for the Wild Safari at Six Flags in New Jersey\r","web":""}
{"id":"eventbrite_tickets_book_45","category":"things_to_do","ques":"what are the upcoming events at pershing square, LA on bandsintown websites\r","web":""}
{"id":"eventbrite_recommend_220","category":"things_to_do","ques":"What free events or activities are happening in Ithaca, New York this weekend?\r","web":""}
{"id":"alltrails_find_232","category":"things_to_do","ques":"buy a backcountry permit for Thunder River and Deer Creek trail at the grand canyon, or tell me when I can apply if not available.\r","web":""}
{"id":"metmuseum_question_answering_49","category":"things_to_do","ques":"What are the current exhibits at the Metropolitan Museum of Art in New York City, New York?\r","web":""}
{"id":"eventbrite_tickets_book_95","category":"things_to_do","ques":"tell me the date and time of the next event at Fort Gibson historic site in Oklahoma, and what to expect at the event.\r","web":""}
{"id":"eventbrite_tickets_book_1","category":"things_to_do","ques":"sign up for a family membership for the oklahoma historical society\r","web":""}
{"id":"sixflags_general_activity_16","category":"things_to_do","ques":"buy a season pass to hurricane harbor in arlington tx and tell me the price\r","web":""}
{"id":"tiqets_tickets_book_4","category":"things_to_do","ques":"purchase tickets to the Azulejo Tile Museum directly from their website\r","web":""}
{"id":"trailforks_question_answering_3","category":"things_to_do","ques":"Check the current conditions of the Lake Eiler Trail and report any closures or hazards.\r","web":""}
{"id":"eventbrite_tickets_book_136","category":"things_to_do","ques":"buy tickets for the next upcoming Edgar Allan Poe speakeasy event (in whichever city)\r","web":""}
{"id":"alltrails_find_282","category":"things_to_do","ques":"Find the top 3 hiking trails in Pike National Forest and provide a table detailing their difficulty level, number of reviews, and length in miles.\r","web":""}
{"id":"eventbrite_tickets_book_112","category":"things_to_do","ques":"Book tickets for the underground NYC tour known as 'Empire Beneath the Streets' in New York City, New York\r","web":""}
{"id":"recreation.gov_question_answering_26","category":"things_to_do","ques":"Find the hours of operation and available activities at Colter Bay Visitor Center in Wyoming.\r","web":""}
{"id":"tripadvisor_recommend_275","category":"things_to_do","ques":"Recommend activities or attractions to visit near Yankee Stadium in Bronx, New York before a Yankee game\r","web":""}
{"id":"tripadvisor_find_101","category":"things_to_do","ques":"buy tickets for family of 4 (2 kids) at the denver museum of nature and science\r","web":""}
{"id":"tripadvisor_question_answering_278","category":"things_to_do","ques":"which time slot in the next upcoming Saturday has the most availability at the denver museum of nature and science\r","web":""}
{"id":"tripadvisor_find_190","category":"things_to_do","ques":"book a ziplining tour at fox fire adventure park in Sevierville, TN\r","web":""}
{"id":"hipcamp_recommend_5","category":"things_to_do","ques":"What are the best camping parks in Languedoc-Roussillon, France, and what amenities do they offer?\r","web":""}
{"id":"eventbrite_tickets_book_77","category":"things_to_do","ques":"buy 1 colorado resident and another non-resident ticket to the denver art museum on the next available Tuesday\r","web":""}
{"id":"tripadvisor_plan_a_trip_118","category":"things_to_do","ques":"buy tickets for a tour of teatro colon and then dinner/tango show in La Ventana, Buenos Aires\r","web":""}
{"id":"eventbrite_tickets_book_83","category":"things_to_do","ques":"buy tickets to the next wine festival anywhere in the US -- I really need more wine\r","web":""}
{"id":"tripadvisor_plan_a_trip_162","category":"things_to_do","ques":"Plan a road trip itinerary with interesting places to stop between Glacier National Park and Red Lodge, Montana\r","web":""}
{"id":"eventbrite_find_40","category":"things_to_do","ques":"rsvp to an event involving food at visitlakegeneva.com\r","web":""}
{"id":"eventbrite_tickets_book_128","category":"things_to_do","ques":"buy tickets for the next weekend show at the Barrymore Theatre in Fort Lee, New Jersey\r","web":""}
{"id":"tiqets_tickets_book_9","category":"things_to_do","ques":"buy next available tickets for La Lonja de la Seda in Valencia, Spain\r","web":""}
{"id":"eventbrite_tickets_book_2","category":"things_to_do","ques":"book tickets for the next event in Grapevine, TX on eventbrite so I can plan my weekend\r","web":""}
{"id":"tripadvisor_plan_a_trip_226","category":"things_to_do","ques":"Help me plan a trip with recommendations for hotels, day tours, and attractions in Palawan, Philippines\r","web":""}
{"id":"eventbrite_tickets_book_170","category":"things_to_do","ques":"book tickets to visit the chrysler building observation deck in NYC\r","web":""}
{"id":"tiqets_tickets_book_15","category":"things_to_do","ques":"book tickets to the Pinacoteca di Brera in Milan, Italy on their official site\r","web":""}
{"id":"alltrails_find_23","category":"things_to_do","ques":"Identify the best waterfalls to see while hiking in the Superstition Mountains, Arizona\r","web":""}
{"id":"sixflags_find_48","category":"things_to_do","ques":"Find the operational hours and entry prices for Sky Harbor Waterpark in Phoenix, Arizona\r","web":""}
{"id":"hipcamp_find_90","category":"things_to_do","ques":"Locate the available campgrounds near Little Bighorn Battlefield National Monument in Montana and provide details about the amenities they offer.\r","web":""}
{"id":"eventbrite_tickets_book_57","category":"things_to_do","ques":"which day in the upcoming month is cheapest to buy admission tickets to chicago botanic garden and what is the price?\r","web":""}
{"id":"eventbrite_tickets_book_73","category":"things_to_do","ques":"register for the next open house at the NY campus of the culinary institute of america\r","web":""}
{"id":"disneyworld.disney.go_question_answering_147","category":"things_to_do","ques":"when is the next available day to schedule a divequest at sea base aquarium at epcot and what is the price? Then proceed to book.\r","web":""}
{"id":"eventbrite_tickets_book_67","category":"things_to_do","ques":"sign up for a guided tour at the Leland Stanford mansion for the next available Saturday\r","web":""}
{"id":"tiqets_tickets_book_5","category":"things_to_do","ques":"purchase a ticket to visit the Odeon of Herodes Atticus in Athens, Greece\r","web":""}
{"id":"eventbrite_tickets_book_76","category":"things_to_do","ques":"book tickets to the next event at the African-American Research Library and Cultural Center, Ft lauderdale FL\r","web":""}
{"id":"alltrails_find_237","category":"things_to_do","ques":"Find the starting point and trail length for hiking Mount Oxford in New Zealand\r","web":""}
{"id":"tripadvisor_find_41","category":"things_to_do","ques":"Find 2 museums located in Iowa City, Iowa, and provide the addresses or websites for them.\r","web":""}
{"id":"eventbrite_tickets_book_74","category":"things_to_do","ques":"Find and book tickets to a dinner show happening this weekend in Memphis, Tennessee\r","web":""}
{"id":"eventbrite_find_279","category":"things_to_do","ques":"Find upcoming Indian or Hindu festivals taking place in Pittsburgh, Pennsylvania and provide details about the events.\r","web":""}
{"id":"mgmgrand.mgmresorts_1","category":"hotels_head","ques":"I need to reserve a room at MGM Grand in Las Vegas, Nevada, this weekend at mgmgrand.mgmresorts.com checking in November 27 until December 9. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"kayak_256","category":"hotels_head","ques":"What's the cheapest room price at Red Roof Inn in St. Louis, Missouri with kayak.com staying from November 23 to December 4? If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"caesars_313","category":"hotels_head","ques":"Can you help me book a stay at Harrah's Cherokee in Cherokee, North Carolina using caesars.com 11/25/2025 - 11/27/2025? If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"holidayinnclub_211","category":"hotels_head","ques":"How many rooms are available at Holiday Inn Club Scottsdale in Scottsdale, Arizona using holidayinnclub.com from December 6 through December 19? If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"hilton_248","category":"hotels_head","ques":"I'm looking to get a room at DoubleTree by Hilton Rapid City Downtown Convention Center in Rapid City, South Dakota using hilton.com staying from December 17 to December 30. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"airbnb_437","category":"hotels_head","ques":"What do the taxes and fees amount to for a stay at Bella's House from Twilight in St. Helens, Oregon through airbnb.com 11/13/2025 - 11/25/2025? If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"orbitz_8","category":"hotels_head","ques":"I'd like to reserve a room at Legoland Hotel in Carlsbad, California using orbitz.com checking in November 19 - November 21. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"resortsandlodges_43","category":"hotels_head","ques":"Can you help me find a pet-friendly resort in New Jersey for my vacation at resortsandlodges.com from December 18 to January 1? If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"hotels_131","category":"hotels_head","ques":"What's the price for the cheapest hotel in Edisto Beach, South Carolina at hotels.com 12/18/2025 - 12/28/2025? If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"uniquehotels.me_13","category":"hotels_head","ques":"I'm trying to book a unique accommodation in Havelock North, New Zealand through uniquehotels.me from 11/17/2025 → 11/19/2025. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"tripadvisor_347","category":"hotels_head","ques":"How many hotels are available near the Grand Canyon in Las Vegas, Nevada through tripadvisor.com February 3 checking out February 8? If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"choicehotels_52","category":"hotels_head","ques":"I need to get a room at Clarion Inn in Idaho Falls, Idaho with choicehotels.com from January 18 through January 31. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"choicehotels_25","category":"hotels_head","ques":"What are the total taxes and fees for a room at Radisson Resort in Miami Beach, Florida at choicehotels.com January 8 checking out January 13? If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"motel6_76","category":"hotels_head","ques":"Can you book me a room at Motel 6 in Lenexa, Kansas with motel6.com November 26 - November 30? If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"hostelworld_27","category":"hotels_head","ques":"I'm looking for a cheap hostel in Mykonos, Greece through hostelworld.com checking in on November 24 and leaving December 6. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"holidayinnclub_103","category":"hotels_head","ques":"Help me reserve a room at Orange Lake Resort by Holiday Inn in Kissimmee, Florida with holidayinnclub.com from December 11 to December 15. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"hilton_150","category":"hotels_head","ques":"What's the cheapest available room at Hampton Inn and Suites Albany in Albany, Georgia at hilton.com from 12/10/2025 → 12/15/2025? If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"agoda_121","category":"hotels_head","ques":"I want to book a room at SO Sofitel Hua Hin in Hua Hin, Cha-Am, Thailand on Agoda using agoda.com checking in on December 18 and leaving December 23. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"travelocity_36","category":"hotels_head","ques":"How many rooms are still available in Lauderdale-by-the-Sea, Florida using travelocity.com February 4 checking out February 11? If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"oyster_72","category":"hotels_head","ques":"I'd like to get a 2-bedroom suite at Ocean Lodge in St. Simons Island using oyster.com checking in January 4 - January 15. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"vrbo_282","category":"hotels_head","ques":"What do the total fees and taxes come to for Harbor House in Treasure Island, Florida through vrbo.com from December 14 to December 16? If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"motel6_83","category":"hotels_head","ques":"Book a room at Motel 6 in Shartlesville, Pennsylvania through motel6.com December 12 checking out December 16.. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"ihg_11","category":"hotels_head","ques":"Book a hotel in Green River, Utah at ihg.com January 5 checking out January 17.. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"marriott_20","category":"hotels_head","ques":"Book a room at Gaylord Opryland Resort and Convention Center in Nashville, Tennessee with marriott.com from 01/13/2025 → 01/15/2025.. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"bestwestern_370","category":"hotels_head","ques":"Book a room at Best Western Wapakoneta Inn in Wapakoneta, Ohio using bestwestern.com staying from December 18 to December 22.. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"bluegreenvacations_23","category":"hotels_head","ques":"Book a room at Bluegreen at Tradewinds in Florida with bluegreenvacations.com from December 3 through December 5.. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"marriott_490","category":"hotels_head","ques":"Book a room at Courtyard by Marriott Anchorage Airport in Anchorage, Alaska at marriott.com checking in on January 25 and leaving January 31.. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"hyattinclusivecollection_265","category":"hotels_head","ques":"Book a room at Dreams Onyx Resort & Spa - All Inclusive in the Dominican Republic with hyattinclusivecollection.com checking in December 16, checking out December 27.. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"premierinn_26","category":"hotels_head","ques":"Book a Premier Inn hotel Edinburgh City Centre in Scotland using premierinn.com checking in December 3, checking out December 8.. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"planethollywoodhotels_25","category":"hotels_head","ques":"Book a room at Planet Hollywood Cancun Resort with Star Class in Cancun, Mexico at planethollywoodhotels.com from December 19 through December 24.. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"motel6_32","category":"hotels_head","ques":"Book a room at Motel 6 in Branford, Connecticut using motel6.com staying from November 25 to November 29.. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"druryhotels_224","category":"hotels_head","ques":"Book a room at Drury Inn and Suites Columbus Polaris in Columbus, Ohio at druryhotels.com from February 9 through February 22.. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"hyatt_305","category":"hotels_head","ques":"Book a room at Hyatt Regency Hotel at Orlando International Airport in Orlando, Florida through hyatt.com from 12/06/2025 → 12/19/2025.. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"bestwestern_409","category":"hotels_head","ques":"Book a room at Best Western Plus Capitola By-the-Sea Inn & Suites in Capitola, California using bestwestern.com checking in on January 23 and leaving January 25.. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"airbnb_192","category":"hotels_head","ques":"Book a place to stay in Plainfield Township, Michigan with airbnb.com checking in December 12 until December 16.. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"hyatt_115","category":"hotels_head","ques":"Book a room at Hyatt Vacation Club at the Ranahan in Colorado with hyatt.com checking in January 15 - January 25.. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"motel6_59","category":"hotels_head","ques":"Book a room at Motel 6 in Harrisburg, Pennsylvania with motel6.com checking in December 4, checking out December 16.. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"hiltongrandvacations_128","category":"hotels_head","ques":"Book a room at Hilton Grand Vacations in South Lake Tahoe, California through hiltongrandvacations.com arriving 11/20/2025 to 11/25/2025.. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"ihg_236","category":"hotels_head","ques":"Book a room at Holiday Inn in Toronto, Ontario, Canada at ihg.com checking in on February 14 and leaving February 16.. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"tripadvisor_280","category":"hotels_head","ques":"Book a hotel in Concord, New Hampshire using tripadvisor.com checking in November 19 - November 27.. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"hilton_312","category":"hotels_head","ques":"Book a room at Homewood Suites in Wallingford, Connecticut with hilton.com checking in January 9 - January 13.. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"marriott-hotels.marriott_9","category":"hotels_head","ques":"Book a Marriott hotel with a lounge in Orlando, Florida at marriott-hotels.marriott.com November 19 checking out November 29.. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"sandals_14","category":"hotels_head","ques":"Book an all-inclusive stay at Sandals Turks and Caicos through sandals.com staying from Jan 27 to Feb 4.. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"kempinski_30","category":"hotels_head","ques":"Book a room at Kempinski Budapest Hotel in Budapest, Hungary at kempinski.com from November 29 through December 6.. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"caesars_162","category":"hotels_head","ques":"Book a room at Harrah's Lake Tahoe in Lake Tahoe, Nevada through caesars.com February 6 checking out on the 13.. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"bestwestern_354","category":"hotels_head","ques":"Book a room at Best Western Venice Mestre Hotel in Mestre, Italy through bestwestern.com checking in January 17, checking out January 30.. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"airbnb_161","category":"hotels_head","ques":"Book a bed and breakfast in Leadville, Colorado using airbnb.com January 4 - January 15.. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"bluegreenvacations_66","category":"hotels_head","ques":"Book a stay at Bluegreen Odyssey Dells in Wisconsin Dells, Wisconsin through bluegreenvacations.com checking in February 11 until February 22.. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"bestwestern_467","category":"hotels_head","ques":"Book a room at SureStay by Best Western Glendive Yellowstone River in Glendive, Montana with bestwestern.com from November 22 to November 27.. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"holidayinnclub_277","category":"hotels_head","ques":"Book a stay at Holiday Inn Vacation Club Orange Lake Resort in Orlando, Florida using holidayinnclub.com December 12 checking out December 18.. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"hilton_262","category":"hotels_head","ques":"Book a room at Home2 Suites by Hilton in St. Louis, Missouri using hilton.com December 13 - December 20.. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"hyatt_335","category":"hotels_head","ques":"Book a room at Hyatt Place Pasadena in California at hyatt.com checking in December 22, checking out December 27.. If the hotel doesn't take reservations for that date or there are no available rooms for that time, please indicate that in your answer\r","web":""}
{"id":"gardenofeatn_1","category":"restaurants_tail","ques":"Find some vegan options at Garden of Eatin in Sacramento, CA.\r","web":""}
{"id":"eatleven_2","category":"restaurants_tail","ques":"Find me a deli in Downtown Denver and its most meat-filled option at the deli.\r","web":""}
{"id":"thekafeneo_1","category":"restaurants_tail","ques":"Find a vegetarian item on the menu for Kafe Neo in Bainbridge\r","web":""}
{"id":"indytoday.6amcity_8","category":"restaurants_tail","ques":"Book a reservation at Yazsh Cafe and Bistro in Indianapolis on Thursday for brunch time.. If the restaurant doesn't take reservations or it is unavailable for that time, please indicate that in your answer\r","web":""}
{"id":"antioch.eatatanastasias_1","category":"restaurants_tail","ques":"Book a reservation for two at Anastasia Restaurant in Antioch on November 20 at 11:15 AM.. If the restaurant doesn't take reservations or it is unavailable for that time, please indicate that in your answer\r","web":""}
{"id":"queensyardnyc_1","category":"restaurants_tail","ques":"Book a reservation at Rose Room in New York at 10 PM. If it doesn't take reservations or is unavailable for that time, please indicate that in your answer\r","web":""}
{"id":"ronskenosha_1","category":"restaurants_tail","ques":"Book a reservation at Ron's Place in Kenosha for the soonest available time.. If the restaurant doesn't take reservations or it is unavailable for that time, please indicate that in your answer\r","web":""}
{"id":"portofinoutica_1","category":"restaurants_tail","ques":"Book a brunch reservationfor three at 11 AM on the upcoming Sunday for Mother's Day at Portofino in Utica, NY. If the restaurant doesn't take reservations or it is unavailable for that time, please indicate that in your answer\r","web":""}
{"id":"ophchicagoland_2","category":"restaurants_tail","ques":"What are some famous pancakes on the menu at The Original Pancake House in Hyde Park.\r","web":""}
{"id":"firebowlcafe_1","category":"restaurants_tail","ques":"What are the cheapest rice/noodle dishes featuring meat at Fire Bowl Cafe in McKinney, TX?\r","web":""}
{"id":"theshopsatcolumbuscircle_1","category":"restaurants_tail","ques":"Book a reservation at a restaurant in Time Warner Center at 7 pm on 11/30/25. If the restaurant doesn't take reservations or it is unavailable for that time, please indicate that in your answer\r","web":""}
{"id":"gillhouseny_2","category":"restaurants_tail","ques":"What specials do they have featured at Gill House in Henderson Harbor, NY.\r","web":""}
{"id":"greatwoksecaucus_1","category":"restaurants_tail","ques":"Do they have any spicy beef or chicken dishes available for takeout at Great Wok in Secaucus, NJ\r","web":""}
{"id":"mauihawaii_3","category":"restaurants_tail","ques":"Book a reservation at a restaurant in Lahaina, Maui for the earliest available reservation this week.. If the restaurant doesn't take reservations or it is unavailable for that time, please indicate that in your answer\r","web":""}
{"id":"brunchpubcenterville_2","category":"restaurants_tail","ques":"Book a reservation at The Brunch Pub in Centerville for the upcoming Friday at 7 pm. If the restaurant doesn't take reservations or it is unavailable for that time, please indicate that in your answer\r","web":""}
{"id":"aubergeresorts_8","category":"restaurants_tail","ques":"Book a reservation at The Conservatory Restaurant in Newport for Novemeber 26 at 11:15 AM.. If the restaurant doesn't take reservations or it is unavailable for that time, please indicate that in your answer\r","web":""}
{"id":"reysolcoffee_1","category":"restaurants_tail","ques":"What is the most expensive dish on the menu for Rey Sol Coffee in Morristown, NJ\r","web":""}
{"id":"duffystavernlg_1","category":"restaurants_tail","ques":"What kinda chicken wings and drinks they got at Duffy's Tavern in Lake George.\r","web":""}
{"id":"restaurantsinsarasota_9","category":"restaurants_tail","ques":"Book a reservation at Gen Korean restaurant in UTC Mall, Sarasota, FL for Tuesday at 6:30 PM. If the restaurant doesn't take reservations or it is unavailable for that time, please indicate that in your answer\r","web":""}
{"id":"tallahasseetimes_1","category":"restaurants_tail","ques":"Book a reservation with outdoor setaing at a 347 Grille in Tallahassee, FL any day over the next three weeknds between 5:30 and 8 pm. Let them know that I have peanut allergies too. If the restaurant doesn't take reservations or it is unavailable for that time, please indicate that in your answer\r","web":""}
{"id":"ritual.co_4","category":"restaurants_tail","ques":"What is the most popular dish on the menu for Java Java Coffee on Fleet Street, London\r","web":""}
{"id":"brennanssportsbar_1","category":"restaurants_tail","ques":"Book a reservation at Brennan's Sports Bar in the Phoenix area on December 2 for the next free slot. If the restaurant doesn't take reservations or it is unavailable for that time, please indicate that in your answer\r","web":""}
{"id":"thecapitalburger_3","category":"restaurants_tail","ques":"Find a vegetarian item on the menu and prices for The Capital Burger in Washington, DC\r","web":""}
{"id":"carinos_2","category":"restaurants_tail","ques":"List some types of lasagna featured at Johnny Carino's in Downey, CA during lunchtime.\r","web":""}
{"id":"gazette_5","category":"restaurants_tail","ques":"What chicken dishes are available at  Masala Mingle Indian Bistro and Bar in Colorado Springs\r","web":""}
{"id":"bestnewyork.us_5","category":"restaurants_tail","ques":"In the upcoming Friday or Saturday, book a reservation for four people at Buffet House in Queens, NY.\r","web":""}
{"id":"mounthorebchamber_1","category":"restaurants_tail","ques":"Make a reservation for four people at Campo Di Bella in Mt Horeb, WI on Nov. 22. If the restaurant doesn't take reservations or it is unavailable for that time, please indicate that in your answer.\r","web":""}
{"id":"mallsinamerica_7","category":"restaurants_tail","ques":"Book a reservation at SkyDome restaurant for two in Pentagon Row for Novemeber 22nd at 6:00 PM.. If the restaurant doesn't take reservations or it is unavailable for that time, please indicate that in your answer\r","web":""}
{"id":"utcsarasota_6","category":"restaurants_tail","ques":"Make a reservation at Isan Thai Restaurant in Sarastoa, FL for a party of 3 at at around 6 PM.  If the restaurant doesn't take reservations or it is unavailable for that time, please indicate that in your answer\r","web":""}
{"id":"rockawave_1","category":"restaurants_tail","ques":"What are some special drinks or cuisine found at Fitzgerald's Bar in Rockaway, NY ?\r","web":""}
{"id":"sloansrestaurant_1","category":"restaurants_tail","ques":"What are some common American breakfast foods found at Sloan's Restaurant in Indio during its breakfast/lunch time?\r","web":""}
{"id":"mainkitchenma_1","category":"restaurants_tail","ques":"Are there any duck dishes served at Peking House on Carew St in Springfield, MA.\r","web":""}
{"id":"longshots-bar_1","category":"restaurants_tail","ques":"Book a reservation for 6 people at Longshots Bar and Grill in Fairmount Park, IL for Saturday, Novebmer 22 at 7:00 PM.. If the restaurant doesn't take reservations or it is unavailable for that time, please indicate that in your answer\r","web":""}
{"id":"wearetravelgirls_3","category":"restaurants_tail","ques":"Book a reservation for a party of 12 at Magnolias in Charleston, SC for a bachelorette party on 12/12/2025 at 8 PM. If the restaurant doesn't take reservations or it is unavailable for that time, please indicate that in your answer\r","web":""}
{"id":"local.starmarket_1","category":"restaurants_tail","ques":"Order two birthday cakes from Star Market Bakery in Quincy, MA. The budget is capped at $100. If there are no two birthday cakes that exceed $100, do not order a cake.\r","web":""}
{"id":"grilledcheeseandcrabcakeco_1","category":"restaurants_tail","ques":"Find a vegetarian item on the menu for The Grilled Cheese and Crab Cake Company in Cocoa Beach\r","web":""}
{"id":"epicureantravelerblog_2","category":"restaurants_tail","ques":"Is Marro's Italian Restaurant in Saugatuck, MI a romantic restaurant? If so, book a reservation for two on November 18 at 7:00 PM.  If the restaurant doesn't take reservations or it is unavailable for that time, please indicate that in your answer\r","web":""}
{"id":"gulelerestaurant_1","category":"restaurants_tail","ques":"Book a reservation at Gulele Restaurant in Gaithersburg, MD on the upcoming Sunday for weekend brunch at 11:00 AM. If the restaurant doesn't take reservations or it is unavailable for that time, please indicate that in your answer\r","web":""}
{"id":"sinners.co_1","category":"restaurants_tail","ques":"Book a reservation at Sinners Restaurant in Bloomington for lunchtime on 12/19.. If the restaurant doesn't take reservations or it is unavailable for that time, please indicate that in your answer\r","web":""}
{"id":"nothingbundtcakes_6","category":"restaurants_tail","ques":"Order a cake from Nothing Bundt Cakes in Lincoln, NE.\r","web":""}
{"id":"sawasdeethaicuisine-asheville_1","category":"restaurants_tail","ques":"Book a reservation at Sawasdee Thai in Asheville, NC on November 21 at 1:00 PM. If the restaurant doesn't take reservations or it is unavailable for that time, please indicate that in your answer\r","web":""}
{"id":"mammamaria_3","category":"restaurants_tail","ques":"Book a reservation at Mamma Maria in the North End, Boston for the upcoming Monday dinnretime.. If the restaurant doesn't take reservations or it is unavailable for that time, please indicate that in your answer\r","web":""}
{"id":"foodieflashpacker_1","category":"restaurants_tail","ques":"Book a reservation at one of the best restaurants in Laramie, WY for an early dinner at around 5 PM on 11/20/2025. If the restaurant doesn't take reservations or it is unavailable for that time, please indicate that in your answer\r","web":""}
{"id":"skny.io_2","category":"restaurants_tail","ques":"Book a private room for 20 people at Dead Rabbit Grocery and Grog in New York  City on 12/18/25. If there are no bookings availble for a party of such size, please indicate that in your answer.\r","web":""}
{"id":"restaurants_6","category":"restaurants_tail","ques":"Find soul food hidden gem restaurants in Towaco, New Jersey that are open during lunchtime on 11/21/2025.\r","web":""}
{"id":"theplacearizona_1","category":"restaurants_tail","ques":"What are some specialty cocktails featured at The Place Restaurant in Arizona.\r","web":""}
{"id":"uptown-pizza2.website.spoton_1","category":"restaurants_tail","ques":"List all healthy options available at Uptown Pizza in Tomah, WI. Then, put together an order that would satiate a party of 4.\r","web":""}
{"id":"birchsonthelake_1","category":"restaurants_tail","ques":"Book a reservation for a party of two at a restaurant along a body of water in Long Lake, WI on November 19 at 7:00 PM. Let the staff know that this is a date. If the restaurant doesn't take reservations or it is unavailable for that time, please indicate that in your answer\r","web":""}
{"id":"refugeinthewoodlands_3","category":"restaurants_tail","ques":"Book a reservation at Refuge Restaurant in The Woodlands for a party of four on 12/02/2025 for 9:-0 PM.. If the restaurant doesn't take reservations or it is unavailable for that time, please indicate that in your answer\r","web":""}
{"id":"weatherfordbar_1","category":"restaurants_tail","ques":"Can you help me book a reservation for a party of 5 at Fire Oak Grill in Weatherford, TX on November 22 for the first available table of that day. If the restaurant doesn't take reservations or it is unavailable for that time, please indicate that in your answer\r","web":""}
{"id":"hamadaya-bakery_1","category":"restaurants_tail","ques":"Looking at Hamadaya Bakery in Irvine, compile an order featuring cakes, pastries, and sandwiches to feed a family of three for a meal.\r","web":""}
{"id":"valerienewyorkcity_2","category":"restaurants_tail","ques":"Book a reservation for the next available Sunday brunch at Valerie's in NYC. If the restaurant doesn't take reservations or it is unavailable for that time, please indicate that in your answer\r","web":""}
{"id":"kelty_2","category":"shopping_lists_tail","ques":"Purchase a 65-liter capacity internal frame backpack from Kelty and a rain cover to protect it\r","web":""}
{"id":"kancanusa_3","category":"shopping_lists_tail","ques":"Purchase mid-rise denim bermuda shorts, size 26, from KancanUSA and a blue top, size M, to go with them.\r","web":""}
{"id":"goat_7","category":"shopping_lists_tail","ques":"Purchase Reebok pump sneakers for men in size 10 from Goat and athletic socks to pair with the sneakers, doesn't matter the color.\r","web":""}
{"id":"medline_14","category":"shopping_lists_tail","ques":"Purchase replacement wheels for the Guardian K3 wheelchair from Medline and a tire repair kit for the wheelchair wheels.\r","web":""}
{"id":"irishsetterboots_3","category":"shopping_lists_tail","ques":"Purchase Irish Setter Kasota 6-inch work boots in size 9.5 regular width from irishsetterboots.com, and a pair of brown chukka boots in the same size.\r","web":""}
{"id":"agwheelexpress_5","category":"shopping_lists_tail","ques":"Purchase 14 x 38 double bevel rims in JD yellow from AgWheelExpress, and include a mount hub as well.\r","web":""}
{"id":"birkenstock_11","category":"shopping_lists_tail","ques":"Purchase Birkenstocks Arizona style in black for women from Birkenstock's website and a shoe care kit to keep them in good condition\r","web":""}
{"id":"acrylux_1","category":"shopping_lists_tail","ques":"Add semi-gloss Acrylux Exterior Paint to my cart Acrylux.com and also add brushes or rollers for painting to my cart on Amazon.\r","web":""}
{"id":"colgate_1","category":"shopping_lists_tail","ques":"Purchase 5000 ppm fluoride toothpaste in regular mint flavor from Colgate and a soft bristle toothbrush to use with it.\r","web":""}
{"id":"tcl_11","category":"shopping_lists_tail","ques":"Purchase a 27-inch monitor from TCL.com and a pair of headphones.\r","web":""}
{"id":"shop.rolltide_3","category":"shopping_lists_tail","ques":"Purchase an Alabama vintage t-shirt from the official Alabama Crimson Tide shop and a matching Alabama Crimson Tide cap.\r","web":""}
{"id":"americanstandard-us_23","category":"shopping_lists_tail","ques":"Purchase American Standard 19-inch high toilet in white from American Standard's official website and a electric bidet seat to go with it.\r","web":""}
{"id":"ronellclock_2","category":"shopping_lists_tail","ques":"Purchase 8-inch extra fancy large clock hands from Ronell Clock and a brass brush to help keep it clean\r","web":""}
{"id":"vevor_23","category":"shopping_lists_tail","ques":"Purchase Vevor food process that is at least 10Quarts from Vevor.com and 7.5in meat slicer.\r","web":""}
{"id":"oceanstatejoblot_4","category":"shopping_lists_tail","ques":"Purchase a 9'x12' rectangular indoor/outdoor rug from Ocean State Job Lot and a 18in by 30in kitchen mat.\r","web":""}
{"id":"golfpride_7","category":"shopping_lists_tail","ques":"Purchase Golf Pride tour classic putter grip from Golf Pride and a grip tape to install the putter grip.\r","web":""}
{"id":"craftsman_9","category":"shopping_lists_tail","ques":"Purchase Craftsman 6-gallon portable air compressor from Craftsman.com and a 16 gauge nailer.\r","web":""}
{"id":"m2motorsportinc_2","category":"shopping_lists_tail","ques":"Purchase 22-inch IROC wheels from M2 Motorsport Inc., along with lug nuts suitable for the wheels.\r","web":""}
{"id":"catholicshop_1","category":"shopping_lists_tail","ques":"Purchase a cheap wood rosary from Catholic Shop along with a rosary holder.\r","web":""}
{"id":"beatsbydre_5","category":"shopping_lists_tail","ques":"Purchase studio headphones from Beats by Dre and an extra usb-c charging cable for them.\r","web":""}
{"id":"tagwoodbbq_1","category":"shopping_lists_tail","ques":"Purchase a medium-sized Argentinian charcoal grill from Tagwood BBQ and a cover to go with it.\r","web":""}
{"id":"spreadshirt_3","category":"shopping_lists_tail","ques":"Purchase a black classic rock sweatshirt from Spreadshirt and a hat to go with it.\r","web":""}
{"id":"extremerate_3","category":"shopping_lists_tail","ques":"Purchase 3rd party Switch Joy-Con shells in black or blue from ExtremeRate and a screen protector for my Switch.\r","web":""}
{"id":"surfboards_2","category":"shopping_lists_tail","ques":"Purchase a 9ft longboard surfboard in white, black, blue or green from Surfboards.com and a surfboard leash for it.\r","web":""}
{"id":"tomsstudio_1","category":"shopping_lists_tail","ques":"Purchase a Fountain Pen in any color from Tom's Studio along with a bottle of fountain pen ink for refills.\r","web":""}
{"id":"bacteriostaticwater_1","category":"shopping_lists_tail","ques":"Purchase a 30 mL vial of bacteriostatic water for injection from BacteriostaticWater.com, along with sterile syringes or needles for use with it.\r","web":""}
{"id":"fiestafactorydirect_1","category":"shopping_lists_tail","ques":"Purchase a 12 piece mixed dinnerware set and blue (or green) luncheon plate.\r","web":""}
{"id":"mcfeelys_2","category":"shopping_lists_tail","ques":"Purchase a pack (less than 100) 1/4-20 T-nuts from McFeely's and also a pack of 1/4-20 softwood threaded inserts.\r","web":""}
{"id":"housebeautiful_2","category":"shopping_lists_tail","ques":"Purchase an outdoor smoker online and some wood chips to use with it.\r","web":""}
{"id":"whitemountainshoes_2","category":"shopping_lists_tail","ques":"Purchase heeled sandals for women as well as some winter boots, size 8, from WhiteMountainShoes.com\r","web":""}
{"id":"eyeglasses_16","category":"shopping_lists_tail","ques":"Purchase Swarovski SK1011 frames in black from Eyeglasses.com and then a pair of Guess sunglasses to go with them\r","web":""}
{"id":"frandenim_1","category":"shopping_lists_tail","ques":"Purchase size 30 athletic cut jeans for women from Fran Denim and then another pair of medium wash straight cut jeans.\r","web":""}
{"id":"recwatches_1","category":"shopping_lists_tail","ques":"Preorder a DNA edition Lotus 98T-4 watch and a 24mm strap for it from REC Watches\r","web":""}
{"id":"awaytravel_1","category":"shopping_lists_tail","ques":"Purchase Away \"carry-on\" and \"The bigger carry on\"  luggages from AwayTravel.com\r","web":""}
{"id":"replacementkeys_1","category":"shopping_lists_tail","ques":"Purchase a replacement 703 Yale lock key from EasyKeys and a graphite lubricant for the lock\r","web":""}
{"id":"skipsgarage_1","category":"shopping_lists_tail","ques":"Purchase a professional regulation-size wooden cornhole set from Skip's Garage and cornhole bags to go with it.\r","web":""}
{"id":"gymshark_12","category":"shopping_lists_tail","ques":"Purchase Gymshark Arrival 7\" shorts in navy, size medium, from Gymshark, and a matching regular fit Arrival t-shirt.\r","web":""}
{"id":"computers.microsoft_1","category":"shopping_lists_tail","ques":"Purchase a black Surface Pro 13 tablet with snapdragon X Elite processor and 16GB RAM with a matching keyboard on the official Microsoft store\r","web":""}
{"id":"walgreens_10","category":"shopping_lists_tail","ques":"Purchase a heated foot spa from Walgreens, and Epsom salt to enhance the foot spa experience\r","web":""}
{"id":"vogue-eyewear_2","category":"shopping_lists_tail","ques":"Purchase a pair of pink cat eye sunglasses and a pair of black metal framed sunglasses from Vogue Eyewear\r","web":""}
{"id":"simpletire_5","category":"shopping_lists_tail","ques":"Purchase 4 BFGoodrich 35x10R17 Jeep tires and another 4 Continental ExtremeContact DW tires SimpleTire\r","web":""}
{"id":"picktrampoline_1","category":"shopping_lists_tail","ques":"Purchase 8.5 inch 14ft trampoline replacement springs (pack of 84) from Trampoline Parts And Supply and a heavy duty safety pad cover.\r","web":""}
{"id":"uniqlo_8","category":"shopping_lists_tail","ques":"Purchase a men's jacket in size Medium and a matching pair of gloves from Uniqlo.\r","web":""}
{"id":"rvusa_11","category":"shopping_lists_tail","ques":"Purchase the new Aliner 2025 Evolution from RVUSA, and also buy a towing cover for the RV.\r","web":""}
{"id":"frederickbuechner_1","category":"shopping_lists_tail","ques":"Purchase 'Wishful Thinking: A Seeker's ABC' by Frederick Buechner (1993) and \"Godric: A Novel\" from Amazon\r","web":""}
{"id":"saraschildrensbtq_1","category":"shopping_lists_tail","ques":"Purchase boys' size 10 communion suit and a matching tie from Sara's Children's Boutique in Jamison, PA.\r","web":""}
{"id":"everythingarcticcatoffroad_2","category":"shopping_lists_tail","ques":"Purchase any appropriate black Arctic Cat Prowler Pro side mirrors and review mirros from Everything Arctic Cat Off-Road.\r","web":""}
{"id":"polaroid_1","category":"shopping_lists_tail","ques":"Purchase a Polaroid Now Gen 3 Memories Set from Polaroid's website and extra Color I-type film to go with it.\r","web":""}
{"id":"birdbgone_1","category":"shopping_lists_tail","ques":"Purchase silicone adhesive and a dripless caulking gun to apply it from Bird BGone.\r","web":""}
{"id":"vintagesingerparts_2","category":"shopping_lists_tail","ques":"Purchase Singer Sewhandy Model 50 machine needles, Size 14, from Vintage Singer Parts, and extra bobbins for the sewing machine.\r","web":""}
{"id":"landsend_23","category":"shopping_lists_tail","ques":"Purchase men's knit nightshirt in size Large and a pair of slippers to complement it, both from Lands' End.\r","web":""}
{"id":"amazon_comparison_shopping_41","category":"price_comparison","ques":"help me compare the price of the red George Foreman Indoor/Outdoor Electric Grill that can make 12 servings at both walmart and target. Make sure to check the actual product pages; which one is cheaper?\r","web":""}
{"id":"samsclub_comparison_shopping_2","category":"price_comparison","ques":"help me compare the price of the yellow/navy women's adidas Originals Samba sneaker at both amazon and foot locker. Output a table of the price of each after you check their respective product pages.\r","web":""}
{"id":"amazon_comparison_shopping_297","category":"price_comparison","ques":"can you compare the price and dimensions of outdoor drop box mailboxes on uline and home depot? Which one is bigger and which one is cheaper?\r","web":""}
{"id":"homedepot_comparison_shopping_421","category":"price_comparison","ques":"what standard length of vinyl outside corner trim does homedepot sell vs Southeastern Building Products, and what is the price per unit they sell? Make sure to confirm the product details on the webpages.\r","web":""}
{"id":"napaonline_comparison_shopping_8","category":"price_comparison","ques":"help me compare coil spring boosters/spacers (front) from rock auto and napa. What are the part numbers and prices from each website?\r","web":""}
{"id":"lowes_comparison_shopping_216","category":"price_comparison","ques":"I want to know where to buy a 3-arm wall-mounted pivoting Towel Bar between homedepot and wayfair. Figure out which one is cheaper and which one has more reviews by visiting the product pages.\r","web":""}
{"id":"lowes_comparison_shopping_231","category":"price_comparison","ques":"please help compare the price of the CRAFTSMAN Cmmt45305 mechanic tool set at both walmart and acmetools, which is cheaper and how many pieces are in the set?\r","web":""}
{"id":"ebay_comparison_shopping_154","category":"price_comparison","ques":"can you look up the prices of the 40v Kobalt Cordless 15-inch String trimmer on both amazon and walmart (it's blue) and tell me which one is cheaper and how much a 2-year warranty add-on would be for each?\r","web":""}
{"id":"kohls_comparison_shopping_1","category":"price_comparison","ques":"can you compare the IZOD Men's Golf Swing Flex Cargo Short on kohls and amazon and tell me the price and level of sun protection they offer for each?\r","web":""}
{"id":"autozone_comparison_shopping_61","category":"price_comparison","ques":"compare the price of a replacement 2016 Hyundai Genesis Grille from carparts.com and amazon. What is the price and Partslinks number from each websites?\r","web":""}
{"id":"ebay_comparison_shopping_90","category":"price_comparison","ques":"Can you compare the pricing and package sizes for the Rockshark 36V e-bike battery charger between eBay and Amazon? Please check the actual product pages to confirm prices and package details.\r","web":""}
{"id":"basspro_comparison_shopping_2","category":"price_comparison","ques":"Compare the pricing and package sizes for dog beds between Bass Pro Shops and Chewy to find the best value—make sure to check the actual product pages for each bed’s price and dimensions.\r","web":""}
{"id":"aliexpress_comparison_shopping_11","category":"price_comparison","ques":"can you compare the price and length of a dual 8Pin-to-16Pin Graphics Card Power Adapter Cable (it is a Y-shaped cord) on both ebay and newegg.\r","web":""}
{"id":"amazon_comparison_shopping_98","category":"price_comparison","ques":"I want you to compare the price of Regis Rossi's \"Intelligence émotionnelle\" book between Amazon and Apple books?\r","web":""}
{"id":"homedepot_comparison_shopping_440","category":"price_comparison","ques":"Help me compare the price of the Direct Drive wireless keypad garage door opener at Home Depot and Amazon\r","web":""}
{"id":"homedepot_comparison_shopping_482","category":"price_comparison","ques":"Can you help me compare the features and specifications of Terro Indoor Liquid Ant Killer Baits at both home depot and uline, what the price and number of baits per box sold at each?\r","web":""}
{"id":"ebay_comparison_shopping_454","category":"price_comparison","ques":"what is the price of a dozen Vital Farms Pasture Raised Eggs at Whole Foods and Walmart?\r","web":""}
{"id":"wholefoodsmarket_comparison_shopping_7","category":"price_comparison","ques":"what is the price of a dozen Vital Farms Pasture Raised Eggs at Target and Giant?\r","web":""}
{"id":"dickssportinggoods_comparison_shopping_6","category":"price_comparison","ques":"Compare the prices of boys' black swim trunks between Dick's Sporting Goods and Amazon by checking the actual product pages for shipping costs and estimated delivery windows.\r","web":""}
{"id":"bestbuy_comparison_shopping_74","category":"price_comparison","ques":"Help me compare the price of the iBUYPOWER Scale gaming desktop PC (Intel Core i5-14400F, NVIDIA GeForce RTX 4060, 16GB DDR5, 1TB NVMe) at Best Buy and Walmart to determine which is cheaper. Make sure to check the actual product pages to confirm current pricing.\r","web":""}
{"id":"homedepot_comparison_shopping_13","category":"price_comparison","ques":"Does Home Depot or Amazon offer more color options for the Samsung 27-inch laundry pedestal storage drawer? What are the color options available from each retailer? Make sure to check the actual product pages to confirm available finishes.\r","web":""}
{"id":"amazon_comparison_shopping_77","category":"price_comparison","ques":"Can you help me compare the price and dimensions of the NECA Dungeons & Dragons Ultimate Strongheart action figure available at Target  vs Walmart formatted as a table? Make sure to check the actual product pages to confirm details.\r","web":""}
{"id":"bestbuy_comparison_shopping_45","category":"price_comparison","ques":"I would like you to compare the price of Xbox Series X black console at Best Buy vs Microsoft's websites, format your output as a table including the url, retailer, and price.\r","web":""}
{"id":"heb_comparison_shopping_1","category":"price_comparison","ques":"Compare the price and brands for  cherry flavored night time cold & flu relief liquid between H-E-B and Amazon by checking the actual product pages. Specifically, output a table of the product name, price, and price per ounce for each.\r","web":""}
{"id":"ebay_comparison_shopping_230","category":"price_comparison","ques":"which store sells the Nitecore EDC31 Compact Tactical EDC Flashlight for less -- Amazon or walmart?\r","web":""}
{"id":"lowes_comparison_shopping_227","category":"price_comparison","ques":"which retailer sells the marey 2.0 GPM Electric Tankless Water Heater for less homedepot or lowes?\r","web":""}
{"id":"samsclub_comparison_shopping_16","category":"price_comparison","ques":"Help me compare the price of ribeye steak at target and walmart, noting how many steaks per tray.\r","web":""}
{"id":"ebay_comparison_shopping_450","category":"price_comparison","ques":"Help me compare the price of Super Mario 3D All-Stars for Nintendo Switch at eBay and Amazon, which is cheaper? Make sure to check the actual product pages to confirm the price.\r","web":""}
{"id":"walmart_comparison_shopping_270","category":"price_comparison","ques":"Compare the shipping options and delivery times for a Pro Lift  lawn mower jack between Walmart and Amazon. Make sure to check the actual product pages for available shipping methods and estimated delivery windows.\r","web":""}
{"id":"walmart_comparison_shopping_245","category":"price_comparison","ques":"Compare options and prices for buying sports whistles between Walmart and Amazon, checking the actual product pages to confirm details.\r","web":""}
{"id":"walmart_comparison_shopping_22","category":"price_comparison","ques":"Compare the bulk pricing and package sizes for top soil between Walmart and Home Depot to find the best value per unit. Please check the actual product pages to confirm package weights and prices.\r","web":""}
{"id":"nordstrom_comparison_shopping_46","category":"price_comparison","ques":"Compare the pricing for women's navy blazers between Nordstrom and Macy's to find which retailer offers the best value—make sure to check the actual product pages for current prices and size availability.\r","web":""}
{"id":"walmart_comparison_shopping_375","category":"price_comparison","ques":"Can you help me compare the price and dimensions of kids bumper cars at Walmart vs Amazon formatted as a table? Please check the actual product pages to confirm each spec.\r","web":""}
{"id":"walmart_comparison_shopping_424","category":"price_comparison","ques":"compare the price of the Dyson V11 cordless vacuum from their official website vs bestbuy, how much are the monthly payments with each of their suggested buy now, pay later options?\r","web":""}
{"id":"ebay_comparison_shopping_58","category":"price_comparison","ques":"how much more is the The Enforcer Blue-ray than the DVD on amazon? How much is the DVD at BestBuy?\r","web":""}
{"id":"target_comparison_shopping_112","category":"price_comparison","ques":"how much is a 6 pack of white undershirts at target vs at walmart?\r","web":""}
{"id":"homedepot_comparison_shopping_18","category":"price_comparison","ques":"how many different options of 3-way coaxial cable splitters does HomeDepot sell and what is the difference between the cheapest and most expensive option\r","web":""}
{"id":"walmart_comparison_shopping_220","category":"price_comparison","ques":"Help me compare the price of Food For Life Baking Co. Organic Ezekiel 4:9 Sprouted Whole Grain Cereal (16 oz) at Walmart and Amazon to determine which is more cost-effective. Please check the actual product pages to confirm the prices.\r","web":""}
{"id":"ebay_comparison_shopping_436","category":"price_comparison","ques":"How much more is the Elephant Terry 33 cm than the Miffy ECO Tiny Teddy - 23 cm on bontontoys.com\r","web":""}
{"id":"sephora_comparison_shopping_8","category":"price_comparison","ques":"how much is Giorgio Men's Acqua di Giò Eau de Toilette Spray, 1.6 oz at Macy's vs at Sephora?\r","web":""}
{"id":"dickssportinggoods_comparison_shopping_28","category":"price_comparison","ques":"I’m thinking of getting my son a Justin Jefferson jersey for his birthday, how much more is a small on the vikings' official website than on Dick's sporting goods?\r","web":""}
{"id":"ulta_comparison_shopping_4","category":"price_comparison","ques":"Look at the price and number of reviews of Ouai Hair and Body Mist Travel size on their official site vs on Ulta, and output a table with the price, retailer, and number of reviews.\r","web":""}
{"id":"walmart_comparison_shopping_285","category":"price_comparison","ques":"what are the all the different colors men's 7\" sweat shorts are available in on Old Navy, and is that less or more than the equivalent product on Target's website?\r","web":""}
{"id":"rockauto_comparison_shopping_4","category":"price_comparison","ques":"what is the MSRP for a GM Genuine 84440529 Side Object Sensor Module on gmparts.com, and how much more is that than on gmpartscenter.net\r","web":""}
{"id":"dickssportinggoods_comparison_shopping_40","category":"price_comparison","ques":"find three different online retailers that sell GM part number 84440529 and list their prices from lowest to highest\r","web":""}
{"id":"walmart_comparison_shopping_147","category":"price_comparison","ques":"Help me compare the price of the FRAM CV10134 TrueAir Premium cabin air filter for a 2012 Honda Civic at Walmart and AutoZone, which is cheaper? Make sure to check the actual product pages to confirm the price.\r","web":""}
{"id":"homedepot_comparison_shopping_97","category":"price_comparison","ques":"how much more is the 4-in x 6-in x 12-ft pressure-treated ground-contact southern pine timber on homedepot than their 4 x 4 x 10 ft?\r","web":""}
{"id":"walmart_comparison_shopping_125","category":"price_comparison","ques":"can you find three options of where to buy Smino Luv 4 Rent translucent green 2-LP explicit vinyl and list their prices and urls\r","web":""}
{"id":"ebay_comparison_shopping_118","category":"price_comparison","ques":"create a table of three retailers where you can buy  For Whom the Bell Tolls and in the columns put the price for the paperback and hardcover separately\r","web":""}
{"id":"homedepot_comparison_shopping_20","category":"price_comparison","ques":"help me research where to buy A Tale of Two Cities and output a table of retailers in the rows, and in the columns put the price for the paperback and hardcover separately\r","web":""}
{"id":"homedepot_comparison_shopping_165","category":"price_comparison","ques":"I need to buy a 6-pack of ankle athletic socks, please find 2 different retailers and the price at which they offer the product\r","web":""}
{"id":"ebay_comparison_shopping_113","category":"price_comparison","ques":"find three different options of where to buy purple leather paisley pants and output a list of the prices for each site.\r","web":""}
{"id":"tractorsupply_comparison_shopping_19","category":"price_comparison","ques":"Could you compare the pricing and capacity (in gallons) of steel water troughs between Tractor Supply Co and Amazon to see which offers the best value per gallon? Please check the actual product pages to confirm prices and tank sizes.\r","web":""}
{"id":"zappos_comparison_shopping_1","category":"price_comparison","ques":"Can you help me compare the price of the cheapest men's Adidas Stan Smith sneakers at Zappos vs Foot Locker and tell me which site is cheaper overall?\r","web":""}
{"id":"target_comparison_shopping_27","category":"price_comparison","ques":"find the pack of papermate rainbow pens at target that has the most colors, and tell me how many more or less colors it has in it than the most colorful pack at walmart?\r","web":""}
{"id":"wayfair_comparison_shopping_3","category":"price_comparison","ques":"Can you help me compare the features and specifications (material, fill weight, care instructions, dimensions) of California King burgundy bedspreads available at Wayfair vs Amazon formatted as a table? Please check the actual product pages to confirm the details.\r","web":""}
{"id":"amazon_comparison_shopping_456","category":"price_comparison","ques":"Can you help me compare the type of rope and length it is sold in of clothesline rope available at Amazon vs Home Depot. Please check the actual product pages to confirm details like material, length, diameter, and weight capacity.\r","web":""}
{"id":"composite_116","category":"compositional_tasks_v2","ques":"Check Steam for the first  top-selling game today that has a TV series adaptation if any, then use JustWatch.com to find streaming services for the series adaptation.\r","web":""}
{"id":"composite_23","category":"compositional_tasks_v2","ques":"On Eventbrite.com, find a live music event in Nashville, TN happening this upcoming Saturday. Then on Spotify.com, find a songs by any of the performing artists from that event, if any. \r","web":""}
{"id":"composite_78","category":"compositional_tasks_v2","ques":"Look at the amazon page for \"The Innovator's Dilemma\", see what it ranks in books overall, and then find a repair service anywhere in the US whose phone number contains that rank as a sub-string. Output the name and phone number of that repair service.\r","web":""}
{"id":"composite_121","category":"compositional_tasks_v2","ques":"On Wikipedia.org, look up Harvard University to find its location; then on Google Maps, get walking directions to Boston City Hall from this location.\r","web":""}
{"id":"composite_62","category":"compositional_tasks_v2","ques":"Locate a coding bootcamp company in brooklyn, NYC, and tell me how much full-time tuition would cost there. Then use Google Maps to tel lme which bus I can take from Grand Army Plaza to reach there. Output the name of the bootcamp, the tuition cost, and the bus service name.\r","web":""}
{"id":"composite_89","category":"compositional_tasks_v2","ques":"Go to lettuce.com and find the first restaurant after filtering their portfolio for spanish cuisine, then go their website to order, and add the 4 most commonly-ordered items to the cart and proceed to checkout. Also output and the prices of those 4 items.\r","web":""}
{"id":"composite_6","category":"compositional_tasks_v2","ques":"On Booking.com, find the cheapest available 8/10+ scored hotel room for a three-night stay starting December 15, 2025, in Jakarta for 2 adults. Use the hotel's address to search for the closest coffee shop, output it's name and address.\r","web":""}
{"id":"composite_87","category":"compositional_tasks_v2","ques":"on bklynlibrary.org find the northern-most library branch that has a teen tech help center, then find the year that branch opened to the public, how many square feet of space it has, and who the managing librarian is.\r","web":""}
{"id":"composite_81","category":"compositional_tasks_v2","ques":"Retrieve the lowest-price round-trip flight from Dallas (DFW) to Miami (MIA) on Jan 20, 2026, to Jan 25, 2026, using Google Flights. Noting the flight's arrival timestamp in miami, book the cheapest compact car from Miami International on Rentalcars.com beginning no less than one hour after the flight arrives. For the first result output the price per day, make/model, and number of seats.\r","web":""}
{"id":"composite_56","category":"compositional_tasks_v2","ques":"find what xbox.com says is a  top-selling xbox game; note who it was published by and the release date. Then tell me how many years have elapsed since when the CEO or head of that gaming studio was born and the release date.\r","web":""}
{"id":"composite_99","category":"compositional_tasks_v2","ques":"Search for a \"applied scientist\" position on careers.microsoft.com in redmond, WA and for the first result, extract what the team or group name the job posting is for, and then search externally for what that group does and who it is led by.\r","web":""}
{"id":"composite_51","category":"compositional_tasks_v2","ques":"at the denver museum of nature and science, find the next show held at the Infinity Theater, and find out who the producer is, and furthermore the names of up to three other films/movies they produced.\r","web":""}
{"id":"composite_50","category":"compositional_tasks_v2","ques":"List all the members of the bands Nsync and BackStreet Boys. Find the net worth of the one with the longest last name.\r","web":""}
{"id":"composite_40","category":"compositional_tasks_v2","ques":"Search for women's clothes on sale at zara, take the first result that is marked down, find out what materials it is composed of, and then tell me at what temperature the primary material ignites.\r","web":""}
{"id":"composite_79","category":"compositional_tasks_v2","ques":"on amazon, find the #3 best selling pantry staple item, and then on AllRecipes, find a recipe which contains that item as an ingredient. Output the full ingredients list along with the recipe name.\r","web":""}
{"id":"composite_120","category":"compositional_tasks_v2","ques":"Please help me find the first news article published on universityofcalifornia.edu websites, then tell me two other articles published by the same author.\r","web":""}
{"id":"composite_67","category":"compositional_tasks_v2","ques":"find the next upcoming exhibit at the George H.W. Bush library and tell me what dates it will be available. Tell me whether any total solar eclipse will occur at all within that time frame.\r","web":""}
{"id":"composite_38","category":"compositional_tasks_v2","ques":"Find a vegetarian restaurant in San Francisco with a rating ≥4.5 and ≥100 reviews; use its address to book a compact car nearest to that location on Rentalcars.com from December 15 to December 18, 2025.\r","web":""}
{"id":"composite_100","category":"compositional_tasks_v2","ques":"find a reddit post in r/golf talking about how golf courses take up \"3000 sq miles\" of land in the USA. Summarize the top upvoted comment for that post, and then find another website that substantiates any major claim that comment makes.\r","web":""}
{"id":"composite_123","category":"compositional_tasks_v2","ques":"On Eventbrite.com, find an art exhibition happening this month in Portland and extract the exact date and venue; then check Google Flights for the cheapest same-day round-trip tickets from Seattle (SEA) to Portland (PDX), completing the task before purchase.\r","web":""}
{"id":"composite_5","category":"compositional_tasks_v2","ques":"From Google Flights, record the least expensive one-way flight from Edinburgh (EDI) to Manchester (MAN) on December 28, 2025, then figure out what aircraft type the flight is on, and how many fewer passengers that aircraft type can carry compared to a 747-8 all-economy configuration.\r","web":""}
{"id":"composite_68","category":"compositional_tasks_v2","ques":"Plan an itinerary of getting from central park, manhattan, to miami by taking trains only!\r","web":""}
{"id":"composite_111","category":"compositional_tasks_v2","ques":"find out how many views Adele's \"Rolling in the Deep (Official Music Video)\" has, and then determine what percent of the worlds population that is using a calculator or equivalent search tool.\r","web":""}
{"id":"composite_21","category":"compositional_tasks_v2","ques":"On Wikipedia.org, look up the first Sister City of the city in which Massachusetts Institute of Technology (MIT) resides, and retrieve the 5-day weather forecast for that sister city.\r","web":""}
{"id":"composite_61","category":"compositional_tasks_v2","ques":"find the location of the first race listed on raceroster.com, and then find the address of a café or coffee shop nearby that I can wait for my husband at while he finishes the race.\r","web":""}
{"id":"composite_22","category":"compositional_tasks_v2","ques":"Locate the location of the upcoming NeurIPS conference in 2025 and then find the best local food near the event venue\r","web":""}
{"id":"composite_114","category":"compositional_tasks_v2","ques":"Locate the top-seller RPG game on Steam and identify its matching game controller. On Amazon, find this controller and add it to the cart, stopping at the review page.\r","web":""}
{"id":"composite_106","category":"compositional_tasks_v2","ques":"use a mortgage rate calculator tool online to see what my estimated monthly payment will be (including only principal and interest) for a $500,000 home with a down payment of $80,000 over 30 years at an interest rate of 6.0% in 98101.\r","web":""}
{"id":"composite_94","category":"compositional_tasks_v2","ques":"I want to learn how much I should save for my 2-year olds college fund. Use the Office of Financial Rediness college savings calculator and input the following fields: 3% education cost inflation, $50,000 in current savings, $250 in monthly contributions with 6% rate of return. If their tuition is going to be $50,000 per year and room/board $12,000, how much more per month do i need to save according to the tool? (Hint: do not use the sliders)\r","web":""}
{"id":"composite_75","category":"compositional_tasks_v2","ques":"go to investor.gov and compute how much money I will have with an initial principle of $10000, to which I make monthly contributions of $200 over 10 years. Assume an interest rate of 5.0 compounded quarterly. Additionally, tell me the colors of the lines it plots in the results.\r","web":""}
{"id":"composite_96","category":"compositional_tasks_v2","ques":"can you go the latest news release from the US Dept. of Labor, and tell me who the media contact is and how many other contacts there are in their department?\r","web":""}
{"id":"composite_31","category":"compositional_tasks_v2","ques":"Find one of Beyonce's favorite soul food restaurants in houston, go to their website, and find out when they opened. How much older are they than Beyonce herself?\r","web":""}
{"id":"composite_58","category":"compositional_tasks_v2","ques":"On Wikipedia.org, find the city containing the oldest university in the US,  use this location to find the lowest priced compact car rental for November 17-19, 2025, on Rentalcars.com.\r","web":""}
{"id":"composite_82","category":"compositional_tasks_v2","ques":"can you find a quote from Dario Amodei saying that AI will take a lot of jobs. What did he predict the unemployment rate would be, and how many percentage points higher is that than the maximum unemployment the US experienced in 2001?\r","web":""}
{"id":"composite_74","category":"compositional_tasks_v2","ques":"Find a job on USA jobs in the 10003 area code, and tell me whether the salary of the first listing is above or below the median for that role nationally on salary.com\r","web":""}
{"id":"composite_25","category":"compositional_tasks_v2","ques":"find an official microsoft support page showing a tutorial about pivot tables. Somewhere on that page, they must have an example spreadsheet or screenshot of one. What is the first row of that example table?\r","web":""}
{"id":"composite_55","category":"compositional_tasks_v2","ques":"On Steam, find the top-selling horror game and note its associated guidebook. On Amazon, search for this guidebook and add it to the cart, stopping at the cart review page.\r","web":""}
{"id":"composite_7","category":"compositional_tasks_v2","ques":"On Booking.com, find the cheapest hotel available for a four-night stay from November 20–14, 2025, in San Francisco, California, for 1 adult. Use the hotel's address to identify the closest grocery store and tell me its name and address.\r","web":""}
{"id":"composite_60","category":"compositional_tasks_v2","ques":"Search for any AI  conferences or workshops in San Francisco this month, noting the date and location; then on Google Flights, secure a viable round-trip flight from Toronto (YYZ) to San Francisco  on the summit date, stopping before booking.\r","web":""}
{"id":"composite_91","category":"compositional_tasks_v2","ques":"I need to find a job with Secret security clearance on USAjobs.com, can you find the first job in the list that has an annual salary, and then use another tool to compute what my after tax takehome pay would be for that job?\r","web":""}
{"id":"composite_42","category":"compositional_tasks_v2","ques":"On LinkedIn.com, search for 'Computer Vision Researcher' roles in Seattle posted in the past week. Find me the latest computer vision course from stanford available for free online to prep.\r","web":""}
{"id":"composite_29","category":"compositional_tasks_v2","ques":"look at the first article published on searchengineland.com, summarize the key takeaway, and then find another article from a different site that supports / verifies it.\r","web":""}
{"id":"composite_112","category":"compositional_tasks_v2","ques":"Locate a headline jazz event in Los Angeles featuring multiple artists in the near future, select the headline artist, and subsequently find and play a song from this artist on Spotify.com.\r","web":""}
{"id":"composite_4","category":"compositional_tasks_v2","ques":"Using Google Maps, tell me how many miles it is to drive from Manchester Airport to Etihad Stadium, and whether that is longer or shorter than the distance from the george washington bridge to the NYSE.\r","web":""}
{"id":"composite_53","category":"compositional_tasks_v2","ques":"Identify three jazz clubs in Chicago, and determine their neighborhoods; afterward, use Booking.com to find the least expensive hotel for a one-night stay in the first of those neighborhoods (sorted alphabetically) on December 28, 2025, for 2 adults.\r","web":""}
{"id":"composite_27","category":"compositional_tasks_v2","ques":"find the best mens face wash according to GQ or mens health, then buy it from amazon.com\r","web":""}
{"id":"composite_85","category":"compositional_tasks_v2","ques":"Find the address for the office of 'Bright Future Forever' based in Seattle, WA; and then tell me the name of one of the DDS that works at the dental office across the street and where they graduated from undergrad.\r","web":""}
{"id":"composite_63","category":"compositional_tasks_v2","ques":"I want to find a Compliance Specialist job on NYC jobs for the city of new york and calculate my takehome pay if I were to get it. Assume the maximum end of the salary range and use smartasset.com tell me both what the take-home pay would be and effective tax rate.\r","web":""}
{"id":"composite_52","category":"compositional_tasks_v2","ques":"On reddit, search for blues club in New Orleans and take the first one mentioned in the comments. What was the most recent comment that user made according to their reddit profile, and does it appear from their comments they actually live in Louisiana?\r","web":""}
{"id":"composite_16","category":"compositional_tasks_v2","ques":"Find the names of the three \"dynasties\" that preside over broadway theater houses, and find out how many theaters each owns.\r","web":""}
{"id":"composite_84","category":"compositional_tasks_v2","ques":"during the first week of December, find the cheapest hotel in New York in times square then find tickets for the lion king or MJ the musical that week\r","web":""}
{"id":"composite_124","category":"compositional_tasks_v2","ques":"Can you tell me the cost structure of a one-year certificate program in New York City at the International Center of Photography and how it is different than the same program at the New York Film Academy.\r","web":""}
{"id":"composite_57","category":"compositional_tasks_v2","ques":"I'm deciding between enrolling in stanford vs johns hopkins as a freshman, can you tell me how much a full-year (2 semester or 3 quarter) meal plan costs at each university (assuming I will eat the maximum number allowed or unlimited meals).\r","web":""}
{"id":"composite_43","category":"compositional_tasks_v2","ques":"On genentech's website, first tell me how many open roles there are in the regulatory & quality department at each job level, and secondly filter to the most senior job level and tell me what it's salary range is.\r","web":""}
{"id":"composite_98","category":"compositional_tasks_v2","ques":"Find top 'Software Engineer' roles in Seattle for an established big-tech company on LinkedIn.com and retrieve the associated company name; use the company name on Wikipedia.org to find the year it was founded.\r","web":""}
{"id":"tripadvisor_other_event_5","category":"ticketing","ques":"I plan on going to Fantastic Caverns in Springfield, MO on 12/2/2025 with my wife and two kids under 12. See if there are any discounts available online, either for a group discount or an age discount, and book tickets if any tickets are available at 3:00 PM.\r","web":""}
{"id":"discounts.aaa_theme_park_16","category":"ticketing","ques":"Can you help me buy Walt Disney World theme park tickets for two in Florida from AAA online for any day over 12/11-12/15 ? Please let me know if they're not available.\r","web":""}
{"id":"vacourts.gov_citation_13","category":"ticketing","ques":"Can you help me pay my Virginia traffic ticket online via the Virginia Courts website? Please let me know if there are any issues with completing the payment.\r","web":""}
{"id":"palaciodemafra.pt_other_event_1","category":"ticketing","ques":"Can you help me buya  Mafra Museum visit ticket online from the Palácio de Mafra website on December 20th? Please let me know if they aren't available.\r","web":""}
{"id":"universalorlando_theme_park_16","category":"ticketing","ques":"I plan on going to Universal Orlando Resort in Orlando, FL around Christmastime with my family of four. Could you please assist me in securing tickets? Please let me know if there are any issues or if they're not available.\r","web":""}
{"id":"pacificbonsaimuseum_other_event_1","category":"ticketing","ques":"I really want to see the Weyerhaeuser Company Bonsai Exhibit at the Pacific Bonsai Museum in Federal Way, WA with my boyfriend. Would it be possible to book tickets online for November 28th? Let me know if they're not available anymore.\r","web":""}
{"id":"americasriverroots_music_event_1","category":"ticketing","ques":"Can you help me buy the soonest Celebration Belle Riverfest 2025 tickets for me and my parents? Let me know if they're no longer available.\r","web":""}
{"id":"ludlowgaragecincinnati_music_event_1","category":"ticketing","ques":"Can you help me the upcoming buy Barrington Levy concert tickets online within a 50 mile radius of Cincinnati, OH? Please let me know if they aren't available anymore.\r","web":""}
{"id":"eventbrite_other_event_36","category":"ticketing","ques":"I am based in thie Chicago, IL. Can you help me buy the next Marriott bridal show tickets at a Marriott Hotel in the greater Chicago area on Eventbrite? Please let me know if the tickets aren't available.\r","web":""}
{"id":"romehacks_music_event_1","category":"ticketing","ques":"Can you help me get two tickets for the Vatican museums on January 9th at 1 PM? Let me know if they're not available anymore.\r","web":""}
{"id":"caminitodelrey.info_other_event_2","category":"ticketing","ques":"Can you help me buy 5 Caminito del Rey tickets online in Malaga, Spain from the official Caminito del Rey website in two wees? Please let me know if they aren't available anymore.\r","web":""}
{"id":"ticketmaster_music_event_192","category":"ticketing","ques":"Can you help me buy a ticket at an upcoming event at Shoreline Amphitheatre in Mountain View, CA on Ticketmaster? Please let me know if they're not available.\r","web":""}
{"id":"fandango_movie_87","category":"ticketing","ques":"Can you help me buy 12 Superman 2025 movie tickets online on Fandango next Wednesday? We have four youth in our group. Please let me know if they aren't available.\r","web":""}
{"id":"anaheim_citation_3","category":"ticketing","ques":"Can you help me pay my City of Anaheim Police Department traffic ticket online? Please let me know if there are any issues with completing the payment.\r","web":""}
{"id":"bahn.de_transportation_3","category":"ticketing","ques":"Can you help me buy Deutsche Bahn train tickets from Munich to Vienna online on bahn.de on February 3rd? Please let me know if the tickets aren't available.\r","web":""}
{"id":"amazon_lottery_2","category":"ticketing","ques":"Can you help me buy pre-numbered blank raffle tickets on Amazon? Please let me know if they're not available for purchase.\r","web":""}
{"id":"portalnjmcdirect-cloud.njcourts.gov_citation_35","category":"ticketing","ques":"Can you help me pay my New Jersey municipal court ticket online via NJMCDirect? Please let me know if there are any issues with completing the payment.\r","web":""}
{"id":"showtimes_movie_44","category":"ticketing","ques":"Can you help me buy a Downton Abbey movie tickets online for Dietrich Theater in Tunkhannock, PA? I would prefer seats in the center back. Let me know if they're not available.\r","web":""}
{"id":"morgancountyutah.gov_citation_1","category":"ticketing","ques":"Could you help me pay my ticket online at the Morgan County, Utah District Court? Please let me know if there are any issues with the payment process.\r","web":""}
{"id":"confirmtkt_transportation_1","category":"ticketing","ques":"Can you help me book six round-trip railway tickets online on ConfirmTkt from New Dehli to Mumbai Central?  I would like to travel over March 1st-14th. Let me know if there aren't any tickets available.\r","web":""}
{"id":"buckeyecountrysuperfest_music_event_1","category":"ticketing","ques":"Can you help me buy Buckeye Countryfest tickets from the Buckeye Country Superfest website? Please let me know if they're not available.\r","web":""}
{"id":"united_transportation_10","category":"ticketing","ques":"Could you help me book a United Airlines direct flight ticket on January 7th from Little Rock, Arl to Providence, RI online through United.com? Let me know if there are any issues or if the tickets aren’t available.\r","web":""}
{"id":"costco_theme_park_12","category":"ticketing","ques":"Can you help me buy Universal Studios theme park tickets online from Costco from December 20th to January 2nd for two people? Please let me know if they're not available.\r","web":""}
{"id":"ticketmaster_sporting_event_31","category":"ticketing","ques":"Can you help me buy  three Toronto Maple Leafs game tickets in Toronto, ON  for the upcoming game on NHL.com? Please let me know if they're not available anymore.\r","web":""}
{"id":"lacourt.ca.gov_citation_13","category":"ticketing","ques":"Can you help me pay my Los Angeles County speeding ticket online on the LA Court website? Please let me know if there are any issues with the payment process.\r","web":""}
{"id":"regmovies_movie_58","category":"ticketing","ques":"Can you help me buy three tickets for the any PG-13 movie online at Regal Cinemas near Fairbanks, AK? Please let me know if they aren't available.\r","web":""}
{"id":"thesphere_other_event_20","category":"ticketing","ques":"Can you help me purchase four The Wizard of Oz Experience tickets online on The Sphere website in Las Vegas on December 1st at 5:00 PM? Please let me know if they aren't available.\r","web":""}
{"id":"albemarle.edu_music_event_1","category":"ticketing","ques":"Could you help me reserve two tickets for any event online from the College of the Albemarle Performing Arts Center in Elizabeth City, NC? Please let me know if they're not available.\r","web":""}
{"id":"koobit_music_event_2","category":"ticketing","ques":"Can you help me purchase Florence + The Machine Everybody Scream Tour tickets on StubHUb? Please let me know if they are sold out.\r","web":""}
{"id":"azfamily_citation_1","category":"ticketing","ques":"Can you please help me pay my photo radar traffic ticket online in Paradise Valley, AZ? Let me know if there are any issues processing the payment.\r","web":""}
{"id":"sanbernardino.courts.ca.gov_citation_3","category":"ticketing","ques":"Can you help me pay my San Bernardino County traffic ticket online via the San Bernardino County Superior Court website? Please let me know if there are any issues completing the payment.\r","web":""}
{"id":"flyontario_transportation_1","category":"ticketing","ques":"Could you help me book the first available flight tickets from Ontario International Airport  to New York City using FlyOntario? Please let me know if there are any issues with availability.\r","web":""}
{"id":"stpaul.gov_citation_1","category":"ticketing","ques":"Could you please pay my City of St. Paul parking ticket online for me? Let me know if there are any issues with completing the payment.\r","web":""}
{"id":"mncourts.gov_citation_3","category":"ticketing","ques":"Could you please pay my St. Louis County, MN speeding ticket online through the Minnesota Courts website? Let me know if there are any issues or if you can't complete the payment.\r","web":""}
{"id":"ges.wcs.edu_other_event_1","category":"ticketing","ques":"Can you help me buy the next GES Fest tickets online in Dallas, TX? Please let me know if they're not available.\r","web":""}
{"id":"nerdwallet_theme_park_9","category":"ticketing","ques":"Can you help me buy discounted Epic Universe theme park tickets in Orlando, FL online around Christmastime? Consider looking at blogposts for resources, as well as AAA, Undercover tourist, and other sites with discounted websites. Please let me know if they aren't available.\r","web":""}
{"id":"seattlegreatwheel_theme_park_1","category":"ticketing","ques":"Could you assist me with purchasing Seattle Great Wheel tickets online from the Seattle Great Wheel website on the upcoming Sunday at around 7 PM? Please let me know if they're not available.\r","web":""}
{"id":"aquarionwater_theme_park_1","category":"ticketing","ques":"Can you help me buy discounted Mystic Aquarium tickets online in Mystic, CT for me and my veteran father? I plan on going the upcoming Saturday morning. Let me know if they aren't available anymore.\r","web":""}
{"id":"ticketmaster_music_event_25","category":"ticketing","ques":"Can you help me buy the upcoming Malcolm Todd concert tickets on Ticketmaster? I can travel anywhere in the world. Please let me know if they're no longer available.\r","web":""}
{"id":"pay.baltimorecity.gov_citation_3","category":"ticketing","ques":"Could you help me pay my Baltimore parking tickets online through the Baltimore City website? Please let me know if there are any issues with the payment process.\r","web":""}
{"id":"etickets_sporting_event_1","category":"ticketing","ques":"Could you help me buy Calgary Stampede 2026 tickets online from eTickets.com in Calgary, AB on July 6? Please let me know if they're not available.\r","web":""}
{"id":"quickcourt.biz_citation_4","category":"ticketing","ques":"Can you help me pay my Henderson, LA traffic ticket online using QuickCourt? Please let me know if there are any issues processing the payment.\r","web":""}
{"id":"expedia_transportation_67","category":"ticketing","ques":"Can you help me find cheap plane tickets from New Orleans, LA to El Paso, TX on Expedia? Let me know if there aren't any available flights.\r","web":""}
{"id":"transact2.dmv.ny.gov_citation_3","category":"ticketing","ques":"Can you help me pay a New York traffic ticket online through the NY DMV? Please let me know if there are any issues with completing the payment.\r","web":""}
{"id":"arlandaexpress_transportation_1","category":"ticketing","ques":"Can you help me buy two round-trip Arlanda Express train tickets from Arlanda Express online? I plan on traveling leaving anytime next Friday and staying there for a week. Find discounts if possible. Let me know if they're not available.\r","web":""}
{"id":"stagepittsburgh_music_event_1","category":"ticketing","ques":"Can you help me buy tickets for any upcoming Stage AE 2026 music event at Stage AE in Pittsburgh, PA online? Let me know if they aren't available.\r","web":""}
{"id":"wetzeltaxpiled-technologies_citation_1","category":"ticketing","ques":"Can you help me pay my Wetzel County Sheriff's current tax ticket online? Please let me know if there are any issues with completing the payment.\r","web":""}
{"id":"ticketmaster_music_event_162","category":"ticketing","ques":"Can you help me buy Lady Gaga Mayhem 2026 concert tickets in California on Ticketmaster? Please let me know if they're sold out.\r","web":""}
{"id":"cityofvancouver.us_citation_1","category":"ticketing","ques":"Can you help me pay my City of Vancouver, WA parking ticket online? Please let me know if there are any issues with the payment process.\r","web":""}
{"id":"sugarbowl_other_event_1","category":"ticketing","ques":"Can you help me buy Sugar Bowl ski resort tickets online at SugarBowl.com for Lake Tahoe? I want to go with my family of 5, with 3 young kids. Let me know if it's not available anymore.\r","web":""}
{"id":"reddit_sporting_event_1","category":"ticketing","ques":"Can you help me buy Giants football tickets online the next time they play a home game? Please let me know if they're unavailable.\r","web":""}
{"id":"help.ticketmaster_music_event_10","category":"ticketing","ques":"Can you help me buy two Ariana Grande 2026 tour tickets on Ticketmaster in Los Angeles, CA? Let me know if they're not available anymore.\r","web":""}
{"id":"alltrippers_other_event_1","category":"ticketing","ques":"Can you help me buy London New Year's Eve tickets online? Please let me know if they're not available anymore.\r","web":""}
{"id":"whichmuseum_other_event_21","category":"ticketing","ques":"Can you help me buy five discounted tickets for the upcoming Sunday at 1 PM to the Greater Cleveland Aquarium in Cleveland, OH online? I have three cihldren, ages 7, 10, 13, and I'm traveling with my husband. Let me know if they're not available.\r","web":""}
{"id":"seaworld_theme_park_10","category":"ticketing","ques":"Can you help me buy SeaWorld Orlando theme park tickets online using the ID.me military discount? Please let me know if tickets aren't available.\r","web":""}
{"id":"artic.edu_other_event_1","category":"ticketing","ques":"Could you assist me in getting Art Institute of Chicago college student admission tickets online from the Art Institute of Chicago website? Please let me know if they're not available.\r","web":""}
{"id":"plandisney.disney.go_theme_park_6","category":"ticketing","ques":"Can you help me buy Disneyland theme park tickets online from Sam’s Club in Anaheim, CA? I plan on going during Christmastime with my fiance. Please let me know if they aren't available.\r","web":""}
{"id":"buy_condo_port_aransas__tx_11146","category":"realestate_complex","ques":"I'm looking to buy a condominium in Sea Gull, Port Aransas, TX, that's under $900k, with 2 or more bedrooms, a water view, and low HOA fees. Can you help me find one?\r","web":""}
{"id":"buy_land_naples__fl_13486","category":"realestate_complex","ques":"I'm interested in buying land in Naples, FL. I'd like some options with over 0.5 acres, that are new listings, have no HOA, and preferably offer a water view. Can you help me find something that fits these criteria?\r","web":""}
{"id":"buy_condo_titusville__fl_7914","category":"realestate_complex","ques":"I'm looking for a condo for sale in Titusville, Florida that’s under $500k, has 2 or more bathrooms, offers a water view, and has low HOA fees. Can you help me find something that matches these criteria?\r","web":""}
{"id":"buy_other_alice__tx_18179","category":"realestate_complex","ques":"Can you help me find a commercial property for sale in Alice, Texas that is new to the market, priced between $300k-$600k, and has central AC?\r","web":""}
{"id":"buy_house_amherst__nh_2032","category":"realestate_complex","ques":"Can you help me find a home for sale in Amherst, NH? I'm looking for something between $300k-$600k, with 4 or more bedrooms, over 2000 square feet, and in an area with top-rated schools.\r","web":""}
{"id":"buy_house_madison__wi_6412","category":"realestate_complex","ques":"I'm looking to buy a home in Madison, WI near Sunfield Street. Ideally, I'd like it to have at least 3 bedrooms, 2 bathrooms, central AC, and be located in a walkable neighborhood. Can you help me find something that fits these criteria?\r","web":""}
{"id":"buy_land_lake_county__in_4991","category":"realestate_complex","ques":"I'm looking to buy land for sale by owner in Lake County, Indiana, under $500k, over 0.5 acres, with active listings. Can you show me options that meet my criteria?\r","web":""}
{"id":"buy_house_gallatin__tn_11755","category":"realestate_complex","ques":"I'm interested in buying a home in Gallatin, TN, ideally on Duncan Ave. My budget is between $300k-$600k, and I'm looking for a place with at least 3 bedrooms, a 2-car garage, and access to top-rated schools. Could you help me find listings that meet these criteria?\r","web":""}
{"id":"rent_other_arcata__ca_7137","category":"realestate_complex","ques":"I'm looking to rent a property in Arcata, CA with 2+ bedrooms and in-unit laundry in a walkable neighborhood.\r","web":""}
{"id":"buy_house_provo__ut_15202","category":"realestate_complex","ques":"Can you help me find a house for sale in Provo, UT with 3 or more bedrooms, that's new to the market and has a mountain view?\r","web":""}
{"id":"buy_house_westfield__chatham_hills_5479","category":"realestate_complex","ques":"I'm interested in buying a home in Chatham Hills, Westfield that has 4 or more bedrooms, was built after 2000, and is near top-rated schools. Can you help me find a listing that meets these criteria?\r","web":""}
{"id":"buy_house_chambers_county__tx_2343","category":"realestate_complex","ques":"I'm looking to buy a house in Chambers County, Texas with 3+ bedrooms, 2+ bathrooms, on a large lot, and under $500k. Can you show me listings that meet these criteria?\r","web":""}
{"id":"buy_house_pittsburgh__pa_13147","category":"realestate_complex","ques":"I'm looking to buy a home with a river view in a walkable neighborhood in Pittsburgh, PA. Ideally, it should have 3+ bedrooms, 2+ bathrooms, and be built after 2000. Can you help me find something that fits these criteria?\r","web":""}
{"id":"buy_house_heath__tx_3681","category":"realestate_complex","ques":"Can you help me find new homes for sale in Heath, TX with pools, built after 2000, that have 4+ bedrooms, are new listings, and sit on large lots?\r","web":""}
{"id":"buy_house_houston__tx_15257","category":"realestate_complex","ques":"Can you help me find a move-in ready mobile home to buy in Houston, TX? I'm looking for something under $500k with 3 bedrooms and 2+ bathrooms. You can check listings for me online.\r","web":""}
{"id":"buy_house_florida_18531","category":"realestate_complex","ques":"Can you help me find homes for sale in Florida that are between $300k-$600k, have 3 or more bedrooms, central AC, and are near transit?\r","web":""}
{"id":"buy_land_gun_barrel_city__tx_4916","category":"realestate_complex","ques":"I'm interested in buying land near Gun Barrel City, TX. Can you find active listings over 0.5 acres and under $500k?\r","web":""}
{"id":"buy_house_jackson__tn_2638","category":"realestate_complex","ques":"I'm looking to buy a move-in ready home with 3 bedrooms and central AC in Jackson, TN, priced between $300k and $600k. Can you help me find one that meets these criteria?\r","web":""}
{"id":"buy_townhouse_bolingbrook__il_3053","category":"realestate_complex","ques":"Can you help me find townhomes for sale in Bolingbrook, Illinois with 3 or more bedrooms, at least 2 bathrooms, priced under $400k, and that are new to the market?\r","web":""}
{"id":"buy_house_bossier_city__la_20568","category":"realestate_complex","ques":"I'm looking to buy a small house with 3 bedrooms and 2+ bathrooms under $300k in Bossier City, LA. Can you help me find one that fits these criteria?\r","web":""}
{"id":"buy_house_denton__tx_732","category":"realestate_complex","ques":"I'm looking to buy a home in Robson Ranch, Denton with 3 bedrooms, 2+ bathrooms, an active listing, and a 2-car garage. Can you help me find something that meets these criteria?\r","web":""}
{"id":"rent_apartment_sayville__ny_10236","category":"realestate_complex","ques":"I'm searching for an apartment to rent in Sayville, NY with 2 or more bedrooms, in-unit laundry, and a walkable neighborhood. Can you help me find one?\r","web":""}
{"id":"buy_house_highland__mi_2862","category":"realestate_complex","ques":"Can you help me find homes for sale in Highland, MI with at least 3 bedrooms, 2+ bathrooms, and a large lot?\r","web":""}
{"id":"buy_house_bartlett__tn_12368","category":"realestate_complex","ques":"I'm looking to buy a home in Bartlett, TN with 4+ bedrooms, 2+ bathrooms, a large lot, and central AC. Can you find a listing that meets my criteria?\r","web":""}
{"id":"buy_house_staten_island__ny_2532","category":"realestate_complex","ques":"I'm looking to buy a house in Staten Island, NY that has 4 or more bedrooms, a large lot, and access to top-rated schools. Can you help me find a listing that meets these criteria?\r","web":""}
{"id":"buy_house_columbus__ga_10335","category":"realestate_complex","ques":"Can you show me the latest listings of homes for sale in Columbus, GA with 4+ bedrooms, 2+ bathrooms, under $400k, and central AC?\r","web":""}
{"id":"buy_house_montesano__wa_7329","category":"realestate_complex","ques":"Can you help me find houses for sale in Montesano, WA with 3 or more bedrooms, at least 2 bathrooms, on over 0.5 acres, and that are new to the market?\r","web":""}
{"id":"buy_house_jenks__ok_10654","category":"realestate_complex","ques":"I'm looking to buy a home in Jenks, Oklahoma with 3+ bedrooms, central AC, and a large lot. Can you show me listings?\r","web":""}
{"id":"buy_house_lambertville__mi_20673","category":"realestate_complex","ques":"Could you help me find homes for sale in Lambertville, MI with 3 or more bedrooms, 2 or more bathrooms, a large lot, and central AC?\r","web":""}
{"id":"buy_house_little_rock__ar_17955","category":"realestate_complex","ques":"I'm looking to buy a move-in ready small house in Little Rock, Arkansas. Ideally, it should be under $500k, have 3 bedrooms, and include a 2-car garage. Can you show me options?\r","web":""}
{"id":"rent_house_nashville__tn_8900","category":"realestate_complex","ques":"I'm looking to rent a 3-bedroom, pet-friendly house with central AC in the Morrow Rd area of Nashville, TN. Could you find listings that meet these criteria?\r","web":""}
{"id":"buy_house_the_villages__fl_14171","category":"realestate_complex","ques":"Can you help me find move-in ready homes for sale in The Villages, FL with 3+ bedrooms, 2+ bathrooms, priced between $300k-$600k?\r","web":""}
{"id":"buy_other_lafayette__co_19861","category":"realestate_complex","ques":"I'm looking for condominiums or townhouses for sale in Lafayette, CO with 2+ bathrooms, central AC, and low HOA fees. Could you find me some options?\r","web":""}
{"id":"buy_house_aiken__sc_20679","category":"realestate_complex","ques":"I'm interested in buying a home on Equinox Loop in Aiken, SC with 4+ bedrooms, 2.5+ bathrooms, a large lot, and central AC. Can you find a listing that meets these criteria?\r","web":""}
{"id":"buy_house_temperance__mi_11916","category":"realestate_complex","ques":"Can you help me find homes for sale in Temperance, Michigan with 3 or more bedrooms, at least 2 bathrooms, and priced under $500k?\r","web":""}
{"id":"buy_house_tacoma__wa_12334","category":"realestate_complex","ques":"I'm looking for homes for sale in Tacoma, WA that have 3 bedrooms, 2 or more bathrooms, and are under $500k. Can you show me some options?\r","web":""}
{"id":"rent_land_brodheadsville__pa_12988","category":"realestate_complex","ques":"I'm looking for a commercial lot for rent near Brodheadsville, PA that's under $500k, over 0.5 acres, and new to market. Can you help me find one?\r","web":""}
{"id":"buy_house_lorain__oh_13583","category":"realestate_complex","ques":"I'm looking to buy a move-in ready split level home in Lorain, Ohio with 3 bedrooms, 2+ bathrooms, and over 2000 sq ft. Could you find a listing that meets these criteria?\r","web":""}
{"id":"buy_house_hillsboro__oh_5688","category":"realestate_complex","ques":"I'm interested in buying a house with 3 or more bedrooms, a 2-car garage, a large lot, and central AC in the Hillsboro, Ohio area. Could you show me listings that meet these criteria?\r","web":""}
{"id":"buy_house_oviedo__fl_3554","category":"realestate_complex","ques":"Can you help me find a 3 bedroom house with at least 2 bathrooms in Oviedo, Florida, located near top-rated schools?\r","web":""}
{"id":"buy_house_williamstown__nj_14447","category":"realestate_complex","ques":"Could you assist me in finding move-in ready, new listings with 4 or more bedrooms for sale in Williamstown, NJ?\r","web":""}
{"id":"buy_condo_cranston__ri_16769","category":"realestate_complex","ques":"I'm looking for a condo for sale in Cranston, RI that meets the following criteria: under $500k, 2 bedrooms, low HOA fees, and located in a walkable neighborhood. Can you help me find an option that fits these requirements?\r","web":""}
{"id":"buy_house_lapeer_county__mi_19012","category":"realestate_complex","ques":"I'm searching for a home in Lapeer County, MI that's under $330k. Ideally, it should have 3 bedrooms, 2+ bathrooms, a large lot, and be move-in ready. Can you find options for me?\r","web":""}
{"id":"buy_house_omaha__ne_11006","category":"realestate_complex","ques":"I'm looking to buy a house in Omaha, NE with 4 or more bedrooms, a large lot, and near top-rated schools. Can you find a listing that meets these criteria?\r","web":""}
{"id":"buy_other_minnesota_2733","category":"realestate_complex","ques":"Can you help me find farms for sale in Minnesota that are over 0.5 acres, have central AC, are recently reduced in price, and are move-in ready?\r","web":""}
{"id":"buy_other__13924","category":"realestate_complex","ques":"I'm looking to buy an oceanfront property that is under $500k, has 4 or more bedrooms, offers a water view, and is a new construction. Can you help me find something that fits these criteria?\r","web":""}
{"id":"buy_house_4059_10th_avenue_dr_sw__nc_19159","category":"realestate_complex","ques":"Can you help me find homes with at least 3 bedrooms, 2 or more bathrooms, and built after 2000 in the SW area of North Carolina? Please show me listings that meet these criteria.\r","web":""}
{"id":"buy_house_wyoming__mi_17426","category":"realestate_complex","ques":"I'm looking to buy a home in Wyoming, MI with 3 bedrooms, 2+ bathrooms, and central AC in a walkable neighborhood. Can you show me listings that meet these criteria?\r","web":""}
{"id":"apply_apply_1239","category":"jobs","ques":"Help me apply for an administrative position listed on CareerBuilder and name at least three employers hiring for it according to CareerBuilder's listings\r","web":""}
{"id":"wildcard_wildcard_1969","category":"jobs","ques":"How many remote full time fullfillment center warehouse associate positions are available at Amazon according to their latest job listings?\r","web":""}
{"id":"apply_apply_2864","category":"jobs","ques":"Help me apply for an accounting position in Los Angeles listed on Robert Half's website and output all permanent senior accounting and  accounting manager positions according to Robert Half's listings\r","web":""}
{"id":"apply_apply_1219","category":"jobs","ques":"Help me apply for a chemistry research scientist position in Madison, WI found on LinkedIn and output five listings that would have me be an early application according to the listings. If there are less than five such listings, output them all.\r","web":""}
{"id":"pay_grades_pay_grades_1238","category":"jobs","ques":"I have a CDL. Find 3 entry-level driving jobs in Houston, TX on SimplyHired. What is the guaranteed minimum salary for each of these jobs according to the listings?\r","web":""}
{"id":"employer_landscape_employer_landscape_1359","category":"jobs","ques":"List at least three customer support specialist positions available on the Apple Careers site in New York.\r","web":""}
{"id":"job_id_job_id_127","category":"jobs","ques":"What are the locations for the motorcoach driver positions listed in Iowa on GoWindstar according to GoWindstar's job listings?\r","web":""}
{"id":"salary_range_salary_range_982","category":"jobs","ques":"What is the salary range for at least three available positions that are hiring immediately in McDonough, GA, according to the McDonough job openings page?\r","web":""}
{"id":"benefits_benefits_1624","category":"jobs","ques":"What some benefits are offered for positions listed on RL Carriers Careers?\r","web":""}
{"id":"company_size_company_size_661","category":"jobs","ques":"Tell me how many vacancies there are for Physical Scientist at NOAA on usajobs.gov and where the vacancies are located\r","web":""}
{"id":"apply_apply_2979","category":"jobs","ques":"I'm looking for a cook position that pays at least $18/hr within 25 miles of Cumming, GA. Help me apply for 5 cook positions that meet such criteria on SimpliyHired.\r","web":""}
{"id":"apply_apply_353","category":"jobs","ques":"Help me apply for an economist position in Washington, D.C. listed on USAJobs. Output at least two agencies hiring according to the listings if at least two agencies exist.\r","web":""}
{"id":"apply_apply_2635","category":"jobs","ques":"I'm looking for Home Infusion Nurse positions at the Cigna Group. How many open positions are there in California for this role?\r","web":""}
{"id":"apply_apply_2473","category":"jobs","ques":"I'm seeking a job in Charlotte, NC with Spectrum. Through the Spectrum Jobs website, find me 3 cusomter service jobs\r","web":""}
{"id":"job_titles_job_titles_139","category":"jobs","ques":"how many open opportunities are there at Howard Brown Health careers page in Chicago? What is the first position listed and its Requisition Number?\r","web":""}
{"id":"responsibilities_responsibilities_1537","category":"jobs","ques":"what are the first three \"essential functions\" of a driver with Fedex Freight as listed on one of their job postings?\r","web":""}
{"id":"apply_apply_1546","category":"jobs","ques":"Help me apply for 3 retail sales associate positions near Glen Burnie, MD  that are friendly to veternas\r","web":""}
{"id":"job_id_job_id_253","category":"jobs","ques":"What is the requisition number, salary range, and posting closing date of the first \"comptroller\" job listed on https://jobs.myflorida.com/? And who is the office contact?\r","web":""}
{"id":"apply_apply_2317","category":"jobs","ques":"Help me apply for a customer support position at Thermo Fisher Scientific on their career page. I am looking for a position that only requires a high school diploma, and I would prefer it to be remote.\r","web":""}
{"id":"wording_wording_163","category":"jobs","ques":"What is the exact wording of the first sentence of the job description for a paralegal position on the Nevada Bar Jobs site? Output the job ID as well for my later reference.\r","web":""}
{"id":"wording_wording_2464","category":"jobs","ques":"Find  the exact wording of the first sentence of a job description on The Bair Foundation's Careers page based in Pennsylvania. Also return the ID of the job.\r","web":""}
{"id":"apply_apply_2810","category":"jobs","ques":"I have experience with the Microsoft Office Suite and covers medical insurance. Help me apply for a logistics coordinator position that meets such requirements in Miami, FL using CareerBuilder.\r","web":""}
{"id":"employer_landscape_employer_landscape_961","category":"jobs","ques":"Help me apply for a police officer position in Soldotna, AK  on their government jobs portal if it still exists, and tell me which form I need to fill out and what the hourly wage is.\r","web":""}
{"id":"apply_apply_2022","category":"jobs","ques":"Help me apply for an anthropologist (i.e. researcher, scientist, or professor) position in Washington, D.C. listed on Careers in Anthropology, if available, with a minimum salary of $60,000. Output three organiziations, univerisites, or companies hiring that meets these constraints according to these listings\r","web":""}
{"id":"apply_apply_1003","category":"jobs","ques":"Help me apply for a full-time sales position at Farmers Insurance by navigating their careers page in the US, and let me know if none exist. List the three closest listings to Boston, MA if at least three exist.\r","web":""}
{"id":"salary_range_salary_range_1277","category":"jobs","ques":"What is the salary range for finance positions available at Bank of Texas in Dallas, TX as listed on BOK Financial's career site, specifically for full-time roles? Output at least three of the job listings and the required years of experience for those positions.\r","web":""}
{"id":"apply_apply_174","category":"jobs","ques":"Help me apply for a computer science position located in Rancho Cucamonga, CA, with a minimum salary of $80,000 if available, using LinkedIn. Provide 5  URLs to forms for me to fill out myself.\r","web":""}
{"id":"benefits_benefits_2600","category":"jobs","ques":"Output at least three psychologist positions and their benefits in Kentucky found on LinkedIn that require a Master's degree, if available? Provide links to their forms for job application as well in your output\r","web":""}
{"id":"salary_range_salary_range_1684","category":"jobs","ques":"What is the salary range for any job opening listed on the SSENSE Careers page requiring a Bachelor's degree, if available? Provide a URL for such a job if it exists.\r","web":""}
{"id":"responsibilities_responsibilities_1471","category":"jobs","ques":"What are the main responsibilities listed in a production operations job posting at Grande Cheese from their careers page, specifically for positions that require a minimum of three years of relevant experience?\r","web":""}
{"id":"qualifications_qualifications_724","category":"jobs","ques":"What are the qualifications for environmental scientist positions listed on the South Florida Water Management District careers page open to the public? How do the qualifications vary across listings?\r","web":""}
{"id":"wildcard_wildcard_2597","category":"jobs","ques":"List the salary or salary ranges for five different filing tax consultant positions based in Chicago, IL on Robert Half that require a CPA certification? Output pairs of (employers, salary) in decreasing order of salary.\r","web":""}
{"id":"responsibilities_responsibilities_2088","category":"jobs","ques":"What are the main responsibilities listed in the first administrative position post in Mililani, Hawaii that offers health insurance, if available? Output a link to the job listing as well.\r","web":""}
{"id":"salary_range_salary_range_633","category":"jobs","ques":"What is the salary range for the first logistics coordinator job posting in Miami, FL on LinkedIn, if any exist? Does the job require full-time on-site? How many people does it indicate have already applied?\r","web":""}
{"id":"apply_apply_2722","category":"jobs","ques":"Help me apply for a mid-level software development position at Amazon by reviewing available job postings on their official careers site that offer have a six-figure salary and require proficiency in JavaScript, if any exist. Provide a link to the form for the job.\r","web":""}
{"id":"employer_landscape_employer_landscape_624","category":"jobs","ques":"Can you find any roles for equipment operator positions in Houston, prefereably but not necessarily from Waste Management, offering a minimum salary of $50,000 and at least three years of experience, if available.\r","web":""}
{"id":"apply_apply_2720","category":"jobs","ques":"Help me apply for a finance position at Veritas Partners by exploring opportunities available on HireVeritas. I have five years of work experience and a bachelors in finance, which role would be most appropriate for me?\r","web":""}
{"id":"apply_apply_1288","category":"jobs","ques":"Help me apply for a dentist position in Kentucky on the ADA CareerCenter with at least 401 (k) benefits and effective pay of at least $100/hr, if any exist.\r","web":""}
{"id":"wording_wording_2838","category":"jobs","ques":"What is the exact wording of the first sentence of the job description for the first airline job opening listed in Atlanta on ATL Careers that offers a minimum salary of $50,000 and requires a Bachelor's degree, if any exist? Direct me to a form to the job from the listing as well. Pre-fill the form with the city and state being Atlanta and Georiga, respectively.\r","web":""}
{"id":"apply_apply_1737","category":"jobs","ques":"Help me apply for a firefighter position in Orange County, CA on GovernmentJobs that offers a minimum salary of $50,000 and is open to applicants with a Bachelor's degree, if any exist. List at least three such job postings and summarize how they differ at a high level.\r","web":""}
{"id":"apply_apply_410","category":"jobs","ques":"Help me apply for a maintenance job located in Chicago, IL, that offers a minimum salary of $50,000 and requires at least two years of experience, if any exist. What's a suitable option that can hire immediately?\r","web":""}
{"id":"requirements_requirements_7","category":"jobs","ques":"What are the in-person requirements listed for Kroger jobs available in Atlanta, GA on Kroger Family Careers that are full-time positions and offer health insurance, if any exist? What are the hours like for such positions based on the listings?\r","web":""}
{"id":"apply_apply_2","category":"jobs","ques":"Help me apply for three administrative position in Minnesota listed on GovernmentJobs that pays at least $18/hr and requires a high school diploma, if any exist.\r","web":""}
{"id":"job_titles_job_titles_2726","category":"jobs","ques":"List the titles of available cashier positions at Walmart on their careers page that are full-time and within 10 miles of Chicago, if any exist. What are the 401(k) benefits and salary range?\r","web":""}
{"id":"job_id_job_id_1431","category":"jobs","ques":"What are the job numbers/ID s of three full-time warehouse supervisor positions in the greater Chicago area listed on SimplyHired that offers at least a $60,000 annual salary and requires a bachelor's degree, if any exist? What are the benefits of each of the positions? How many years of experience are required for each one?\r","web":""}
{"id":"employer_landscape_employer_landscape_2701","category":"jobs","ques":"find a store manager or assistant store manager position at dollar general close to new york, NY and tell me the location of the first such listing\r","web":""}
{"id":"salary_range_salary_range_2829","category":"jobs","ques":"is Triomics hiring? Can you tell me the job that has the highest salary that they are hiring for, and would I qualify for it given that I have a masters in clinical biology?\r","web":""}
{"id":"wildcard_wildcard_542","category":"jobs","ques":"What are the 3 most recent job openings shown on The Lash Lounge Careers site and what locations are they for?\r","web":""}
{"id":"qualifications_qualifications_2504","category":"jobs","ques":"I want to apply for a position at Bluegrass Chiro in kentucky; how many positions do they have open and what roles are they for?\r","web":""}
{"id":"apply_apply_50","category":"jobs","ques":"Help me apply for a full-time security position in Florida with allied universal, let me know the requisition id.","web":""}

================================================
FILE: packages/evals/datasets/webvoyager/WebVoyager_data.jsonl
================================================
{"web_name": "Allrecipes", "id": "Allrecipes--0", "ques": "Provide a recipe for vegetarian lasagna with more than 100 reviews and a rating of at least 4.5 stars suitable for 6 people.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--1", "ques": "Find a recipe for a vegetarian lasagna that has at least a four-star rating and uses zucchini.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--2", "ques": "Find a recipe for a vegetarian lasagna under 600 calories per serving that has a prep time of less than 1 hour.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--3", "ques": "Locate a recipe for vegan chocolate chip cookies with over 60 reviews and a rating of at least 4.5 stars on Allrecipes.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--4", "ques": "Find a recipe for Baked Salmon that takes less than 30 minutes to prepare and has at least a 4 star rating based on user reviews.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--5", "ques": "Search for a popular Pasta Sauce with more than 1000 reviews and a rating above 4 stars. Create a shopping list of ingredients for this recipe.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--6", "ques": "Search for a vegetarian lasagna recipe that has at least a four-star rating and over 500 reviews.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--7", "ques": "Find a popular recipe for a chocolate chip cookie and list the ingredients and preparation steps.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--8", "ques": "Search for a recipe for Beef Wellington on Allrecipes that has at least 200 reviews and an average rating of 4.5 stars or higher. List the main ingredients required for the dish.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--9", "ques": "Find a high-rated recipe for vegetarian lasagna, list the key ingredients required, and include the total preparation and cook time stated on the recipe.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--10", "ques": "Find The Most Popular Recipes of the 1960s, noting the recipe name, preparation time and total time of the second recipe in this collection.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--11", "ques": "Discover a suitable chocolate cupcake recipe on Allrecipes that has a preparation time of under 1 hour and at least 100 user reviews.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--12", "ques": "Search for a popular cookie recipe on Allrecipes with more than 1000 reviews and a rating of 4.5 stars or better. Provide the list of ingredients needed.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--13", "ques": "Find a recipe with over 100 reviews for Fried Fish on Allrecipes, list the Full Nutrition Label and tell me the amount of Iron per Serving.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--14", "ques": "Search for a recipe that includes \"chicken breast\" and \"quinoa\" with preparation time under 30 minutes on Allrecipes.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--15", "ques": "Choose a dessert recipe on Allrecipes with a prep time of less than 30 minutes, has chocolate as an ingredient, and has a user rating of 4 stars or higher. Provide the name of the recipe, ingredients list, and step-by-step instructions.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--16", "ques": "Find a five-star rated chocolate chip cookie recipe that takes less than 1 hour to make on Allrecipes. Note how many reviews the recipe has and the main ingredients required.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--17", "ques": "Find the Easy Vegetarian Spinach Lasagna recipe on Allrecipes and tell me what the latest review says.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--18", "ques": "Find a recipe for a vegetarian lasagna that has over 300 reviews and an average rating of 4.5 or higher on Allrecipes.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--19", "ques": "Find a vegan lasagna recipe on Allrecipes that requires 10 ingredients or less and has feedback of more than 200 reviews. Provide a brief overview of the ingredient list and the total prep and cook time.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--20", "ques": "Find a recipe for a cauliflower pizza crust that has a preparation time of under 30 minutes and a rating of at least 4 stars on Allrecipes. Include the number of calories per serving.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--21", "ques": "Locate a high-rated recipe for gluten-free brownies on Allrecipes with at least 50 reviews. List the main ingredients and the total time required for preparation and cooking.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--22", "ques": "Find a recipe for a healthy avocado salad on Allrecipes that has a preparation time of less than 20 minutes and more than 30 user reviews. Include the nutritional information per serving.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--23", "ques": "Search Allrecipes for a baked lemon chicken recipe that has a prep time under 45 minutes, with at least a 4.5-star rating based on user reviews, and over 200 reviews. List the primary ingredients required.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--24", "ques": "Locate a recipe for an eggplant Parmesan on Allrecipes with a rating of at least 4.5 stars and over 50 reviews. Include the preparation time and the number of servings provided by the recipe.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--25", "ques": "Find a popular quinoa salad recipe on Allrecipes with more than 500 reviews and a rating above 4 stars. Create a shopping list of ingredients for this recipe and include the total cooking and preparation time.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--26", "ques": "Search for a high-protein vegetarian chili recipe on Allrecipes that has at least 50 reviews and a rating of 4 stars or higher. Provide the ingredient list, cooking time, and a brief description of the cooking steps.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--27", "ques": "Locate a chicken curry recipe on Allrecipes that has been reviewed more than 30 times and has a rating of at least 4 stars. Provide a summary of the recipe including ingredients, preparation time, and cooking instructions.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--28", "ques": "On Allrecipes, find a vegan brownie recipe that has at least 40 reviews and a rating of 4.5 or higher. Include the list of ingredients, total prep and cook time, and a brief overview of the preparation steps.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--29", "ques": "Search for a Mediterranean-style grilled fish recipe on Allrecipes that includes ingredients like olives, has at least a 4-star rating, and more than 25 reviews. Detail the ingredients, cooking method, and total time required for preparation and cooking.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--30", "ques": "Find a recipe for a vegan smoothie bowl on Allrecipes that includes bananas and leaves, has more than 20 reviews, and a rating of at least 4 stars. Provide a list of ingredients, preparation time, and a summary of the recipe steps.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--31", "ques": "Search for a seafood paella recipe on Allrecipes with a minimum of 4.5 stars rating and at least 50 reviews. The recipe should include shrimp and mussels. Provide the ingredients, total time, and an overview of the preparation steps.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--32", "ques": "Find a high-rated beef stew recipe on Allrecipes that requires a slow cooker and has at least 30 reviews. Detail the cooking time and the first five ingredients listed in the recipe.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--33", "ques": "Find a recipe for a low-carb breakfast on Allrecipes with at least 25 reviews. Show the Nutrition Facts and the total carbohydrate content per serving.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--34", "ques": "Locate a baked salmon recipe on Allrecipes that has at least 50 reviews and a rating of 4.5 stars or higher. Note the primary seasoning or herb used and the estimated cooking time.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--35", "ques": "Search for an Italian-style meatball recipe on Allrecipes that has more than 100 reviews. Detail the type of meat used and the overall cooking time required.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--36", "ques": "Locate a recipe for an American apple pie on Allrecipes with a rating of at least 4 stars and more than 50 reviews. Note the maximum temperature mentioned in the Directions.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--37", "ques": "Search for a Greek salad recipe on Allrecipes that has a prep time of under 25 minutes and more than 15 reviews. Include the primary cheese used and the type of dressing recommended.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--38", "ques": "Find a French ratatouille recipe on Allrecipes with a 4-star rating or higher and at least 15 reviews. Note the variety of vegetables included and the overall cooking time.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--39", "ques": "Locate a recipe for sushi rolls on Allrecipes with a minimum of 20 reviews. Show the Nutrition Facts and the main ingredients. Tell me how to store these rolls.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--40", "ques": "Browse the about us section of Allrecipes for a brief introduction to The Allrecipes Allstars.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--41", "ques": "List 3 recommended dinner recipes in the Allrecipes Dinners section.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--42", "ques": "Find a recipe for banana bread with more than 200 reviews and a rating of at least 4.0 stars on Allrecipes.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--43", "ques": "Find a recipe for a vegan pumpkin pie on Allrecipes with a minimum four-star rating and a total cook time exceeding 1 hour.", "web": "https://www.allrecipes.com/"}
{"web_name": "Allrecipes", "id": "Allrecipes--44", "ques": "List at least 6 holiday recipes sections mentioned in the Occasions section of Allrecipes.", "web": "https://www.allrecipes.com/"}
{"web_name": "Amazon", "id": "Amazon--0", "ques": "Search an Xbox Wireless controller with green color and rated above 4 stars.", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--1", "ques": "Search for women's golf polos in m size, priced between 50 to 75 dollars, and save the lowest priced among results.", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--2", "ques": "Find a gaming desktop with Windows 11 Home, and the disk size should be 1TB.", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--3", "ques": "Find climbing gears and sort the results by price high to low. Answer the first 3 results after sorting.", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--4", "ques": "Find the used Nintendo Switch Lite on Amazon then filter by 'Used - Good', tell me the cheapest one that is 'Used - Good'.", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--5", "ques": "Find a Blue iPhone 12 Pro 128gb and add to cart.", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--6", "ques": "Browse black strollers within $100 to $200 on Amazon. Then find one Among these black strollers with over 20,000 reviews and a rating greater than 4 star.", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--7", "ques": "Browse the women's hiking boots on Amazon and filter the results to show only those that are waterproof and have a rating of at least 4 stars and size 6.", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--8", "ques": "Find the cheapest Samsung-made Android tablet with screen between 10-10.9 inches on Amazon. Only answer the cheapest one.", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--9", "ques": "Find a dog bed on Amazon that is washable and has a length of at least 30 inches.", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--10", "ques": "Find the cost of a 2-year protection for PS4 on Amazon.", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--11", "ques": "Find a stainless steel kitchen sink with double bowls on Amazon. Sort the results and find the cheapest one with FREE delivery.", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--12", "ques": "Check reviews for a Ride On Car with 100+ reviews & 4+ stars rating on Amazon. Give me the top review about this Ride On Car.", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--13", "ques": "Browse best selling black hoodies in mens size Big and Tall that is between $25 and $50 on Amazon.", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--14", "ques": "Find the new surge protector on Amazon with 6 to 8 outlets under 25 dollars with customer reviews above 4+ stars.", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--15", "ques": "Find a pair of mens running shoes in black, size 7, 4+ stars and under $50 and add them to my cart on Amazon.", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--16", "ques": "Find the Return Policy for Mens Rhinestone Skull Graphic Shirt on Amazon. Color: Black, Size: XX-Large. If Free return is avaliable, tell me how to return this item.", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--17", "ques": "Show me the list of baby products that are on sale and under 10 dollars on Amazon. Provide at least 2 on sale products", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--18", "ques": "Open Amazon's home page and tell me what the deal is that is going on at the moment, list the names of at least 2 items that are on offer and tell me what percent off they are.", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--19", "ques": "Look for an English language book on roman empire history in the Amazon Kindle store. Sort by newests arrivals and look for a title that will be released within a month.", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--20", "ques": "Search for a wireless ergonomic keyboard with backlighting and a rating of at least 4 stars. The price should be between $40 to $60. Save the product with the 500+ customer reviews.", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--21", "ques": "Find a stainless steel, 12-cup programmable coffee maker on Amazon. The price range should be between $100 to $200. Report the one with the 4+ customer rating.", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--22", "ques": "Search for a set of non-stick, oven-safe cookware on Amazon. The set should include at least 10 pieces and be priced under $150.", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--23", "ques": "Look for a men's waterproof digital sports watch with a heart rate monitor on Amazon. It should be priced between $50 to $100.", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--24", "ques": "Browse for a compact air fryer on Amazon with a capacity of 2 to 3 quarts. It should have a digital display, auto shutoff and be priced under $100.", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--25", "ques": "Search for a queen-sized, hypoallergenic mattress topper on Amazon. It should have a memory foam material and be priced between $50 to $100.", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--26", "ques": "Find a portable Bluetooth speaker on Amazon with a water-resistant design, under $50. It should have a minimum battery life of 10 hours.", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--27", "ques": "Look for a USB-C hub on Amazon compatible with MacBook Pro, featuring at least 4 ports, including HDMI and SD card reader. The price should be under $50. Select the one after sorting by Best Sellers.", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--28", "ques": "Search for a yoga mat on Amazon that is at least 6mm thick, non-slip, and eco-friendly. The price should be under $50.", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--29", "ques": "Find a set of solar-powered garden lights on Amazon with a minimum pack of 10 lights. They should be LED and priced under $50.", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--30", "ques": "Locate the highest-rated fiction book released in 2024 on Amazon, with a minimum of 50 customer reviews.", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--31", "ques": "Find a compact digital camera on Amazon with a zoom capability of at least 10x, rated 4 stars or higher, and priced between $100 to $300.", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--32", "ques": "Search for an electric kettle on Amazon with a capacity of at least 1.5 liters, made of stainless steel, and with a customer rating of 4 stars or above.", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--33", "ques": "Search for a portable air conditioner on Amazon suitable for a room size of 300 sq ft, with energy efficiency rating, and compare the prices of the top three search results.", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--34", "ques": "Find a beginner's acrylic paint set on Amazon, with at least 24 colors, suitable for canvas painting, and priced under $40.", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--35", "ques": "Find a men's leather wallet on Amazon with RFID blocking, at least 6 card slots, and priced below $50. Check if it's available for FREE delivery.", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--36", "ques": "Search for a children's science experiment kit on Amazon suitable for ages 8-13, with at least a 4-star rating and priced under $30.", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--37", "ques": "Locate a queen-sized bedspread on Amazon with a floral pattern, and check if it's available in blue color.", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--38", "ques": "Find a bird feeder on Amazon suitable for small birds, with an anti-squirrel mechanism, and check if it's available with free shipping.", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--39", "ques": "Locate a travel guide book on Amazon for Japan, published in 2024, with at least 20 customer reviews.", "web": "https://www.amazon.com/"}
{"web_name": "Amazon", "id": "Amazon--40", "ques": "Locate a women's yoga mat in purple, with a thickness of at least 5mm, rated 4+ stars, and priced under $30 on Amazon. Check how many colors are available in total, and what is the return and delivery policy.", "web": "https://www.amazon.com/"}
{"web_name": "Apple", "id": "Apple--0", "ques": "Compare the prices of the latest models of MacBook Air available on Apple's website.", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--1", "ques": "Research the new features of the iOS 17 on Apple support and check its compatibility with the iPhone 12.", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--2", "ques": "Compare the prices and chips for the iPhone 14 Pro and iPhone 15 Pro models directly from Apple's website.", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--3", "ques": "Find the latest model of the iPhone and compare the price and screen size between the pro and pro max.", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--4", "ques": "How much does it cost to buy a Macbook pro, 16-inch, Apple M3 Max chip with 16-core CPU, 40-core GPU, 64GB unified memory, 1TB SSD.", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--5", "ques": "Check the release date and price for the latest version of the iPhone.", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--6", "ques": "Find AirPods on Apple and how many types are currently available.", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--7", "ques": "When and where the Apple Vision Pro will be released.", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--8", "ques": "Identify and list the specifications of the latest iPad model released by Apple, including its storage options, processor type, and display features.", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--9", "ques": "Check the Apple Store for the availability of the latest iPhone model and schedule an in-store pickup at the nearest Apple Store for January 10, 2024.", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--10", "ques": "Find information on the latest (as of today's date) MacBook model, including its key features such as processor type, memory size, and storage capacity.", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--11", "ques": "Get information about the latest iPad model released by Apple, including its release date, base storage capacity, and starting price available on Apple's official website.", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--12", "ques": "What Apple Repair ways are mentioned on apple website, answer 2 of them.", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--13", "ques": "How many colors does the latest MacBook Air come in?", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--14", "ques": "Identify the upgrade options available for the cheapest base model of the MacBook Pro 14-inch with M3 chip, and calculate the total price difference from the base model to the maximum upgrade (no Pre-Installed Software) offered by Apple.", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--15", "ques": "On Apple's website, how many different types of keyboards are available when customizing your 14-inch MacBook Pro?", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--16", "ques": "Find on Apple website how many types of AirPods (3rd generation) are available and what is the price difference.", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--17", "ques": "Search Apple for the accessory Smart Folio for iPad and check the closest pickup availability next to zip code 90038.", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--18", "ques": "Check if there are trade-in offers for the latest model of iPhone.", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--19", "ques": "On Apple's website, what is the slogan for the Mac and what is the slogan for the Macbook pro.", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--20", "ques": "Check the price for an Apple iPhone 14 Plus with 256GB storage in Purple color.", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--21", "ques": "Identify the available storage options for the latest iPad Pro on the Apple website.", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--22", "ques": "Find out the trade-in value for an iPhone 13 Pro Max in good condition on the Apple website.", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--23", "ques": "Determine the price difference between the latest series of Apple Watch and Apple Watch SE on the Apple website.", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--24", "ques": "Find out the starting price for the most recent model of the iMac on the Apple website.", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--25", "ques": "On the Apple website, look up the processor for the latest model of the Apple TV.", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--26", "ques": "Find the maximum video recording resolution supported by the latest iPad mini on the Apple website.", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--27", "ques": "On Apple's website, check if the HomePod mini in store is available in multiple colors and list them.", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--28", "ques": "On the Apple website, find out if the Mac Mini can be configured with a GPU larger than 16-core.", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--29", "ques": "On Apple's website, check the estimated battery life of the latest MacBook Air during web browsing in Tech Specs.", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--30", "ques": "Check the storage options and prices for the latest iPad Pro models on Apple's website.", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--31", "ques": "On Apple's website, what is the slogan for the latest Apple Watch Series.", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--32", "ques": "Investigate the trade-in value for an iPhone 11 Pro Max on Apple's website.", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--33", "ques": "Look for the color options available for the newest iMac.", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--34", "ques": "Identify the size and weight for the Apple TV 4K and list the Siri Remote features introduced.", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--35", "ques": "How many types of Apple Pencil are currently available on the Apple's website? Which one supports Wireless pairing and charging.", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--36", "ques": "Browse Apple Music on the entertainment section of the Apple's website, and see which singers' names are included in the pictures on this page.", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--37", "ques": "Compare the color options of iPhone 13 Pro, iPhone 14 Pro and iPhone 15 Pro.", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--38", "ques": "Explore accessories for Apple Vision Pro, list at least three accessories.", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--39", "ques": "Find solutions on Apple's website if you forgot your Apple ID password.", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--40", "ques": "Find information on Apple website, and tell me the device weight of Apple Vision Pro and list 5 Built-in Apps it supports.", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--41", "ques": "How much does it cost to buy an ipad mini with 64GB storage and Wi-Fi + Cellular connectivity? (no engraving, no apple pencil, no smart folio, no apple trade-in).", "web": "https://www.apple.com/"}
{"web_name": "Apple", "id": "Apple--42", "ques": "Find updates for Apple Watch Series 7,8,9 on Apple's website.", "web": "https://www.apple.com/"}
{"web_name": "ArXiv", "id": "ArXiv--0", "ques": "Search for the latest preprints about 'quantum computing'.", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--1", "ques": "Search for the latest research papers on quantum computing submitted to ArXiv within the last two days.", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--2", "ques": "Look up the most recent papers related to 'cs.CL', select one and show its abstract.", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--3", "ques": "Locate the most recent research paper about 'Algebraic Topology' under Mathematics published on ArXiv. Provide the title of the paper, the name of the authors, and the abstract.", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--4", "ques": "Find the most recent research papers in Astrophysics of Galaxies. How many papers have been announced in the last day?", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--5", "ques": "Search papers about \"quantum computing\" which has been submitted to the Quantum Physics category on ArXiv. How many results in total. What if search in all archives?", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--6", "ques": "How many figures and tables are in the paper \"On the Sentence Embeddings from Pre-trained Language Models\"?", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--7", "ques": "Find the most recent paper submitted on machine learning in the Computer Science category posted on ArXiv.", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--8", "ques": "What is the latest news on ArXiv?", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--9", "ques": "Find the latest research paper about neural networks published on ArXiv which has been submitted within the last week.", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--10", "ques": "Visit ArXiv Help on how to withdraw an article if the submission is not yet announced.", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--11", "ques": "For Non-English submissions, do I need to provide a multi-language abstract, if need, answer the separator between the multiple abstracts.", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--12", "ques": "Find store in arXiv Help, tell me how many styles of arXiv Logo Shirt are available?", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--13", "ques": "How many articles on ArXiv with 'SimCSE' in the title?", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--14", "ques": "On ArXiv, how many articles have 'SimCSE' in the article and are originally announced in October 2023?", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--15", "ques": "Searching Chinese Benchmark on ArXiv, how many papers announced in December 2023 mention being accepted for AAAI 2024?", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--16", "ques": "Locate the latest research about gravitational waves that were uploaded to ArXiv this week and provide a brief summary of one article's main findings.", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--17", "ques": "Find the paper 'GPT-4 Technical Report', when was v3 submitted?", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--18", "ques": "Download the paper 'Dense Passage Retrieval for Open-Domain Question Answering'. How many formulas are in the article and which one is the loss function?", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--19", "ques": "Which university maintains and manages ArXiv. Accessing the university's website from ArXiv, how many underegraduate students are currently at the university.", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--20", "ques": "Find the latest paper on 'machine learning in the Statistics section of ArXiv and provide its abstract.", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--21", "ques": "Search for papers on 'neural networks for image processing' in the Computer Science category on ArXiv and report how many were submitted in the last week.", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--22", "ques": "Locate the ArXiv Help section and find instructions on how to subscribe to daily listing emails for new submissions in a specific category.", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--23", "ques": "Determine how many articles with the keyword 'autonomous vehicles' were published in the 'Electrical Engineering and Systems Science' section of ArXiv yesterday.", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--24", "ques": "Identify the most recent paper related to 'graph neural networks' on ArXiv and determine the affiliation of the first author.", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--25", "ques": "Browse the ArXiv store and let me know how many different types of merchandise are available.", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--26", "ques": "Search for papers related to 'climate change modeling' on ArXiv and find out how many have been published in the Earth and Planetary Astrophysics (astro-ph.EP) category in the last week.", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--27", "ques": "On ArXiv, what categories does Economics include, and what are their abbreviations?", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--28", "ques": "Search 'Poly encoder' by title on ArXiv and check whether the articles in the search results provide HTML access.", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--29", "ques": "On ArXiv, search for papers with 'Neural Network Optimization' in the title published in 2023, and provide the number of such papers.", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--30", "ques": "Look up the submission guidelines on ArXiv for submitting a paper and tell me the formats for figures.", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--31", "ques": "Search ArXiv for papers with 'Graph Neural Networks' in the abstract that were submitted between Jan 1, 2024, and Jan 3, 2024, and determine how many of these papers have more than five authors.", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--32", "ques": "Locate the latest paper on ArXiv within the 'Nonlinear Sciences - Chaotic Dynamics' category, summarize the abstract and note the submission date.", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--33", "ques": "Query ArXiv for the latest research article in the category of Systems and Control under Computer Science. Summarize the main objective or hypothesis presented in the paper and provide the names of the authors.", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--34", "ques": "Search for the most recent paper related to non-commutative geometry submitted by an author with the first name John. Provide the title and the abstract.", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--35", "ques": "Retrieve the latest research paper in Quantum Physics from ArXiv and provide the title, author(s), and date of submission.", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--36", "ques": "Search 'CVPR 2023' and 'CVPR2023' through journal ref on ArXiv to see how many results there are respectively.", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--37", "ques": "Find the names of people in ArXiv's Leadership Team.", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--38", "ques": "Find the ArXiv Blog on the ArXiv website and summarize the content of its latest article.", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--39", "ques": "Search the title 'GPT-4 Technical Report' and access this paper through HTML format. Read the paper on this page and tell me what is 'one of the main goals of developing such models' mentioned in the Introduction.", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--40", "ques": "How many articles are there on each of the three most recent announce days in the Solar and Stellar Astrophysics section of ArXiv. Choose one at random and answer its title and when the first version was uploaded?", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--41", "ques": "Find the button to share arxiv non-profit store and follow the QR code to share the shop. Then add arXiv Forever short sleeve (XL) to your cart.", "web": "https://arxiv.org/"}
{"web_name": "ArXiv", "id": "ArXiv--42", "ques": "Find an article published between 1 January 2000 and 1 January 2005 that requires Support Vector Machines in the title and its Journal ref is ACL Workshop.", "web": "https://arxiv.org/"}
{"web_name": "BBC News", "id": "BBC News--0", "ques": "Find a report on the BBC News website about recent developments in renewable energy technologies in the UK.", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--1", "ques": "Read the latest health-related news article published on BBC News and summarize the key points discussed.", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--2", "ques": "Read the latest article regarding the environmental impacts of deforestation published within the last two days.", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--3", "ques": "Check the leaderboard for Golf's DP World Tour in the SPORT section, what was the name of the most recent tournament, and how many teams have a Total of -10 strokes.", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--4", "ques": "Find the latest article regarding the economic implications of climate change in Europe as reported by BBC News and summarize the central points.", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--5", "ques": "Find the article \"What is climate change? A really simple guide\" and use it to answer what human activities are causing climate change.", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--6", "ques": "Find the top story from BBC News in the technology section for today.", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--7", "ques": "Find an AI-related story under Technology of Business. What is in the first picture in the story?", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--8", "ques": "Get a brief overview of the economic implications of the UK's latest trade deal posted on BBC News and the date when the article was published.", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--9", "ques": "Find out which musician made the headlines in Music News.", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--10", "ques": "Identify the main headlines covering the UK's plan to tackle climate change on BBC News.", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--11", "ques": "Find out how many teams are in the Scottish Premiership of the Football Tournament and when did the Hibernian team's most recent match start?", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--12", "ques": "Find a picture in the travel section that contains food, tell me what the food is called and what region it comes from.", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--13", "ques": "Search for recent news related to Trump and summarize the main points.", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--14", "ques": "Find a news article on BBC News about the impact of the recent tech industry layoffs on the global economy. Summarize the key points and the name of the author, and provide the date of publication.", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--15", "ques": "What does the current headline in Natural Wonders tell about.", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--16", "ques": "Identify the most recent development or update in Brexit negotiations as reported on BBC News and report the key points and any stated impacts on European economies.", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--17", "ques": "How many War related sections are currently in BBC News.", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--18", "ques": "Visit BBC News Audio, What are the best PodCasts for 2023? List 2 of them.", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--19", "ques": "Visit the Athletics calendar for the date of the next earliest game.", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--20", "ques": "Find the latest article in the Green Living section on BBC News and provide a summary of its main points.", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--21", "ques": "Identify the top headline in the World News section on BBC News and describe the region it is related to.", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--22", "ques": "Determine the current top business story on BBC News and give a brief overview of its economic implications.", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--23", "ques": "Identify the latest health-related news on BBC News and summarize the main findings or recommendations.", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--24", "ques": "Search the latest article about space exploration on BBC News and summarize its key points.", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--25", "ques": "Find the most recent sports analysis article on BBC News related to the English Premier League and summarize its key insights.", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--26", "ques": "Locate the latest report on BBC News about the impact of recent natural disasters in Asia and summarize the key points and areas affected.", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--27", "ques": "Find the most recent article on BBC News about archaeological discoveries and summarize the main findings and their significance.", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--28", "ques": "Find the Market Data section on BBC News and tell me which company the data comes from.", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--29", "ques": "Visit BBC News Audio and find out which podcast episode is currently featured as the \"New Releases\".", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--30", "ques": "In the Culture section, identify the latest film release reviewed and provide a brief summary of the review.", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--31", "ques": "Check the Sports section for the result of the most recent Manchester United football match.", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--32", "ques": "Find the artificial intelligence section, what is the top headline at this time, and which companies are involved?", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--33", "ques": "In the World News section, find the latest war situations of Middle East and provide a brief summary.", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--34", "ques": "Find The SpeciaList section in Travel and browse the page to see which cities are mentioned.", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--35", "ques": "In the Asia section, browse and identify the most recent report about technological advancements and summarize its content.", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--36", "ques": "Look up recent articles in the Africa news section in World, summarize what topics most of these news are about", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--37", "ques": "Identify the latest book review featured in the Culture section and provide the title and author of the book.", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--38", "ques": "Find news related to the storm in Weather section and indicate where and when the severe weather occurred.", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--39", "ques": "Check the Horse Racing results in Sport section, browse all the games that took place yesterday and see which one had the highest number of runners.", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--40", "ques": "Read and summarise a recent story on BBC News about people being injured or killed in wars.", "web": "https://www.bbc.com/news/"}
{"web_name": "BBC News", "id": "BBC News--41", "ques": "Find Golf in BBC News, check the Leaderboard at this point in Women's Majors and count which country has the most players in the top 20? Which player has the best score amongst the Australian players and in what place.", "web": "https://www.bbc.com/news/"}
{"web_name": "Booking", "id": "Booking--0", "ques": "Find a Mexico hotel with deals for December 25-26.", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--1", "ques": "Find the cheapest available hotel room for a three night stay from 1st Jan in Jakarta. The room is for 2 adults, just answer the cheapest hotel room and the price.", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--2", "ques": "Find a hotel in Ohio from December 20th to December 23rd for 3 adults and 2 rooms.", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--3", "ques": "Find a hotel with 4 star and above rating in Los Angeles for 3 days from Dec 18th.", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--4", "ques": "Search for the cheapest Hotel near Kashi Vishwanath Temple that offer breakfast from Dec 25th - Dec 26th.", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--5", "ques": "Search a hotel with free WiFi and air conditioning in Bali from Jan 1 to Jan 4, 2024.", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--6", "ques": "Book one room which provides breakfast, and airport shuttle from Jan 22 to 25 in Los Angeles.", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--7", "ques": "Find a hotel room on January 3-6 that is closest to National University of Singapore and costs less than $500", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--8", "ques": "Get the hotel with highest review score and free cancelation in Chennai for 20/12/2023 - 21/12/2023.", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--9", "ques": "Find hotels for 2 adults in London with a price less than 250 dollars for four days starting from December 25. You must browse the page and offer at least 3 options.", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--10", "ques": "Find a well-reviewed hotel in Paris with available bookings suitable for a couple (2 adults) on Valentine's Day week, February 14-21, 2024, that offers free cancellation options.", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--11", "ques": "Reserve a hotel in downtown Chicago with a rating of 9 or higher for a stay from March 20-27, 2024, which offers free cancellation and includes a fitness center.", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--12", "ques": "Find a hotel in Paris with a customer review score of 8 or higher, free Wi-Fi, and available for a 5-night stay starting on January 5th, 2024.", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--13", "ques": "Find and book a hotel in Paris with suitable accommodations for a family of four (two adults and two children) offering free cancellation for the dates of February 14-21, 2024.", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--14", "ques": "Book a highly-rated hotel with a swimming pool and free WiFi near the Louvre Museum in Paris for the weekend of March 3-5, 2024.", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--15", "ques": "Find the highest-rated luxury hotel in Rome available for booking from January 10, 2024, to January 20, 2024, for 2 adults. Include the cost, amenities offered, and customer rating.", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--16", "ques": "Look for a hotel in Paris with a user rating of 9 or higher and available for a 5-night stay starting January 15, 2024. The hotel should also offer free Wi-Fi and breakfast included in the price. Provide the name, location, and price per night.", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--17", "ques": "Find a hotel in Paris with a fitness center and a rating of 8 or higher available for a 5-night stay starting from February 14, 2024, and sort the results by best reviewed.", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--18", "ques": "Search a hotel in London with a user rating of 8 or higher for a stay between February 14th, 2024, and February 21st, 2024, suitable for a couple. Provide the name and a short description of the hotel.", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--19", "ques": "Look for a hotel with customer ratings above an 8.0 in Paris, France for a weekend stay from March 18, 2024, to March 20, 2024, and list top three suggestions based on user reviews.", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--20", "ques": "Locate a hotel in Rome with a good rating (7 or above) that offers free cancellation and breakfast included, for a three-night stay from February 28 to March 2, 2024, for two adults.", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--21", "ques": "Find a hotel in Sydney with a rating of 8 or higher, providing free Wi-Fi and parking, available for a four-night stay starting on March 10, 2024.", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--22", "ques": "Search for a hotel in Amsterdam with a customer review score of 9 or higher, offering bicycle rentals, for a week-long stay from March 15 to March 22, 2024, for two adults.", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--23", "ques": "Identify a hotel in Tokyo with a spa and wellness center, rated 9 or above, with availability for a five-night stay starting on February 20, 2024. Check if free cancellation is offered.", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--24", "ques": "Find a hotel in Barcelona for a stay from February 25-28, 2024. Please sort the results by distance from the beach and make sure they offer free Wi-Fi and breakfast.", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--25", "ques": "Search for a hotel in Lisbon with airport shuttle, rated 8.5 or above, available for a six-night stay from March 1 to March 7, 2024, for two adults, breakfast included.", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--26", "ques": "Check Booking.com for a 3-star hotel or higher in Paris with a guest rating above 8.0 and available parking for dates February 20-23, 2024.", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--27", "ques": "Locate a hotel in Melbourne offering free parking and free WiFi, for a stay from February 28 to March 4, 2024.", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--28", "ques": "Find a hotel in Dubai with a swimming pool, for a week-long stay from February 22 to February 29, 2024.", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--29", "ques": "Search for a hotel in Toronto with a fitness center and a rating of 8+, available for a two-night stay from March 5 to March 7, 2024.", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--30", "ques": "Search for hotels in London from March 20 to March 23, 2024, on Booking. How many hotels are left after applying the Breakfast included and Fitness center filters?", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--31", "ques": "Search for hotels in Rio de Janeiro from March 1-7, 2024, check the Brands filter to see which brand has the most hotels and which brand has the fewest.", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--32", "ques": "Look for hotels in Sydney from February 24 to February 27, 2024, on Booking. Once the Swimming Pool and Airport Shuttle filters are applied, what is the total number of hotels available?", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--33", "ques": "Find the Customer Service on the Booking website, browse the questions about cancellation, and tell me 'how do I know whether my booking has been cancelled'.", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--34", "ques": "Search for a hotel in Berlin available for a three-night stay from March 15 to March 18, 2024, for one adult. Tell me the price in USD and CNY for the three-night stay.", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--35", "ques": "Browse the booking website to get inspiration for your next trip, and summarize at least three places mentioned in one of the travel articles.", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--36", "ques": "Search for a budget hotel in Rome under $100 per night for one adult from March 20 to March 23, 2024. Sort the results by price, identify if any of top three results offer breakfast.", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--37", "ques": "Search for a resort (not hotel) in Bali, detailing the available dates between March 20, 2024, and March 25, 2024, and checking any provided tour or cultural experiences.", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--38", "ques": "Look up Vienna hotel options with availability for a 4-night stay from February 28 to March 4, 2024, with amenities that include parking, breakfast included, and a rating of 8+ on Booking.com.", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--39", "ques": "Find a pet-friendly hotel with parking available in downtown Toronto for the stay of February 24-26, 2024.", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--40", "ques": "I need to choose a hotel in Shenzhen, please select date (6 March to 8 March 2024) and click the search button. How much it costs when convert the price to Chinese Yuan on the page.", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--41", "ques": "Browse Booking's homepage to find out which company it belongs to.", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--42", "ques": "Search for a hotel in Hokkaido for the period March 1 to March 7, 2024, with a rating of 9+, check out its user reviews, which categories are greater than 9 and which are less than 9?", "web": "https://www.booking.com/"}
{"web_name": "Booking", "id": "Booking--43", "ques": "Search for properties in Los Angeles, browse the results page to see what filters are available, list some of them.", "web": "https://www.booking.com/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--0", "ques": "Look up the pronunciation and definition of the word \"sustainability\" on the Cambridge Dictionary.", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--1", "ques": "Find the pronunciation, definition, and a sample sentence for the word 'serendipity'.", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--2", "ques": "Look up the pronunciation, definition, and example sentence for the word \"ubiquitous\" in UK and US English.", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--3", "ques": "Look up the definition, pronunciation, and examples of the word \"zeitgeist.\"", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--4", "ques": "Look for the British English pronunciation of the word \"innovate\" and write down the International Phonetic Alphabet (IPA) notation, then find one example sentence provided in the Cambridge Dictionary that uses this word.", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--5", "ques": "Learn the UK and US pronunciation of the word \"procrastination\", and find one example sentence that reflects its use in context.", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--6", "ques": "Search for the word \"sustainability\" on the Cambridge Dictionary, what is the translation of sustainability into Chinese and French in the dictionary.", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--7", "ques": "Look up the meaning, pronunciation, and an example sentence of the word \"gestalt\" using the Cambridge Dictionary.", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--8", "ques": "Find three different meanings of \"dog\" in Cambridge Dictionary.", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--9", "ques": "Look up the British pronunciation of the word \"euphoria\" and find an example sentence using that word on the Cambridge Dictionary.", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--10", "ques": "Look up the definition and pronunciation of the word \"impeccable\" and also find an example sentence using that word.", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--11", "ques": "Look up the pronunciation and definition of the word \"ameliorate,\" and provide an example sentence using the word.", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--12", "ques": "Find the pronunciation, definition, and a sample sentence for the word \"resilience\" in the Cambridge Dictionary.", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--13", "ques": "Find one word, one phrase and one idiom related to euphoria in Cambridge Dictionary.", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--14", "ques": "Use the Cambridge Dictionary to find the pronunciation, definition, and one example sentence for the word \"concatenate\".", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--15", "ques": "Find the pronunciation and a sample sentence for the word \"pandemic.\"", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--16", "ques": "Look up the definition of \"cryptocurrency\" on Cambridge Dictionary, provide the pronunciation, and use it in two example sentences that illustrate different contexts.", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--17", "ques": "How many meanings of \"unblemished\" are given in Cambridge Dictionary? Please browse the page and give the number directly.", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--18", "ques": "Search for \"to behave well\" in Cambridge Dictionary's Thesaurus and see which synonyms the dictionary gives.", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--19", "ques": "Try a Cambridge Dictionary translation and tell me which company provided the translation.", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--20", "ques": "Look up the definition, pronunciation (both UK and US), and find one example sentence for the word \"altruism\" in the Cambridge Dictionary.", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--21", "ques": "Search for the word \"ephemeral\" on Cambridge Dictionary and find its translation into Spanish.", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--22", "ques": "Use the Cambridge Dictionary to find the definition, UK pronunciation, and an example sentence for the word \"quintessential.\"", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--23", "ques": "Find the US English pronunciation of the word \"meticulous\" using the Cambridge Dictionary and note the International Phonetic Alphabet (IPA) notation, then find one example sentence provided in the dictionary using this word.", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--24", "ques": "Look up the definition and both UK and US pronunciation of the word \"reverie,\" and provide an example sentence using the word from Cambridge Dictionary.", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--25", "ques": "Find two different meanings of the word \"harmony\" in the Cambridge Dictionary.", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--26", "ques": "Search for the word \"nostalgia\" in the Cambridge Dictionary and report the translation of this word into Chinese.", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--27", "ques": "Look up the meaning, pronunciation, and an example sentence of the word \"solitude\" using the Cambridge Dictionary.", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--28", "ques": "Search for \"feel giddy\" in Cambridge Dictionary's Thesaurus and list the synonyms the dictionary provides.", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--29", "ques": "Go to the Plus section of Cambridge Dictionary, find Image quizzes and do an easy quiz about Animals and tell me your final score.", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--30", "ques": "Find the grammar for present perfect simple uses in English, including examples of affirmative, negative, and interrogative sentences, on the Cambridge Dictionary website.", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--31", "ques": "Look up the use of modal verbs in grammar section for expressing possibility (e.g., 'might', 'could', 'may') and find examples of their usage in sentences on the Cambridge Dictionary.", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--32", "ques": "Search for the differences between \"fewer\" and \"less\" in grammar section, and provide examples illustrating their correct usage from the Cambridge Dictionary.", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--33", "ques": "Find explanations and examples of the passive voice in Grammar on the Cambridge Dictionary website.", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--34", "ques": "Use the Cambridge Dictionary to understand the rules for forming and using comparative and superlative adjectives in English Grammar, including example sentences.", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--35", "ques": "Find the most common prepositions that consist of groups of words on the Cambridge Dictionary.", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--36", "ques": "Search for guidelines on using indirect speech in English, with examples of how to change direct speech to indirect speech, on the Cambridge Dictionary.", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--37", "ques": "Use Cambridge Dictionary to understand the use of articles ('a', 'an', 'the') in English Grammar, including examples of usage with both countable and uncountable nouns.", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--38", "ques": "Go to the Plus section of Cambridge Dictionary, finish a recommended Grammar quiz without login and tell me your final score.", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--39", "ques": "Try the Word Scramble game in the Plus section, Can you beat the clock by unscrambling the letters to spell the word? (Just try the first example.)", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--40", "ques": "Look up the definition, pronunciation in UK English, and at least one example using the word 'mitigate'.", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--41", "ques": "Find and browse Cambridge Dictionary Shop section, listing 3 items.", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Cambridge Dictionary", "id": "Cambridge Dictionary--42", "ques": "Convert the Cambridge Dictionary homepage from English (UK) to Deutsch.", "web": "https://dictionary.cambridge.org/"}
{"web_name": "Coursera", "id": "Coursera--0", "ques": "Find a beginner-level online course about '3d printing' which lasts 1-3 months, and is provided by a renowned university.", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--1", "ques": "Search for a beginner-level online course about Python programming, suitable for someone who has no programming experience on Coursera.", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--2", "ques": "Find a Beginner's Spanish Specialization on Coursera and show all the courses in this Specialization.", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--3", "ques": "Identify a new course or Specialization on Coursera related to Python Data Science, sort the courses by newest, what the first course is and which institution offers it.", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--4", "ques": "Identify a course or Specialization on Coursera that helps business process management with a rating 4.7.", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--5", "ques": "Identify a Specialization on Coursera that teaches C++ programming for beginners, provide the name and what the learning outcomes are.", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--6", "ques": "Identify a course on Coursera related to 'Artificial Intelligence for Healthcare' and note the course duration along with the number of quizzes in Assessments.", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--7", "ques": "Find a course on Coursera that teaches Reinforcement Learning for Intermediate with a rating of at least 4.5. Provide the name of the course, the institution offering it, and the number of reviews it has received.", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--8", "ques": "Find a free course related to 'R for Data Science' available on Coursera. Scroll to find a course with the Free tag. What language is the course taught in?", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--9", "ques": "Identify a Coursera course on artificial intelligence ethics that has a duration of less than 20 hours to complete and has been rated 4+ stars by participants.", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--10", "ques": "Locate an introductory course related to artificial intelligence on Coursera, ensuring it's suitable for beginners and contains at least one module discussing Ethical Considerations.", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--11", "ques": "Search for a Specialization on Coursera about project management that is produced by a university, show a testimonial for this Specialization.", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--12", "ques": "Look for a Coursera course (not Specialization) that teaches Java programming basics.", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--13", "ques": "Look for a Specialization on Coursera that teaches Python programming, and identify the skills you will learn by taking this Specialization.", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--14", "ques": "Find a course on Coursera related to Introductory Project Management that includes modules on Agile methodology.", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--15", "ques": "Find a course on Coursera named 'Introduction to Mathematical Thinking' offered by Stanford, what is the percentage (rounded) of 5 star ratings in reviews and which level has the least percentage?", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--16", "ques": "Identify a course on Coursera named 'Introduction to Finance: The Basics', who is the course instructor and what other courses does he/she teach.", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--17", "ques": "How many results are there for a search on Coursera for Machine Learning, then filtered by Credit Eligible and 1-4 Years duration?", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--18", "ques": "Identify a Coursera course that teaches JavaScript, which is beginner-friendly and includes a certificate upon completion.", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--19", "ques": "Identify a course on Coursera that provides an introduction to Psychology, list the instructor's name, the institution offering it, and how many hours it will approximately take to complete.", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--20", "ques": "Find an Intermediate-level online course on Coursera about 'Blockchain Technology' which lasts between 1 to 4 weeks, and is provided by a well-known institution. Also, note the course's main goals and the instructor's name.", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--21", "ques": "Search for an online course on Coursera about 'Digital Marketing', suitable for beginner-level learners. Specify the course duration, the main learning outcomes, and the institution offering the course.", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--22", "ques": "Identify a Specialization on Coursera that focuses on 'Human Resource', list the courses included in this Specialization, and the institution offering it.", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--23", "ques": "Find a course on Coursera about 'Artificial Intelligence Ethics', which has a duration of less than 5 weeks and has been rated 4.5 stars or higher. Provide the course name and the instructor's name.", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--24", "ques": "Locate an online course on Coursera related to 'Sustainability' that belongs to Physical Science and Engineering subject. The course should include a module on Measuring Sustainability. Note the course duration and the offering institution.", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--25", "ques": "Find a course on Coursera about 'Relativity' for beginners. List the course's main topics and the estimated time (in hours) required to complete it.", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--26", "ques": "Identify a Specialization on Coursera that offers an overview of 'Renewable Energy'. The Specialization should be beginner-level and include a course on Renewable Energy Futures. Note the instructor's name and the number of weeks required to complete the course if I spend 5 hours a week.", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--27", "ques": "Search for a Specialization on Coursera about 'Data Visualization' that includes a project. Provide the name of the Specialization, the institution offering it, and the skills that will be developed by completing it.", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--28", "ques": "Locate a Coursera Guided project related to 'Astrophysics' suitable for advanced learners. Mention the course duration, the institution offering it, and the main subjects covered in the course.", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--29", "ques": "Browse the Coursera website and find the price required for one year of Coursera Plus. How much is the discount? Then list 3 companies that work with Coursera.", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--30", "ques": "Locate the course 'Modern Art & Ideas' on Coursera offered by The Museum of Modern Art. Find out the percentage (rounded) of 3-star ratings in the reviews and note which star level has the lowest percentage.", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--31", "ques": "Search for the course 'Exploring Quantum Physics' on Coursera, offered by the University of Maryland, College Park. Identify the percentage (rounded) of 5-star ratings in the reviews.", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--32", "ques": "Search for 'Data Analysis' courses on Coursera. Apply filters to find courses that are 'Beginner Level' and have a duration ranging from 1 to 3 months. Determine the total count of courses that match these specifications.", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--33", "ques": "Find a beginner level Coursera course related to \"Internet of Things (IoT)\" with a high rating. Provide the course name, instructor's name, and a brief summary of the skills that will be taught.", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--34", "ques": "Find the course on Coursera named 'Essentials of Global Health'. Determine the instructor of this course and summarize his bio, note if there are any additional courses he offers on Coursera.", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--35", "ques": "Find a Coursera course on Sustainable Agriculture practices, and detail the course's objectives and the background of the lead instructor.", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--36", "ques": "Browse Coursera, which universities offer Master of Advanced Study in Engineering degrees? Tell me what is the latest application deadline for this degree?", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--37", "ques": "Browse the Coursera homepage and list at least three free courses.", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--38", "ques": "Browse Coursera, which universities and companies from Australia are partners of Coursera? List all of them.", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--39", "ques": "Find the Space Safety course offered by TUM on Coursera. How many videos are there in module 2? What is the name of each video?", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--40", "ques": "Browse Coursera for Business and Coursera for Teams and summarise some of their advantages.", "web": "https://www.coursera.org/"}
{"web_name": "Coursera", "id": "Coursera--41", "ques": "Browse online degrees section on Coursera and list 3 Bachelor's degree programmes.", "web": "https://www.coursera.org/"}
{"web_name": "ESPN", "id": "ESPN--0", "ques": "Look up the current standings for the NBA Eastern Conference on ESPN.", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--1", "ques": "Check the latest articles on ESPN for updates on any trades that occurred in the NBA within the past 2 days.", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--2", "ques": "Show the scores and main highlight of the Milwaukee Bucks game that took place within the last 2 days on ESPN.", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--3", "ques": "Retrieve the final score from the most recent NBA game broadcast on ESPN, including the playing teams' names and the date of the match.", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--4", "ques": "Check ESPN for the final scores of NBA games that were played yesterday.", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--5", "ques": "Identify the top scorer in the NBA from the latest completed game and note down the points scored, the team they play for, and their position on the team.", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--6", "ques": "Find the result of the latest basketball game between the Los Angeles Lakers and the Boston Celtics, including the final score and top scorer from the match.", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--7", "ques": "Retrieve the final score and a brief summary of the latest NBA game played by the Los Angeles Lakers as reported on ESPN.", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--8", "ques": "Find information on ESPN about the top three scoring leaders in the NBA as of the last day of the regular season, and note which teams they play for.", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--9", "ques": "Search on ESPN for how many teams have Los Angeles in their name and how many of them are NBA.", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--10", "ques": "Check ESPN for the score and a brief recap of the latest college football championship game.", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--11", "ques": "How many NBA teams are there and list all the teams with 'New' in their name.", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--12", "ques": "The first three Top Headlines in the current ESPN home page correspond to which sports leagues?", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--13", "ques": "Identify today's top headline in the Basketball section of ESPN, and summarize the main points of that article.", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--14", "ques": "Find the latest news about NBA trades or player movements on ESPN and report the most recent trade deal OR player acquisition.", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--15", "ques": "Check the scores of the NBA games played on December 25, 2023.", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--16", "ques": "Check the schedule for the NBA game on December 25, 2023, and provide the teams that are playing and their current standings in their respective conferences.", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--17", "ques": "Check out the NBA Basketball Power Index 2023-24 to see which teams are in first place and which are in last place.", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--18", "ques": "How many sports leagues can you choose from on the ESPN home page?", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--19", "ques": "Who has the highest salary in Boston Celtics Roster 2023-24?", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--20", "ques": "Look up the current leaders in rebounds and assists in the NBA Western Conference on ESPN.", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--21", "ques": "Show the scores and main highlight of the Denver Nuggets game that occurred within the last 3 days on ESPN.", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--22", "ques": "Find the latest Team transactions in the NBA within the past week.", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--23", "ques": "Find the result of the latest basketball game between the Miami Heat and the New York Knicks, including the final score and top rebounder from the match.", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--24", "ques": "Find the final score from the most recent NFL game broadcast on ESPN, including the teams' names and the date of the match.", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--25", "ques": "Identify the player with the most assists in the latest NBA game and show me the assists, the team they play for, and their position.", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--26", "ques": "Find information on ESPN NBA schedule. Tell me yesterday's matchups in which the loser high was higher than the winner high.", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--27", "ques": "Search on ESPN for how many teams have 'Golden' in their name and how many of them are in the NHL.", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--28", "ques": "How many MLB teams are there and list all the teams with 'City' in their name.", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--29", "ques": "Identify today's top headline in the Soccer section of ESPN, and summarize the main points of that article.", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--30", "ques": "Check out the NHL Standings 2023-24 on ESPN to see which teams are at the top and which are at the bottom in Eastern and Western Conference. What about the situation in Division.", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--31", "ques": "Who has the heaviest weight among infielders in the New York Yankees Roster 2023-24?", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--32", "ques": "Review yesterday's NHL game results on ESPN, focusing on teams' performance.", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--33", "ques": "Locate the latest ESPN articles discussing potential MVP candidates in the NFL for 2023 season.", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--34", "ques": "Visit ESPN to view the Philadelphia 76ers' latest injuries.", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--35", "ques": "Browse ESPN to find out when the next game of the Los Angeles Lakers will start. Then navigate to the ticket purchasing website from ESPN, what is the cheapest ticket available.", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--36", "ques": "Search for Lionel Messi's last 5 games, which teams has he played for, and what are the results?", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--37", "ques": "Check out LeBron James' Stats to see how many games he has played in his career so far.", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--38", "ques": "Check Los Angeles Lakers Stats 2023-24, calculate Anthony Davis' games played (GP) percentage, tell me if there are other players with the same games played percentage as Anthony Davis.", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--39", "ques": "Check the New York Jets Depth Chart in the NFL section of ESPN and identify the players listed as injured in the 2ND position.", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--40", "ques": "Browse the ESPN+ page from ESPN for a brief summary of what ESPN+ Tools is used for.", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--41", "ques": "Find out which four teams the NFC North contains in the NFL on ESPN.", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--42", "ques": "Check out NCAAM standings on ESPN, what are the teams with equal wins and losses in the America East Conference currently?", "web": "https://www.espn.com/"}
{"web_name": "ESPN", "id": "ESPN--43", "ques": "Check out NCAAW recruiting on ESPN, what colleges are the top three players from?", "web": "https://www.espn.com/"}
{"web_name": "GitHub", "id": "GitHub--0", "ques": "Search for an open-source project related to 'climate change data visualization' on GitHub and report the project with the most stars.", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--1", "ques": "Search for an open-source repository for machine learning in Python, specifically focused on decision trees, updated within the last 2 days.", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--2", "ques": "Look for the trending Python repositories on GitHub with most stars.", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--3", "ques": "Find out how much more package storage the Enterprise version has over Team in GitHub Pricing.", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--4", "ques": "Find a popular JavaScript repository created in the last 30 days on GitHub with a Readme file.", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--5", "ques": "Find a Python repository on GitHub that has been updated in the past 2 days and has at least 500 stars.", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--6", "ques": "Search for an open-source project related to 'cryptocurrency wallet' updated in the past 30 days and provide the top three contributors.", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--7", "ques": "Find the official GitHub repository for ALBERT and show me what files the repo changed in the most recent commit.", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--8", "ques": "Look up the latest stable release version of Vuex and find out when it was published.", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--9", "ques": "Locate a repository on GitHub that was created in the last week and has 50 or more stars. Provide brief details about the project's purpose and its programming language.", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--10", "ques": "If I start using Copilot Individual, how much US dollars will it cost per year and what features does it have?", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--11", "ques": "Find a newly created open-source project on GitHub related to 'climate change' that has been initiated in January 2023; check the main programming language used and the project's description.", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--12", "ques": "Retrieve the latest release from the 'electron/electron' repository on GitHub and note down the release version number and date.", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--13", "ques": "Identify the latest top-trending open-source project in the category of 'Machine Learning' on GitHub, and check the number of stars it has received.", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--14", "ques": "Locate the repository for the open-source project \"vscode\" and identify the top three contributors.", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--15", "ques": "Locate a repository on GitHub related to 'quantum computing' that has been updated within the last week and has at least 50 stars. Provide a brief description of the project.", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--16", "ques": "Find the GitHub Skill section and how many courses are under the 'First day on GitHub' heading.", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--17", "ques": "Locate a C++ project on GitHub that has been recently updated in the last week and has at least 500 stars, then describe its main purpose.", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--18", "ques": "Identify and report the most popular (in terms of stars) open-source image processing tool on GitHub.", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--19", "ques": "Look up the most recently updated Python repository on GitHub that is tagged with 'web scraping' and has over 100 stars.", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--20", "ques": "Open GitHub Copilot's FAQs to find the official answer to when Copilot chat can be used on mobile.", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--21", "ques": "Find the Security topic in GitHub Resources and answer the role of GitHub Advanced Security.", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--22", "ques": "Find an open-source repository on GitHub focused on natural language processing in Ruby, updated within the last week.", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--23", "ques": "Find the wiki page of ohmyzsh on GitHub and tell me how to change the theme of zsh to agnoster.", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--24", "ques": "Locate the GitHub repository for the open-source project \"angular\" and identify the last three issues closed.", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--25", "ques": "Search for a 'virtual reality' related repository on GitHub updated in the last 10 days with at least 200 stars and summarize its main objective.", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--26", "ques": "Find the Resolve merge conflicts course in GitHub Skills and what actions learners will perform in this course.", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--27", "ques": "Find a Ruby repository on GitHub that has been updated in the past 3 days and has at least 1000 stars.", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--28", "ques": "Identify the most starred JavaScript repositories on GitHub that were created after 2023-12-29.", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--29", "ques": "Compare the maximum number of private repositories allowed in the Free and Pro plans in GitHub Pricing.", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--30", "ques": "Search for an open-source project related to 'blockchain technology' on GitHub updated in the past 15 days and list the top five contributors.", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--31", "ques": "Find the official GitHub repository for TensorFlow and list the files changed in the last commit. Tell me the name of changed files, total additions and total deletion.", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--32", "ques": "Discover the latest C# repository on GitHub related to 'game development' and having over 150 stars, and describe its main features.", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--33", "ques": "Find Customer Stories on the GitHub page and list the 2 stories that appear on the web page.", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--34", "ques": "Search for an open-source project on GitHub related to 'Protein prediction' and identify the project with the highest number of forks.", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--35", "ques": "Check the latest release version of React and the date it was published on GitHub.", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--36", "ques": "Identify a new open-source project on GitHub related to 'AI agriculture' that was created in 2022, and note its main programming language and description.", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--37", "ques": "List the 3 features mentioned in GitHub's Copilot product page.", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--38", "ques": "Identify and report the most popular (by stars) open-source repo related to cybersecurity on GitHub.", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--39", "ques": "Browse the GitHub Trending and find out which developer is currently ranked first this month and the corresponding repository.", "web": "https://github.com/"}
{"web_name": "GitHub", "id": "GitHub--40", "ques": "Select Sign up on the GitHub homepage to see if email 'test123@gmail.com' already exists.", "web": "https://github.com/"}
{"web_name": "Google Flights", "id": "Google Flights--0", "ques": "Book a journey with return option on same day from Edinburg to Manchester on December 28th and show me the lowest price option available.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--1", "ques": "Show me the list of one-way flights today (February 17, 2024) from Chicago to Paris.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--2", "ques": "Find the lowest fare from all eligible one-way flights for 1 adult from JFK to Heathrow on Jan. 22.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--3", "ques": "Search for the one-way flight available from Calgary to New York on Jan. 1st with the lowest carbon dioxide emissions.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--4", "ques": "Search for one-way flights from New York to London on Dec. 26th and filter the results to show only non-stop flights.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--5", "ques": "Find flights from Chicago to London on 20 December and return on 23 December.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--6", "ques": "Search for a flight on December 19 and return on December 26 from Tel Aviv to Venice and Select First Class.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--7", "ques": "Find a round trip from Phoenix to Miami (Dec. 25th - Dec. 28th), show the First Class plane tickets for me that do not exceed $1320.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--8", "ques": "Search a one-way flight from Dublin to Athens Greece for 1 Adult that leaves on December 30 and analyse the price graph for the next 2 months.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--9", "ques": "Find a one way economy flight from Pune to New York in Jan. 15th and show me how long it will take for flight transfer.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--10", "ques": "Locate the cheapest round-trip flights from New York to Tokyo leaving on January 25, 2024, and returning on February 15, 2024.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--11", "ques": "Compare the prices for round-trip flights from New York to Tokyo for a departure on February 10, 2024, and a return on February 24, 2024, and select the option with the least number of stops.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--12", "ques": "Find the best-priced round-trip flight from New York to London leaving on December 25, 2023, and returning on January 5, 2024, with one stop or fewer.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--13", "ques": "Find the cheapest round-trip flight option from New York City to Tokyo for a departure on January 10, 2024, and a return on January 24, 2024.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--14", "ques": "Compare flight options and find the lowest round trip fare from New York to London departing on January 10, 2024, and returning on January 17, 2024.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--15", "ques": "Compare the prices and total duration of non-stop flights from New York to Tokyo Narita Airport departing on February 12th, 2024, and returning on February 26th, 2024.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--16", "ques": "Find the cheapest one-way flight from New York to Tokyo departing on January 15, 2024, and provide the airline and total flight duration.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--17", "ques": "Find the cheapest round-trip flight from New York to Paris leaving on December 27, 2023, and returning on January 10, 2024.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--18", "ques": "Compare flight options from New York to Tokyo for a round trip leaving on January 25, 2024, and returning on February 15, 2024, for one adult. Prioritize the comparisons by the shortest travel time.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--19", "ques": "Find the cheapest one-way flight from London to Paris, departing on January 25, 2024. Include the airline, total travel time, and layovers for the chosen flight.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--20", "ques": "Book a round-trip flight from San Francisco to Berlin, departing on March 5, 2024, and returning on March 12, 2024, and find the option with the shortest total travel time.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--21", "ques": "Locate the lowest-priced one-way flight from Tokyo to Sydney for an adult, departing on February 25, 2024, and include the flight duration and number of layovers.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--22", "ques": "Find a round-trip flight from Rio de Janeiro to Los Angeles, leaving on March 15, 2024, and returning on March 22, 2024, and select the option with the least carbon dioxide emissions.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--23", "ques": "Search for a one-way flight from Mumbai to Vancouver on February 28, 2024, filtering the results to show only 1-stop flights.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--24", "ques": "Compare prices for economy class round-trip flights from Dubai to Rome, departing on March 1, 2024, and returning on March 8, 2024, and select the option with the fewest stops.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--25", "ques": "Find a one-way business class flight from Buenos Aires to Amsterdam on March 10, 2024, and provide the details of the flight with the shortest duration.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--26", "ques": "Search for the cheapest round-trip flights from Bangkok to Madrid, leaving on February 26, 2024, and returning on February 28, 2024, and provide options under $1000.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--27", "ques": "Locate a one-way flight from Johannesburg to Toronto on March 30, 2024, for one adult, and analyze the price trends for the following month.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--28", "ques": "Find the best-priced round-trip flight from Seattle to Paris, departing on February 27, 2024, and returning on March 1, 2024, with a maximum of one stop.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--29", "ques": "Compare the prices and total travel time of non-stop flights from Mexico City to Frankfurt, departing on March 5, 2024, and returning on March 15, 2024.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--30", "ques": "Find the most affordable one-way flight from Cape Town to Singapore, departing on March 20, 2024, and include the airline and total number of layovers.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--31", "ques": "Find a one-way economy flight from Auckland to Honolulu on March 25, 2024, browse the full page and display a flight option with the most stops.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--32", "ques": "Search for round-trip flights from Stockholm to Toronto, departing on March 3, 2024, and returning on March 10, 2024, and sort the results to find the shortest total travel time.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--33", "ques": "Find a one-way flight from Shanghai to Vancouver on February 27, 2024, and compare the options based on carbon dioxide emissions.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--34", "ques": "Compare business class flight options from Lisbon to Singapore for a one-way trip on March 15, 2024, select one of the flights and see which websites offer its booking options. Which one is the cheapest.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--35", "ques": "Find the lowest-priced one-way flight from Cairo to Montreal on February 21, 2024, including the total travel time and number of stops.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--36", "ques": "Search for round-trip flights from Helsinki to New Delhi, departing on March 28, 2024, and returning on April 4, 2024, and filter the results to show only flights under $1000.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--37", "ques": "Locate a round-trip flight from Buenos Aires to Beijing, leaving on February 28, 2024, and returning on March 3, 2024, check out one of the options and tell me if the airline for my return flight is the same as my departure flight.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--38", "ques": "Compare the prices and flight durations for economy class flights from Oslo to Dubai, departing on March 8, 2024, and show the options with no more than two layovers.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--39", "ques": "Find a one-way flight from Prague to a city in Japan on March 20, 2024, which city in Japan is cheaper to go to, Tokyo or a certain city in Hokkaido?", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--40", "ques": "Browse destinations on the Google Flights homepage from Seattle, look at destinations on a map, and recommend some famous places to travel that are within a reasonable distance and price.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Flights", "id": "Google Flights--41", "ques": "Choose one way business class ticket from Hong Kong to Glacier National Park on 8 March 2024, offering a 1 stop ticket.", "web": "https://www.google.com/travel/flights/"}
{"web_name": "Google Map", "id": "Google Map--0", "ques": "Find 5 beauty salons with ratings greater than 4.8 in Seattle, WA.", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--1", "ques": "Tell me one bus stop that is nearest to the intersection of main street and Amherst street in Altavista.", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--2", "ques": "Find Apple Stores close to zip code 90028", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--3", "ques": "The least amount of walking from Central Park Zoo to the Broadway Theater in New York.", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--4", "ques": "Plan a trip from Boston Logan Airport to North Station.", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--5", "ques": "Search for a parking garage near Thalia Hall in Chicago that isn't open 24 hours.", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--6", "ques": "Find all Uniqlo locations in Chicago, IL.", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--7", "ques": "Find bus stops in Alanson, MI", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--8", "ques": "Find a place to climb within 2 miles of zip code 90028.", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--9", "ques": "Find the art gallery that is nearest to Los Angeles Hindu Temple.", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--10", "ques": "Search for a park in the state of California called Castle Mountains National Monument and find out its Basic Information.", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--11", "ques": "Locate a large store in Washington that has kids' and maternity products, also check if it has a parking lot.", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--12", "ques": "Find 5 places that serve burgers near 44012 zip code and sort these 5 places by highest rating.", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--13", "ques": "Find a parking lot in Gloucester and book a ride from there to North Plymouth, view the map to understand the route better.", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--14", "ques": "Find motorcycle parking near Radio City Music Hall.", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--15", "ques": "Find daytime only parking nearest to Madison Square Garden. Summarize what people are saying about it. ", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--16", "ques": "Find EV charging supported parking closest to Smithsonian museum.", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--17", "ques": "Search for locksmiths open now but not open 24 hours in Texas City.", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--18", "ques": "Find a route between Chicago to Los Angeles, then print the route details.", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--19", "ques": "I will arrive at Pittsburgh Airport soon. Provide the name of the Hilton hotel closest to the airport. Then, tell me the walking time to the nearest supermarket from the hotel.", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--20", "ques": "Find Tesla Destination Charger closest to the National Air and Space Museum.", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--21", "ques": "Identify the nearest bus stop to the corner of Elm Street and Oak Street in Massachusetts.", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--22", "ques": "Find a Best Buy store near zip code 33139.", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--23", "ques": "Determine the shortest walking route from The Metropolitan Museum of Art to Times Square in New York.", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--24", "ques": "Plan a journey from San Francisco International Airport to Union Square via driving.", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--25", "ques": "Search for a parking facility near the Fox Theater in Detroit that closes at night.", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--26", "ques": "Search for Los Angeles on Google Map, try to print the map as PDF and summarize the information on the map.", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--27", "ques": "Locate the Target stores in Atlanta, GA. How many results are shown on the map.", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--28", "ques": "Find the search settings for Google Map, what options are shown on that page?", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--29", "ques": "Identify bus stops in Ypsilanti, MI, list three of them.", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--30", "ques": "Locate a parking lot near the Brooklyn Bridge that is open 24 hours. Review the user comments about it.", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--31", "ques": "First search New York's Central Park Zoo on Google Map, and then find the way to share the map. What is the generated sharing link?", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--32", "ques": "Search for plumbers available now but not open 24 hours in Orlando, FL.", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--33", "ques": "Check out Denver International Airport's information and tell me: 1) which level has the least proportion in reviews; 2) what are its Accessibility and Amenities.", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--34", "ques": "Find a hiking trail within 2 miles of zip code 80202.", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--35", "ques": "Search for a natural reserve in Texas called Big Bend National Park and gather its Basic Information.", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--36", "ques": "Identify 5 restaurants serving pizza near the 30309 zip code and rank them by their ratings.", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--37", "ques": "Locate a parking area in Salem and find a route from there to Marblehead, including map directions for better understanding.", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--38", "ques": "Search for bicycle parking near the Empire State Building.", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--39", "ques": "Find a route from Miami to New Orleans, and provide the detailed route information.", "web": "https://www.google.com/maps/"}
{"web_name": "Google Map", "id": "Google Map--40", "ques": "Find a restaurant in Boston that serves Boston lobster and has a rating of 4.6 or higher, and check out what a one-star review says.", "web": "https://www.google.com/maps/"}
{"web_name": "Google Search", "id": "Google Search--0", "ques": "Find the initial release date for Guardians of the Galaxy Vol. 3 the movie.", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--1", "ques": "Find Kevin Durant's bio", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--2", "ques": "Search for the latest news title about the NBA team the Los Angeles Lakers.", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--3", "ques": "Show me a list of comedy movies, sorted by user ratings. Show me the Top 5 movies.", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--4", "ques": "Show most played games in Steam. And tell me the number of players in In game at this time", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--5", "ques": "find the score of the latest nba game played by the phoenix suns.", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--6", "ques": "Browse the monthly trending searches in Columbus.", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--7", "ques": "Find the software requirements for iPhones that support AirDrop's ability to continue transmitting over the web when out of range.", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--8", "ques": "Find the video on YouTube: 'Oscars 2023: Must-See Moments!'. Tell me who the first comment displayed under that video belongs to, and how many thumbs up and replies it has.", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--9", "ques": "Show the rating of Prometheus movie on IMDb and Rotten Tomatoes.", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--10", "ques": "Find the no. 1 weekly charts ranked artist based on Billboard and tell me 10 most played song by this artist until now.", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--11", "ques": "According to FlightAware, tell me the busiest airport last week and its total arrivals and departures last week.", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--12", "ques": "Find the year that Tom Brady had the most touchdowns in a single season.", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--13", "ques": "What are Jerry Trainor's upcoming projects?", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--14", "ques": "Find the retired players the year before last named James Smith and tell me which club he has been a member of from 2020\u20132021.", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--15", "ques": "Please try to log in to twitter with email: webagenttest@testmail.com and password: test123456. Let me know if the login was successful.", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--16", "ques": "How many members are there in the OpenAI community on Reddit, and what is the hottest news right now?", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--17", "ques": "Tell me the names of Trump's kids", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--18", "ques": "When and where the most recent World Cup was held, and which team was the winner?", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--19", "ques": "What are the first 7 bits of the SHA of the Bert's latest commit on GitHub, and what exactly was changed in that commit.", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--20", "ques": "Find the release date for the latest \"Fast & Furious\" movie.", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--21", "ques": "Show a list of the top 5 highest-grossing animated movies, sorted by box office earnings.", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--22", "ques": "Browse and list the top three trending topics this month in New York City.", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--23", "ques": "Retrieve a short biography of LeBron James.", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--24", "ques": "What is the name of the star system closest to the Solar System, and what are the discovered planets in it?", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--25", "ques": "Get the latest news headline about the English Premier League football club Manchester United.", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--26", "ques": "Identify the hardware requirements for using the latest version of Adobe Photoshop on a Mac.", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--27", "ques": "Check the current air quality index in Paris.", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--28", "ques": "Check the IMDb and Metacritic scores of the movie \"Inception.\"", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--29", "ques": "Find out the current world record for the men's 100m sprint.", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--30", "ques": "Find the current number one artist on the Spotify Global Top 50 chart and list his/her top 10 songs as of now.", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--31", "ques": "Discover which year Cristiano Ronaldo scored the most goals in a single season.", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--32", "ques": "Find out where and when the most recent UEFA Champions League final was held, and which team won.", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--33", "ques": "Find and copy the SHA of the latest commit in the TensorFlow repository on GitHub, then find a textbox to paste and tell me what the SHA is.", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--34", "ques": "Determine the distance from Earth to Mars as of today's date.", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--35", "ques": "Look up the latest research paper related to black holes published in the journal \"Nature Astronomy\".", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--36", "ques": "Search for the most recent Nobel Prize winner in Physics and their contribution to the field.", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--37", "ques": "Find the current top 3 super-earth planets and give a brief introduction to them.", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--38", "ques": "Search for the next visible solar eclipse in North America and its expected date, and what about the one after that.", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--39", "ques": "Identify the top-10 trending travel destinations for 2024 through a blog, how many of them are in Asia.", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--40", "ques": "Look up the elevation of Mount Kilimanjaro on Google Search.", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--41", "ques": "Look up the current statistics of air pollution level in Los Angeles using Google Search.", "web": "https://www.google.com/"}
{"web_name": "Google Search", "id": "Google Search--42", "ques": "Use Google Search to find an article that explains the major differences between American English and British English.", "web": "https://www.google.com/"}
{"web_name": "Huggingface", "id": "Huggingface--0", "ques": "Find a pre-trained natural language processing model on Hugging Face that can perform sentiment analysis, and make sure the model's last update is within March 2023.", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--1", "ques": "Use the Huggingface Inference API to generate a short story about a dragon and a wizard.", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--2", "ques": "Discover three new and popular open-source NLP models for language translation released in the past month on Huggingface.", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--3", "ques": "Look up a model with a license of cc-by-sa-4.0 with the most likes on Hugging face.", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--4", "ques": "Locate an open-source conversational AI model on Hugging Face, trained in English and list its main features and applications.", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--5", "ques": "Find a model released on Hugging Face for recipe generation. Retrieve the information of the model, including its name, model size and tensor type.", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--6", "ques": "Find the model sentence-transformers/all-MiniLM-L6-v2 and use the Inference API on the webpage to get the similarity of the following two sentences: 'Tomorrow is Sunday', 'Eat a burger on Sunday'.", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--7", "ques": "Which is the most downloaded audio related dataset on Hugging face currently.", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--8", "ques": "Retrieve an example of a pre-trained language model in natural language processing and identify the tasks it is specifically designed for, like translation or text summarization.", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--9", "ques": "Find the most downloaded machine translation model on Huggingface which focuses on English and Japanese (en-ja) and report the evaluation metrics stated for it.", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--10", "ques": "Open space: argilla/notux-chat-ui and interact with it by asking it 'which team trained you'. What is its answer.", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--11", "ques": "Identify the latest updated image to video model available on Huggingface and summarize its main features.", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--12", "ques": "Find the most recently updated machine learning model on Huggingface which focuses on Error Correction.", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--13", "ques": "Search for LLaMA in the huggingface doc, what type is the spaces_between_special_tokens parameter in LlamaTokenizer and what is its default value.", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--14", "ques": "How much is the Pro account of Hugging face for a month and what are the features?", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--15", "ques": "Identify the most downloaded models on Hugging face that use the PaddlePaddle library.", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--16", "ques": "Find information on the latest (as of today's date) pre-trained language model on Huggingface suitable for text classification and briefly describe its intended use case and architecture.", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--17", "ques": "Find the most recently updated open-source project related to natural language processing on the Huggingface platform. Provide the project's name, creator, and a brief description of its functionality.", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--18", "ques": "Look up TRL's forward modelling in the hugging face documentation on how to add a margin to a loss.", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--19", "ques": "Explore and summarize the features of the most recent open-source NLP model released by Hugging Face for English text summarization.", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--20", "ques": "Locate a pre-trained natural language processing model on Hugging Face that specializes in named entity recognition (NER), confirm that the model was last updated in 2022 and has 1M+ downloads.", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--21", "ques": "Look up the tour about how to use the 'pipeline' feature in the Hugging Face Transformers library for sentiment analysis, and identify the default model it uses.", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--22", "ques": "Identify the steps to convert a PyTorch model to TensorFlow using the Hugging Face Transformers library as described in their documentation.", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--23", "ques": "Identify three innovative and widely recognized open-source NLP models for automatic speech recognition released in the past month on Huggingface.", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--24", "ques": "Search for a model on Hugging Face with an Apache-2.0 license that has received the highest number of likes.", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--25", "ques": "In the Hugging Face documentation, find the tutorial on loading adapters with PEFT, tell me how to load in 8bit or 4bit.", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--26", "ques": "Identify a model on Hugging Face designed for generating travel chats. Obtain information about the model, including its name, size and training framework.", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--27", "ques": "Determine the most downloaded dataset related to Text Retrieval in NLP on Hugging Face.", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--28", "ques": "Retrieve an example of a pre-trained model on Hugging Face that is optimized for question answering tasks and detail the languages it supports.", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--29", "ques": "Summarize the description of the recent open-source NLP model released on Hugging Face for medical summarization.", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--30", "ques": "Identify the most downloaded English-Chinese (en-zh) machine translation model on Huggingface and report its latest performance metrics and usage guidelines.", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--31", "ques": "Identify the latest machine learning model on Huggingface that specializes in detecting fake news, including the date of its last update.", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--32", "ques": "On the Hugging Face website, search for the model 'GPT-J-6B' and find the 'temperature' parameter in its settings. What is the default value of this parameter?", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--33", "ques": "List three hugging face docs. How many GitHub stars have they earned so far?", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--34", "ques": "List the benefits of hugging face classroom mentioned on Hugging face website.", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--35", "ques": "Find the latest Diffusion-related blog on Hugging Face, and read its intro or overview section to roughly summarize the content of the blog.", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--36", "ques": "Summarize all the payment plans and their advantages in huggingface pricing.", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--37", "ques": "Browse the daily paper on Hugging Face. What is the title of the first article, how many upvotes has it received, and is there any related model or data release?", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--38", "ques": "Investigate the 'transformers' library in the Hugging Face documentation, focusing on how to add new tokens to a tokenizer.", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--39", "ques": "Investigate in the Hugging Face documentation how to utilize the 'Trainer' API for training a model on a custom dataset, and note the configurable parameters of the Trainer class.", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--40", "ques": "Check out Text Embeddings Inference in Hugging face's Doc to summarise the strengths of the toolkit.", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--41", "ques": "What is the current Text-to-3D model with the highest number of downloads and tell me are there Spaces that use the model.", "web": "https://huggingface.co/"}
{"web_name": "Huggingface", "id": "Huggingface--42", "ques": "Check the Dataset Viewer for ai2lumos/lumos_complex_qa_plan_onetime on Hugging face. what is the content corresponding to user in the first message?", "web": "https://huggingface.co/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--0", "ques": "derivative of x^2 when x=5.6", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--1", "ques": "Give a constraint on the set of inequalities for the inner region of the pentagram.", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--2", "ques": "Calculate 3^71 and retain 5 significant figures in scientific notation.", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--3", "ques": "Let g(x) be the integral of x^2 cos(2x). Write the expression of g(x).", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--4", "ques": "Pack 24 circles in a circle radius r. Compare Densest known packing and Square packing. Then tell me the radius of the inner circles.", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--5", "ques": "Show the solution of y\"(z) + sin(y(z)) = 0 from wolframalpha.", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--6", "ques": "Simplify x^5-20x^4+163x^3-676x^2+1424x-1209 so that it has fewer items.", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--7", "ques": "Give the final angle and final length after 6s of a Spring pendulum with spring equilibrium length=0.12m, initial length=0.24m, initial angle=80deg, mass=1kg, spring constant=120 N/m .", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--8", "ques": "Give 12 lbs of 4-cyanoindole, converted to molar and indicate the percentage of C, H, N.", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--9", "ques": "Annual energy production of Diablo Canyon 2 in 2010.", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--10", "ques": "Give the geomagnetic field on June 20, 2023 in Oslo.", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--11", "ques": "Show the electrical resistivity of UNS A92024 and UNS G10800 at 20 degrees Celsius.", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--12", "ques": "Which character in unicode 8900 to 8920 looks like a snowflake", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--13", "ques": "What is 10,000 US dollars worth now in 1980 and in 1970?", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--14", "ques": "Compare the total Calories: whopper vs baconator vs big mac. Assume that each serving of food is 300g.", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--15", "ques": "Show the blood relationship fraction between you and your father's mother's sister's son.", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--16", "ques": "Weight lose for a male with current weight 90 kg, 40 year old, 175 cm. If he intakes 1500 calories every day, how long will it take to lose 17 kg.", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--17", "ques": "Show the average price of movie ticket in Providence, Nashville, Boise in 2023.", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--18", "ques": "Plot Albert Einstein curve with Parametric equations.", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--19", "ques": "Standing in the sun from 11:00 am with SPF 5 in Australia. Approximate time to sunburn for each skin type.", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--20", "ques": "Compute the integral of 3e^(2x) from x=0 to x=5.", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--21", "ques": "Calculate (1+0.1*i)^8 + (1\u22120.2*i)^8  where i is a complex number.", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--22", "ques": "Determine the area of a regular hexagon with a side length of 7 cm.", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--23", "ques": "Calculate the population growth rate of Canada from 2020 to 2023 using Wolfram Alpha.", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--24", "ques": "Solve the differential equation y''(t) - 2y'(t) + 10y(t) = 0 and display its general solution.", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--25", "ques": "Calculate the final position and velocity of a projectile launched at 45 degrees with an initial speed of 30 m/s after 3 seconds.", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--26", "ques": "Convert 15 kilograms of sulfuric acid to moles and display the percentage composition of H, S, and O by weight.", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--27", "ques": "Display the thermal conductivity of Copper (Cu) and Aluminum (Al) at 25 degrees Celsius.", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--28", "ques": "Identify the character in Unicode range 9632 to 9650 that represents a hollow parallelogram.", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--29", "ques": "Create a plot of cat curve using wolfram alpha.", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--30", "ques": "Calculate the estimated time to sunburn for different skin types when exposed to the sun at 1:00 pm with SPF 1 in Brazil.", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--31", "ques": "Using Wolfram Alpha, determine the current temperature and wind speed in Chicago, IL.", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--32", "ques": "Print all prime numbers between 1000 and 1200 using Wolfram alpha.", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--33", "ques": "Identify the electrical energy output of a hydroelectric power plant named Itaipu Dam in 2023 using Wolfram Alpha.", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--34", "ques": "Calculate the mass of Jupiter compared to Earth using Wolfram Alpha. Also, find the length of one day on Jupiter.", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--35", "ques": "Calculate the determinant of a 6x6 Hilbert matrix.", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--36", "ques": "Determine the convergence or divergence of the series \u03a3 (n=1 to \u221e) of 1/(n^3 + 1).", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--37", "ques": "How many days are there between February 12, 2024 and August 9, 2050?", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--38", "ques": "Compute the length of a curve defined by y = 2x^3 - 3x^2 + 4x - 5 from x = 0 to x = 3.", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--39", "ques": "Use Wolfram alpha to write the expression of the ellipse x^2 + 3 y^2 = 4 rotated 33 degrees counterclockwise.", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--40", "ques": "Approximate amount of fat burned by a 28yo, 172cm tall, 70kg woman running for 30min at a pace of 6min/mile.", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--41", "ques": "What is the approximate Heart Rate Reserve of a 50 year old man who has a heart rate of 60bpm at rest.", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--42", "ques": "What is the raw memory of a 100.2\" * 123.5\" true colour picture at 72 ppi?", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--43", "ques": "A polyominoes of order 6 means you have 6 identical squares to combine different shapes (2-sided). How many combinations are there? Looking at all the shapes in the result, how many of them have only 2 rows in total?", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--44", "ques": "Solve the ODE, g' + cos(g) = 0, if there is a constant in the result, determine the value of the constant by the condition that g(0) = 1.", "web": "https://www.wolframalpha.com/"}
{"web_name": "Wolfram Alpha", "id": "Wolfram Alpha--45", "ques": "A 175cm tall, 85kg, 40yo man climbs 2500 steps at about 18cm per step and 40 steps per minute. summarise the Metabolic properties.", "web": "https://www.wolframalpha.com/"}

================================================
FILE: packages/evals/env.ts
================================================
/**
 * Resolves which environment the evaluations target.
 *
 * The choice is driven by the EVAL_ENV environment variable, compared
 * case-insensitively: "browserbase" selects BROWSERBASE, while any other
 * value (or an unset variable) selects LOCAL.
 */
export const env: "BROWSERBASE" | "LOCAL" = ((): "BROWSERBASE" | "LOCAL" => {
  const requested = (process.env.EVAL_ENV ?? "").toLowerCase();
  if (requested === "browserbase") {
    return "BROWSERBASE";
  }
  return "LOCAL";
})();


================================================
FILE: packages/evals/evals.config.json
================================================
{
  "defaults": {
    "env": "local",
    "trials": 3,
    "concurrency": 10,
    "provider": null,
    "model": null,
    "api": false
  },
  "benchmarks": {
    "webbench": {
      "limit": 25,
      "filters": ["difficulty", "category", "use_hitl"]
    },
    "gaia": {
      "limit": 25,
      "filters": ["level"]
    },
    "webvoyager": {
      "limit": 25
    },
    "osworld": {
      "limit": 25,
      "filters": ["source", "evaluation_type"],
      "timeout": 60000
    },
    "onlineMind2Web": {
      "limit": 25
    },
    "webtailbench": {
      "limit": 25
    }
  },
  "tasks": [
    {
      "name": "history",
      "categories": ["combination"]
    },
    {
      "name": "extract_repo_name",
      "categories": ["extract"]
    },
    {
      "name": "amazon_add_to_cart",
      "categories": ["act"]
    },
    {
      "name": "instructions",
      "categories": ["regression", "combination"]
    },
    {
      "name": "bidnet",
      "categories": ["act"]
    },
    {
      "name": "ionwave",
      "categories": ["act", "regression"]
    },
    {
      "name": "nonsense_action",
      "categories": ["act"]
    },
    {
      "name": "peeler_simple",
      "categories": ["act"]
    },
    {
      "name": "simple_google_search",
      "categories": ["act"]
    },
    {
      "name": "vantechjournal",
      "categories": ["act"]
    },
    {
      "name": "wikipedia",
      "categories": ["act"]
    },
    {
      "name": "allrecipes",
      "categories": ["combination"]
    },
    {
      "name": "arxiv",
      "categories": ["combination"]
    },
    {
      "name": "extract_collaborators",
      "categories": ["combination"]
    },
    {
      "name": "extract_github_commits",
      "categories": ["combination"]
    },
    {
      "name": "imdb_movie_details",
      "categories": ["combination"]
    },
    {
      "name": "peeler_complex",
      "categories": ["combination"]
    },
    {
      "name": "sciquest",
      "categories": ["combination"]
    },
    {
      "name": "wichita",
      "categories": ["combination", "regression"]
    },
    {
      "name": "hn_aisdk",
      "categories": ["llm_clients"]
    },
    {
      "name": "hn_langchain",
      "categories": ["llm_clients"]
    },
    {
      "name": "hn_customOpenAI",
      "categories": ["llm_clients"]
    },
    {
      "name": "apple",
      "categories": ["experimental"]
    },
    {
      "name": "combination_sauce",
      "categories": ["experimental"]
    },
    {
      "name": "costar",
      "categories": ["experimental"]
    },
    {
      "name": "extract_aigrant_companies",
      "categories": ["regression"]
    },
    {
      "name": "extract_capacitor_info",
      "categories": ["experimental"]
    },
    {
      "name": "extract_partners",
      "categories": ["experimental"]
    },
    {
      "name": "extract_press_releases",
      "categories": ["experimental"]
    },
    {
      "name": "extract_snowshoeing_destinations",
      "categories": ["experimental"]
    },
    {
      "name": "homedepot",
      "categories": ["experimental"]
    },
    {
      "name": "rakuten_jp",
      "categories": ["experimental"]
    },
    {
      "name": "stock_x",
      "categories": ["experimental"]
    },
    {
      "name": "ted_talk",
      "categories": ["experimental"]
    },
    {
      "name": "extract_baptist_health",
      "categories": ["extract"]
    },
    {
      "name": "extract_github_stars",
      "categories": ["extract"]
    },
    {
      "name": "extract_memorial_healthcare",
      "categories": ["extract", "regression"]
    },
    {
      "name": "extract_nhl_stats",
      "categories": ["extract"]
    },
    {
      "name": "extract_professional_info",
      "categories": ["extract"]
    },
    {
      "name": "extract_csa",
      "categories": ["extract"]
    },
    {
      "name": "extract_resistor_info",
      "categories": ["extract"]
    },
    {
      "name": "extract_rockauto",
      "categories": ["extract"]
    },
    {
      "name": "extract_staff_members",
      "categories": ["extract"]
    },
    {
      "name": "ionwave_observe",
      "categories": ["observe"]
    },
    {
      "name": "panamcs",
      "categories": ["observe"]
    },
    {
      "name": "vanta_h",
      "categories": ["experimental"]
    },
    {
      "name": "extract_area_codes",
      "categories": ["extract"]
    },
    {
      "name": "extract_public_notices",
      "categories": ["extract"]
    },
    {
      "name": "extract_jstor_news",
      "categories": ["extract"]
    },
    {
      "name": "extract_apartments",
      "categories": ["extract"]
    },
    {
      "name": "extract_zillow",
      "categories": ["extract"]
    },
    {
      "name": "observe_github",
      "categories": ["observe", "regression"]
    },
    {
      "name": "observe_vantechjournal",
      "categories": ["observe", "regression"]
    },
    {
      "name": "observe_amazon_add_to_cart",
      "categories": ["observe"]
    },
    {
      "name": "observe_simple_google_search",
      "categories": ["observe"]
    },
    {
      "name": "observe_yc_startup",
      "categories": ["observe"]
    },
    {
      "name": "observe_taxes",
      "categories": ["observe"]
    },
    {
      "name": "observe_iframes1",
      "categories": ["regression", "observe"]
    },
    {
      "name": "observe_iframes2",
      "categories": ["regression", "observe"]
    },
    {
      "name": "extract_hamilton_weather",
      "categories": ["targeted_extract", "regression"]
    },
    {
      "name": "extract_regulations_table",
      "categories": ["targeted_extract"]
    },
    {
      "name": "extract_recipe",
      "categories": ["targeted_extract"]
    },
    {
      "name": "extract_aigrant_targeted",
      "categories": ["targeted_extract"]
    },
    {
      "name": "extract_aigrant_targeted_2",
      "categories": ["targeted_extract"]
    },
    {
      "name": "extract_geniusee",
      "categories": ["targeted_extract"]
    },
    {
      "name": "extract_geniusee_2",
      "categories": ["targeted_extract"]
    },
    {
      "name": "scroll_50",
      "categories": ["regression", "act"]
    },
    {
      "name": "scroll_75",
      "categories": ["regression", "act"]
    },
    {
      "name": "next_chunk",
      "categories": ["regression", "act"]
    },
    {
      "name": "prev_chunk",
      "categories": ["regression", "act"]
    },
    {
      "name": "google_flights",
      "categories": ["act"]
    },
    {
      "name": "extract_jfk_links",
      "categories": ["extract"]
    },
    {
      "name": "extract_single_link",
      "categories": ["extract"]
    },
    {
      "name": "dropdown",
      "categories": ["act"]
    },
    {
      "name": "radio_btn",
      "categories": ["act"]
    },
    {
      "name": "checkboxes",
      "categories": ["act"]
    },
    {
      "name": "agent/iframe_form",
      "categories": ["agent"]
    },
    {
      "name": "agent/iframe_form_multiple",
      "categories": ["agent"]
    },
    {
      "name": "agent/google_flights",
      "categories": ["agent"]
    },
    {
      "name": "agent/github_react_version",
      "categories": ["agent"]
    },
    {
      "name": "agent/steam_games",
      "categories": ["agent"]
    },
    {
      "name": "agent/ubereats",
      "categories": ["agent"]
    },
    {
      "name": "agent/kith",
      "categories": ["agent"]
    },
    {
      "name": "agent/apple_tv",
      "categories": ["agent"]
    },
    {
      "name": "agent/apple_trade_in",
      "categories": ["agent"]
    },
    {
      "name": "agent/arxiv_gpt_report",
      "categories": ["agent"]
    },
    {
      "name": "agent/sf_library_card",
      "categories": ["agent"]
    },
    {
      "name": "agent/sf_library_card_multiple",
      "categories": ["agent"]
    },
    {
      "name": "agent/hugging_face",
      "categories": ["agent"]
    },
    {
      "name": "agent/google_maps_3",
      "categories": ["agent"]
    },
    {
      "name": "login",
      "categories": ["act", "regression"]
    },
    {
      "name": "iframe_hn",
      "categories": ["extract"]
    },
    {
      "name": "iframe_same_proc",
      "categories": ["act"]
    },
    {
      "name": "iframe_form_filling",
      "categories": ["act"]
    },
    {
      "name": "iframes_nested",
      "categories": ["act"]
    },
    {
      "name": "no_js_click",
      "categories": ["act", "regression"]
    },
    {
      "name": "tab_handling",
      "categories": ["act"]
    },
    {
      "name": "agent/kayak",
      "categories": ["agent"]
    },
    {
      "name": "multi_tab",
      "categories": ["act"]
    },
    {
      "name": "shadow_dom",
      "categories": ["act"]
    },
    {
      "name": "os_dropdown",
      "categories": ["act"]
    },
    {
      "name": "custom_dropdown",
      "categories": ["act"]
    },
    {
      "name": "hidden_input_dropdown",
      "categories": ["act"]
    },
    {
      "name": "nested_iframes_2",
      "categories": ["act"]
    },
    {
      "name": "heal_scroll_50",
      "categories": ["act"]
    },
    {
      "name": "heal_simple_google_search",
      "categories": ["regression", "act"]
    },
    {
      "name": "heal_custom_dropdown",
      "categories": ["act"]
    },
    {
      "name": "agent/trivago",
      "categories": ["agent"]
    },
    {
      "name": "agent/google_maps",
      "categories": ["agent"]
    },
    {
      "name": "agent/google_maps_2",
      "categories": ["agent"]
    },
    {
      "name": "agent/sign_in",
      "categories": ["agent"]
    },
    {
      "name": "osr_in_oopif",
      "categories": ["act"]
    },
    {
      "name": "csr_in_oopif",
      "categories": ["act"]
    },
    {
      "name": "csr_in_spif",
      "categories": ["act"]
    },
    {
      "name": "spif_in_osr",
      "categories": ["act"]
    },
    {
      "name": "oopif_in_osr",
      "categories": ["act"]
    },
    {
      "name": "spif_in_csr",
      "categories": ["act"]
    },
    {
      "name": "oopif_in_csr",
      "categories": ["act"]
    },
    {
      "name": "osr_in_spif",
      "categories": ["act"]
    },
    {
      "name": "namespace_xpath",
      "categories": ["act"]
    },
    {
      "name": "iframe_scroll",
      "categories": ["act"]
    },
    {
      "name": "agent/gaia",
      "categories": ["external_agent_benchmarks"]
    },
    {
      "name": "agent/webvoyager",
      "categories": ["external_agent_benchmarks"]
    },
    {
      "name": "agent/nba_trades",
      "categories": ["agent"]
    },
    {
      "name": "agent/hotel_booking",
      "categories": ["agent"]
    },
    {
      "name": "agent/github",
      "categories": ["agent"]
    },
    {
      "name": "agent/all_recipes",
      "categories": ["agent"]
    },
    {
      "name": "agent/onlineMind2Web",
      "categories": ["external_agent_benchmarks"]
    },
    {
      "name": "agent/webtailbench",
      "categories": ["external_agent_benchmarks"]
    },
    {
      "name": "agent/alibaba_supplier_search",
      "categories": ["agent"]
    },
    {
      "name": "agent/amazon_shoes_cart",
      "categories": ["agent"]
    },
    {
      "name": "agent/columbia_tuition",
      "categories": ["agent"]
    },
    {
      "name": "agent/flipkart_laptops",
      "categories": ["agent"]
    },
    {
      "name": "agent/google_shopping",
      "categories": ["agent"]
    },
    {
      "name": "agent/hotels_paris_amenities",
      "categories": ["agent"]
    },
    {
      "name": "agent/instacart_organic_bananas",
      "categories": ["agent"]
    },
    {
      "name": "agent/kfc_tenders_combo",
      "categories": ["agent"]
    },
    {
      "name": "agent/made_in_china_supplier",
      "categories": ["agent"]
    },
    {
      "name": "agent/nvidia_hgx_driver",
      "categories": ["agent"]
    },
    {
      "name": "agent/oed_word_search",
      "categories": ["agent"]
    },
    {
      "name": "agent/radiotimes_tv_schedule",
      "categories": ["agent"]
    },
    {
      "name": "agent/redfin_apartment_rental",
      "categories": ["agent"]
    },
    {
      "name": "agent/thegamer_opinion_article",
      "categories": ["agent"]
    },
    {
      "name": "agent/trailhead_superbadge",
      "categories": ["agent"]
    },
    {
      "name": "agent/trustpilot_hr_companies",
      "categories": ["agent"]
    },
    {
      "name": "agent/uniqlo_mens_blazers",
      "categories": ["agent"]
    },
    {
      "name": "agent/webmd_audiologist_search",
      "categories": ["agent"]
    },
    {
      "name": "agent/webmd_ovulation_calculator",
      "categories": ["agent"]
    }
  ]
}


================================================
FILE: packages/evals/index.eval.ts
================================================
/**
 * This script orchestrates the running of evaluations against a set of tasks.
 * It uses Braintrust to run multiple testcases (each testcase representing a
 * given task-model combination) and then aggregates the results, producing
 * a summary of passes, failures, and categorized success rates.
 *
 * Overview:
 * - Reads a configuration file `evals.config.json` to determine what tasks (evaluations)
 *   are available and which categories they belong to.
 * - Supports filtering which tasks to run either by evaluation category or by specific task name.
 * - Supports multiple models, defaulting to certain sets of models depending on the category.
 * - Runs each selected task against each selected model in parallel, collecting results.
 * - Saves a summary of the evaluation results to `../../eval-summary.json`.
 */
import fs from "node:fs";
import path from "node:path";
import process from "node:process";
import { pathToFileURL } from "node:url";
import {
  DEFAULT_EVAL_CATEGORIES,
  filterByCategory,
  filterByEvalName,
} from "./args.js";
import { generateExperimentName } from "./utils.js";
import { exactMatch, errorMatch } from "./scoring.js";
import {
  tasksByName,
  tasksConfig,
  getModelList,
  getAgentModelEntries,
} from "./taskConfig.js";
import { Eval } from "braintrust";
import { SummaryResult, Testcase, EvalInput } from "./types/evals.js";
import { EvalLogger } from "./logger.js";
import {
  AvailableModel,
  LLMClient,
  StagehandEvalError,
  AgentProvider,
  loadApiKeyFromEnv,
  LogLine,
  getAISDKLanguageModel,
} from "@browserbasehq/stagehand";
import { AISdkClientWrapped } from "./lib/AISdkClientWrapped.js";
import { env } from "./env.js";
import { initV3 } from "./initV3.js";
import { generateSummary } from "./summary.js";
import { buildGAIATestcases } from "./suites/gaia.js";
import { buildWebVoyagerTestcases } from "./suites/webvoyager.js";
import { buildOnlineMind2WebTestcases } from "./suites/onlineMind2Web.js";
import { endBrowserbaseSession } from "./browserbaseCleanup.js";
import { buildWebTailBenchTestcases } from "./suites/webtailbench.js";
import { getCurrentDirPath } from "./runtimePaths.js";

import dotenv from "dotenv";
// Load variables from a .env file (if one exists) into process.env before
// any of the environment-driven settings below are read.
dotenv.config();

// Directory path reported by getCurrentDirPath(); presumably the directory
// containing this module — confirm against runtimePaths.
const moduleDir = getCurrentDirPath();

/**
 * Parses a positive integer from a raw environment-variable value.
 *
 * @param raw - The raw string, or undefined when the variable is unset.
 * @param fallback - Value used when `raw` is unset, empty, non-numeric, or
 *   not strictly positive.
 * @returns The parsed base-10 integer, or `fallback`.
 */
const parsePositiveIntOrDefault = (
  raw: string | undefined,
  fallback: number,
): number => {
  if (!raw) {
    return fallback;
  }
  const parsed = parseInt(raw, 10);
  // parseInt yields NaN for non-numeric input; `NaN > 0` is false, so a
  // malformed value falls back instead of leaking NaN into the eval settings.
  return parsed > 0 ? parsed : fallback;
};

/**
 * Read max concurrency and trial count from environment variables set in args.ts.
 * Fall back to the defaults (3 and 3) if they're not provided or are not
 * positive integers.
 */
const MAX_CONCURRENCY = parsePositiveIntOrDefault(
  process.env.EVAL_MAX_CONCURRENCY,
  3,
);

const TRIAL_COUNT = parsePositiveIntOrDefault(process.env.EVAL_TRIAL_COUNT, 3);

// True only when the USE_API environment variable is "true" (case-insensitive);
// the resolved value is logged once at startup.
const USE_API: boolean = (process.env.USE_API ?? "").toLowerCase() === "true";
console.log(`[EVALS] USE_API: ${USE_API}`);

/**
 * generateFilteredTestcases:
 * Builds the set of testcases for this run. Each testcase is a combination of
 * a task and a model.
 *
 * Steps:
 * - Choose the task names: the single requested eval, every task in the
 *   requested category, or every task in one of `DEFAULT_EVAL_CATEGORIES`.
 * - Choose the models with `getModelList`; a single task whose only category is
 *   "agent" or "external_agent_benchmarks" is treated as an agent-category run.
 * - Fan out the dataset-backed benchmark tasks (GAIA, WebVoyager,
 *   Online-Mind2Web, WebTailBench) through their builders, honoring the
 *   optional `EVAL_DATASET` filter.
 * - Cross every remaining task with every model entry.
 * - Re-apply the category filter and, in the BROWSERBASE environment, exclude
 *   tasks that are not suitable there.
 *
 * @returns The testcases to hand to the eval runner.
 */
const generateFilteredTestcases = (): Testcase[] => {
  // Snapshot the module-level filters into constants so TypeScript keeps them
  // narrowed inside the callbacks below (no non-null assertions required).
  const evalNameFilter = filterByEvalName;
  const categoryFilter = filterByCategory;

  let taskNamesToRun: string[];
  let effectiveCategory: string | null = categoryFilter; // Start with the command-line filter

  if (evalNameFilter) {
    // If a specific task name is given, that's the only one we run
    taskNamesToRun = [evalNameFilter];
    // Check if this single task belongs to agent-related categories to override models
    const taskCategories = tasksByName[evalNameFilter]?.categories || [];
    if (
      taskCategories.length === 1 &&
      (taskCategories[0] === "agent" ||
        taskCategories[0] === "external_agent_benchmarks")
    ) {
      // Treat this run as an agent category run for model selection
      effectiveCategory = taskCategories[0];
      console.log(
        `Task ${evalNameFilter} is in ${taskCategories[0]} category, using agent models.`,
      );
    }
  } else if (categoryFilter) {
    // If filtering by category, get all tasks in that category
    taskNamesToRun = Object.keys(tasksByName).filter((name) =>
      tasksByName[name].categories.includes(categoryFilter),
    );
  } else {
    // If no specific task or category filter, run tasks from default categories
    taskNamesToRun = Object.keys(tasksByName).filter((name) =>
      DEFAULT_EVAL_CATEGORIES.some((category) =>
        tasksByName[name].categories.includes(category),
      ),
    );
  }

  // Dynamically determine the MODELS based on the effective category
  const currentModels = getModelList(effectiveCategory);

  console.log(
    `Using models for this run (${effectiveCategory || "default"}):`,
    currentModels,
  );

  // Check for dataset filter from environment
  const datasetFilter = process.env.EVAL_DATASET;

  // Dataset-backed benchmark tasks. Each one is a placeholder task name that is
  // replaced by the testcases produced by its builder. Order matters: it is the
  // order in which the fanned-out testcases appear in the final list.
  const datasetSuites: {
    taskName: string;
    dataset: string;
    build: (models: typeof currentModels) => Testcase[];
  }[] = [
    { taskName: "agent/gaia", dataset: "gaia", build: buildGAIATestcases },
    {
      taskName: "agent/webvoyager",
      dataset: "webvoyager",
      build: buildWebVoyagerTestcases,
    },
    {
      taskName: "agent/onlineMind2Web",
      dataset: "onlineMind2Web",
      build: buildOnlineMind2WebTestcases,
    },
    {
      taskName: "agent/webtailbench",
      dataset: "webtailbench",
      build: buildWebTailBenchTestcases,
    },
  ];

  let allTestcases: Testcase[] = [];

  for (const suite of datasetSuites) {
    if (!taskNamesToRun.includes(suite.taskName)) continue;

    // The placeholder is never run as a regular task, whether or not the
    // dataset filter selects it.
    taskNamesToRun = taskNamesToRun.filter((t) => t !== suite.taskName);

    // Only fan out the dataset if no dataset filter is set or it names this suite
    if (!datasetFilter || datasetFilter === suite.dataset) {
      allTestcases.push(...suite.build(currentModels));
    }
  }

  // Create a list of all remaining testcases using the determined task names and models
  const isAgentCategory =
    effectiveCategory === "agent" ||
    effectiveCategory === "external_agent_benchmarks";

  // Use agent model entries (with cua flag) for agent categories, otherwise map currentModels
  const modelEntries = isAgentCategory
    ? getAgentModelEntries()
    : currentModels.map((m) => ({ modelName: m, cua: false }));

  const regularTestcases = modelEntries.flatMap((entry) =>
    taskNamesToRun.map((testName) => ({
      input: {
        name: testName,
        modelName: entry.modelName as AvailableModel,
        ...(isAgentCategory && { isCUA: entry.cua }),
      },
      name: testName,
      tags: [
        entry.modelName,
        ...(isAgentCategory ? [entry.cua ? "cua" : "agent"] : []),
        testName,
        ...(tasksConfig.find((t) => t.name === testName)?.categories || []).map(
          (x) => `category/${x}`,
        ),
      ],
      metadata: {
        model: entry.modelName as AvailableModel,
        test: testName,
      },
      expected: true,
    })),
  );

  allTestcases = [...allTestcases, ...regularTestcases];

  // This filtering step might now be redundant if taskNamesToRun is already filtered
  if (categoryFilter) {
    allTestcases = allTestcases.filter((testcase) =>
      tasksByName[testcase.name].categories.includes(categoryFilter),
    );
  }

  // If running in BROWSERBASE environment, exclude tasks that are not applicable.
  if (env === "BROWSERBASE") {
    allTestcases = allTestcases.filter(
      (testcase) => !["peeler_simple", "stock_x"].includes(testcase.name),
    );
  }

  console.log(
    "Final test cases to run:",
    allTestcases
      .map(
        (t, i) =>
          // Guarded lookup: an eval name that is not registered in tasksByName
          // must not crash this log line; the task runner reports the missing
          // module with a clearer error later.
          `${i}: ${t.name} (${t.input.modelName}): ${tasksByName[t.name]?.categories ?? "unknown"}`,
      )
      .join("\n"),
  );

  return allTestcases;
};

/**
 * Main execution block:
 * - Determine experiment name
 * - Determine the project name (braintrustProjectName) based on CI or dev environment
 * - Run the Eval function with the given configuration:
 *    * experimentName: A label for this run
 *    * data: A function that returns the testcases to run
 *    * task: A function that executes each task, given input specifying model and task name
 *    * scores: An array of scoring functions
 *    * maxConcurrency: Limit on parallel tasks
 *    * trialCount: Number of trials (retries) per task
 * - Collect and summarize results using `generateSummary`.
 *
 * A task never rejects: any failure is converted into a `{ _success: false }`
 * result, and cleanup errors are logged instead of replacing that result.
 */
(async () => {
  /**
   * Convert an arbitrary thrown value into JSON-safe data for the task result.
   *
   * `JSON.stringify` drops the non-enumerable `name`, `message` and `stack` of
   * Error instances (yielding `{}`), returns `undefined` for `undefined`, and
   * throws on circular structures. This helper keeps whatever serializes
   * cleanly and adds the Error fields back explicitly.
   */
  const serializeError = (thrown: unknown): unknown => {
    let plain: unknown;
    try {
      const json = JSON.stringify(thrown);
      plain = json === undefined ? undefined : JSON.parse(json);
    } catch {
      // Circular references, BigInt values, etc. — fall through with nothing.
      plain = undefined;
    }

    if (thrown instanceof Error) {
      const extra = plain !== null && typeof plain === "object" ? plain : {};
      return {
        ...extra,
        name: thrown.name,
        message: thrown.message,
        stack: thrown.stack,
      };
    }

    // Non-Error values keep their serialized form; fall back to a string so
    // the result always carries a defined `error`.
    return plain ?? String(thrown);
  };

  // Generate a unique name for the experiment
  const experimentName: string = generateExperimentName({
    evalName: filterByEvalName || undefined,
    category: filterByCategory || undefined,
    environment: env,
  });

  // Determine braintrust project name to use (stagehand in CI, stagehand-dev otherwise)
  const braintrustProjectName =
    process.env.CI === "true" ? "stagehand" : "stagehand-dev";

  try {
    // Run the evaluations with the braintrust Eval function
    const evalResult = await Eval(braintrustProjectName, {
      experimentName,
      data: generateFilteredTestcases,
      // Each test is a function that runs the corresponding task module
      task: async (input: EvalInput) => {
        const logger = new EvalLogger();
        // Track V3 instance at outer scope to ensure cleanup in all cases
        let v3Input: Awaited<ReturnType<typeof initV3>> | undefined;
        let v3ToClose: Awaited<ReturnType<typeof initV3>>["v3"] | null = null;

        try {
          // Resolve the task module next to this file; compiled (.js) output is
          // preferred over the TypeScript source.
          const taskBasePath = path.join(moduleDir, "tasks", input.name);
          const taskCandidates = [`${taskBasePath}.js`, `${taskBasePath}.ts`];
          const taskModulePath = taskCandidates.find((candidate) =>
            fs.existsSync(candidate),
          );

          if (!taskModulePath) {
            throw new StagehandEvalError(
              `Failed to find task module for ${input.name}. Tried paths:\n` +
                taskCandidates.map((candidate) => `- ${candidate}`).join("\n"),
            );
          }

          const taskModule = await import(pathToFileURL(taskModulePath).href);

          // Extract the task function
          const taskName = input.name.includes("/")
            ? input.name.split("/").pop() // Get the last part of the path for nested tasks
            : input.name;

          const taskFunction = taskModule[taskName];

          if (typeof taskFunction !== "function") {
            throw new StagehandEvalError(
              `No Eval function found for task name: ${taskName} in module ${input.name}`,
            );
          }

          // Execute the task
          const isAgentTask =
            input.name.startsWith("agent/") || input.name.includes("/agent/");
          if (USE_API) {
            // Derive provider from model. Prefer explicit "provider/model"; otherwise infer for agent models
            let provider: string;
            if (input.modelName.includes("/")) {
              provider = input.modelName.split("/")[0];
            } else {
              // Fall back to agent provider inference for bare agent model names (e.g., "computer-use-preview")
              try {
                provider = AgentProvider.getAgentProvider(input.modelName);
              } catch {
                // If not an agent model, leave provider undefined to trigger helpful error below
                provider = undefined as unknown as string;
              }
            }

            const logFn = (line: LogLine): void => logger.log(line);
            const apiKey = loadApiKeyFromEnv(provider, logFn);

            if (!apiKey) {
              throw new StagehandEvalError(
                `USE_API=true but no API key found for provider “${provider}”.`,
              );
            }

            // taskInput = await initStagehand({
            //   logger,
            //   modelName: input.modelName,
            //   modelClientOptions: { apiKey: apiKey },
            // });
            // Also initialize V3 so tasks can migrate to it progressively
            v3Input = await initV3({
              logger,
              modelName: input.modelName,
              modelClientOptions: { apiKey: apiKey },
              createAgent: isAgentTask,
              isCUA: input.isCUA,
            });
            v3ToClose = v3Input.v3;
          } else {
            // Only "provider/model" names get a Braintrust-wrapped AI SDK client;
            // otherwise llmClient stays undefined and initV3 uses modelName alone.
            let llmClient: LLMClient;
            if (input.modelName.includes("/")) {
              const firstSlashIndex = input.modelName.indexOf("/");
              llmClient = new AISdkClientWrapped({
                model: getAISDKLanguageModel(
                  input.modelName.substring(0, firstSlashIndex),
                  input.modelName.substring(firstSlashIndex + 1),
                ),
              });
            }
            v3Input = await initV3({
              logger,
              llmClient,
              modelName: input.modelName,
              createAgent: isAgentTask,
              isCUA: input.isCUA,
            });
            v3ToClose = v3Input.v3;
          }
          // Pass full EvalInput to the task (data-driven params available via input.params)
          const result = await taskFunction({ ...v3Input, input });

          // Log result to console
          if (result && result._success) {
            console.log(`✅ ${input.name}: Passed`);
          } else {
            console.log(`❌ ${input.name}: Failed`);
          }

          return result;
        } catch (error) {
          // Log any errors that occur during task execution
          console.error(`❌ ${input.name}: Error - ${error}`);

          // Anything can be thrown (including null/undefined), so read
          // message/stack defensively instead of assuming an Error instance.
          const errorLike = (error ?? {}) as {
            message?: unknown;
            stack?: unknown;
          };
          const errorMessage =
            typeof errorLike.message === "string"
              ? errorLike.message
              : String(error);
          const errorStack =
            typeof errorLike.stack === "string" ? errorLike.stack : "";

          logger.error({
            message: `Error in task ${input.name}`,
            level: 0,
            auxiliary: {
              error: {
                value: errorMessage,
                type: "string",
              },
              trace: {
                value: errorStack,
                type: "string",
              },
            },
          });
          return {
            _success: false,
            error: serializeError(error),
            logs: logger.getLogs(),
          };
        } finally {
          // Always close V3 instance, regardless of success or failure.
          // This ensures proper cleanup even if the task threw an error or
          // the Browserbase session disconnected mid-execution.
          if (v3Input?.v3) {
            try {
              await v3Input.v3.close();
            } catch (closeError) {
              // Log but don't throw - we don't want close errors to mask
              // the original task result or prevent subsequent evals
              console.error(
                `Warning: Error closing V3 instance for ${input.name}:`,
                closeError,
              );
            }
          }
          try {
            await endBrowserbaseSession(v3ToClose);
          } catch (sessionError) {
            // Same policy as above: a throw from `finally` would replace the
            // task's return value, so cleanup failures are only reported.
            console.error(
              `Warning: Error ending Browserbase session for ${input.name}:`,
              sessionError,
            );
          }
          // Clear logger to free memory (logs already captured in result)
          logger.clear();
        }
      },
      // Use the scoring functions defined above
      scores: [exactMatch, errorMatch],
      maxConcurrency: MAX_CONCURRENCY,
      trialCount: TRIAL_COUNT,
    });

    // Map results to the SummaryResult format
    const summaryResults: SummaryResult[] = evalResult.results.map((result) => {
      // Tasks may return a bare boolean; normalize it to the object form.
      const output =
        typeof result.output === "boolean"
          ? { _success: result.output }
          : result.output;

      return {
        input: result.input,
        output,
        name: result.input.name,
        score: output._success ? 1 : 0,
      };
    });

    // Generate and write the summary
    await generateSummary(summaryResults, experimentName);
  } catch (error) {
    console.error("Error during evaluation run:", error);
    process.exit(1);
  }
})();


================================================
FILE: packages/evals/initV3.ts
================================================
/**
 * Initializes a V3 instance for use in evaluations without modifying
 * the existing Stagehand-based init flow. Tasks can gradually migrate
 * to consume `v3` directly.
 */

import type {
  AvailableCuaModel,
  AvailableModel,
  AgentInstance,
  ClientOptions,
  LLMClient,
  LocalBrowserLaunchOptions,
  ModelConfiguration,
  V3Options,
  AgentModelConfig,
} from "@browserbasehq/stagehand";
import {
  loadApiKeyFromEnv,
  modelToAgentProviderMap,
  V3,
} from "@browserbasehq/stagehand";
import { env } from "./env.js";
import { EvalLogger } from "./logger.js";

/**
 * Arguments accepted by `initV3`.
 *
 * `initV3` destructures only `llmClient`, `modelClientOptions`, `logger`,
 * `configOverrides`, `modelName`, `createAgent` and `isCUA`; the remaining
 * fields are accepted but not read by it.
 */
type InitV3Args = {
  // Custom LLM client; attached to the V3 options only when `isCUA` is falsy.
  llmClient?: LLMClient;
  // Client options merged with the model name into the V3 `model` config
  // (again only when `isCUA` is falsy).
  modelClientOptions?: ClientOptions;
  domSettleTimeoutMs?: number; // retained for parity; v3 handlers accept timeouts per-call
  // Logger bound to the V3 instance and returned in the result.
  logger: EvalLogger;
  createAgent?: boolean; // only create an agent for agent tasks
  // When true, a CUA agent is created and V3 itself runs on an internal model
  // chosen from the API keys present in the environment.
  isCUA?: boolean;
  configOverrides?: {
    // `headless` defaults to false when not provided.
    localBrowserLaunchOptions?: Partial<
      Pick<LocalBrowserLaunchOptions, "headless" | "args">
    >;
    // Back-compat alias for args
    chromeFlags?: string[];
    browserbaseSessionCreateParams?: V3Options["browserbaseSessionCreateParams"];
    browserbaseSessionID?: V3Options["browserbaseSessionID"];
    // Honored only when the USE_API environment variable is not "true".
    experimental?: boolean;
  };
  actTimeoutMs?: number; // retained for parity (v3 agent tools don't use this globally)
  // Model under evaluation; echoed back unchanged in the result.
  modelName: AvailableModel;
};

/**
 * Value returned by `initV3`: the initialized V3 instance plus the context
 * handed on to eval tasks.
 */
export type V3InitResult = {
  // The V3 instance created and initialized by `initV3`.
  v3: V3;
  // The same logger that was passed in.
  logger: EvalLogger;
  // `initV3` always sets the two URL fields to an empty string.
  debugUrl?: string; // not exposed by v3; placeholder for parity
  sessionUrl?: string; // not exposed by v3; placeholder for parity
  // The model name that was requested (not the internal CUA fallback model).
  modelName: AvailableModel;
  // Present only when `createAgent` was truthy.
  agent?: AgentInstance;
};

/**
 * Create and initialize a V3 instance for an eval task, optionally with an agent.
 *
 * @param llmClient - Custom LLM client; used only when `isCUA` is falsy.
 * @param modelClientOptions - Client options merged into the model config; used
 *   only when `isCUA` is falsy.
 * @param logger - Eval logger; bound to the V3 instance and returned.
 * @param configOverrides - Optional browser / Browserbase / experimental overrides.
 * @param modelName - Model under evaluation.
 * @param createAgent - When truthy, an agent is created and returned.
 * @param isCUA - When truthy, the agent is a CUA agent and V3 itself runs on an
 *   internal model picked from the API keys available in the environment.
 * @returns The initialized V3 instance, the logger, the requested model name,
 *   and the agent when one was created.
 * @throws Error when `isCUA` is set but no supported API key is present, or when
 *   the CUA model is missing from `modelToAgentProviderMap`. Errors from V3
 *   initialization or agent creation are rethrown after the V3 instance has
 *   been closed.
 */
export async function initV3({
  llmClient,
  modelClientOptions,
  logger,
  configOverrides,
  modelName,
  createAgent,
  isCUA,
}: InitV3Args): Promise<V3InitResult> {
  // If CUA, choose a safe internal AISDK model for V3 handlers based on available API keys
  let internalModel: AvailableModel = modelName;
  if (isCUA) {
    if (process.env.OPENAI_API_KEY)
      internalModel = "openai/gpt-4.1-mini" as AvailableModel;
    else if (
      process.env.GEMINI_API_KEY ||
      process.env.GOOGLE_GENERATIVE_AI_API_KEY
    )
      internalModel = "google/gemini-2.0-flash" as AvailableModel;
    else if (process.env.ANTHROPIC_API_KEY)
      internalModel = "anthropic/claude-sonnet-4-6" as AvailableModel;
    else
      throw new Error(
        "V3 init: No AISDK API key found. Set one of OPENAI_API_KEY, GEMINI_API_KEY/GOOGLE_GENERATIVE_AI_API_KEY, or ANTHROPIC_API_KEY to run CUA evals.",
      );
  }

  // Client options apply to the evaluated model only; for CUA runs the internal
  // model is passed as a bare name.
  const resolvedModelConfig: ModelConfiguration =
    !isCUA && modelClientOptions
      ? ({
          ...modelClientOptions,
          modelName: internalModel,
        } as ModelConfiguration)
      : internalModel;

  const v3Options: V3Options = {
    env,
    apiKey: process.env.BROWSERBASE_API_KEY,
    projectId: process.env.BROWSERBASE_PROJECT_ID,
    localBrowserLaunchOptions: {
      headless: configOverrides?.localBrowserLaunchOptions?.headless ?? false,
      args:
        configOverrides?.localBrowserLaunchOptions?.args ??
        configOverrides?.chromeFlags,
    },
    model: resolvedModelConfig,
    experimental:
      typeof configOverrides?.experimental === "boolean"
        ? configOverrides.experimental && process.env.USE_API !== "true" // experimental only when not using API
        : false,
    verbose: 2,
    browserbaseSessionCreateParams:
      configOverrides?.browserbaseSessionCreateParams,
    browserbaseSessionID: configOverrides?.browserbaseSessionID,
    selfHeal: true,
    disablePino: true,
    disableAPI: process.env.USE_API !== "true", // Negate: USE_API=true → disableAPI=false
    serverCache: false,
    logger: logger.log.bind(logger),
  };

  if (!isCUA && llmClient) {
    v3Options.llmClient = llmClient;
  }

  const v3 = new V3(v3Options);

  // Associate the logger with the V3 instance
  logger.init(v3);

  let agent: AgentInstance | undefined;
  try {
    await v3.init();

    if (createAgent) {
      if (isCUA) {
        const shortModelName = modelName.includes("/")
          ? modelName.split("/")[1]
          : modelName;

        const providerType = modelToAgentProviderMap[shortModelName];
        if (!providerType) {
          throw new Error(
            `CUA model "${shortModelName}" not found in modelToAgentProviderMap. ` +
              `Available: ${Object.keys(modelToAgentProviderMap).join(", ")}`,
          );
        }

        const apiKey = loadApiKeyFromEnv(providerType, logger.log.bind(logger));

        // Pass the key explicitly when one was found; otherwise hand over the
        // bare model name.
        const cuaModel:
          | AvailableCuaModel
          | AgentModelConfig<AvailableCuaModel> =
          apiKey && apiKey.length > 0
            ? {
                modelName: modelName as AvailableCuaModel,
                apiKey,
              }
            : (modelName as AvailableCuaModel);

        agent = v3.agent({
          cua: true,
          model: cuaModel,
          systemPrompt: `You are a helpful assistant that must solve the task by browsing. At the end, produce a single line: "Final Answer: <answer>" summarizing the requested result (e.g., score, list, or text). ALWAYS OPERATE WITHIN THE PAGE OPENED BY THE USER, YOU WILL ALWAYS BE PROVIDED WITH AN OPENED PAGE, WHICHEVER TASK YOU ARE ATTEMPTING TO COMPLETE CAN BE ACCOMPLISHED WITHIN THE PAGE. Simple perform the task provided, do not overthink or overdo it. The user trusts you to complete the task without any additional instructions, or answering any questions.`,
        });
      } else {
        agent = v3.agent({
          model: modelName,
          executionModel: "google/gemini-2.5-flash",
        });
      }
    }
  } catch (initError) {
    // The V3 instance is only handed to the caller through the return value, so
    // on failure nobody else can release it. Close it here (best effort) to
    // avoid leaking the browser/session, then surface the original error.
    try {
      await v3.close();
    } catch (closeError) {
      console.error(
        "Warning: Error closing V3 instance after failed initialization:",
        closeError,
      );
    }
    throw initError;
  }

  return {
    v3,
    logger,
    debugUrl: "",
    sessionUrl: "",
    modelName,
    agent,
  };
}


================================================
FILE: packages/evals/lib/AISdkClientWrapped.ts
================================================
import {
  CoreAssistantMessage,
  ModelMessage,
  CoreSystemMessage,
  CoreUserMessage,
  ImagePart,
  NoObjectGeneratedError,
  TextPart,
  ToolSet,
  Tool,
} from "ai";
import * as ai from "ai";
import { wrapAISDK } from "braintrust";
import type { LanguageModelV2 } from "@ai-sdk/provider";
import { ChatCompletion } from "openai/resources";
import {
  AvailableModel,
  CreateChatCompletionOptions,
  LLMClient,
  LogLine,
  toJsonSchema,
} from "@browserbasehq/stagehand";

// Wrap AI SDK functions with Braintrust for tracing
const { generateObject, generateText } = wrapAISDK(ai);

/**
 * LLMClient backed by an AI SDK language model. Every completion goes through
 * the Braintrust-wrapped `generateObject` / `generateText` functions above.
 */
export class AISdkClientWrapped extends LLMClient {
  public type = "aisdk" as const;
  private model: LanguageModelV2;
  private logger?: (message: LogLine) => void;

  /**
   * @param model - AI SDK language model to call; its `modelId` becomes the
   *   client's model name.
   * @param logger - Optional sink for request/response log lines.
   */
  constructor({
    model,
    logger,
  }: {
    model: LanguageModelV2;
    logger?: (message: LogLine) => void;
  }) {
    super(model.modelId as AvailableModel);
    this.model = model;
    this.logger = logger;
  }

  /** Returns the underlying AI SDK language model. */
  public getLanguageModel(): LanguageModelV2 {
    return this.model;
  }

  /** Builds `<prefix>_<timestamp>_<random base-36 suffix>` for synthetic ids. */
  private static makeId(prefix: string): string {
    // slice(2, 11) takes the same (up to) nine characters that the deprecated
    // substr(2, 9) did: everything after the leading "0.".
    return `${prefix}_${Date.now()}_${Math.random().toString(36).slice(2, 11)}`;
  }

  /** Maps AI SDK usage counters to snake_case fields, defaulting missing ones to 0. */
  private static toUsage(usage: {
    inputTokens?: number | undefined;
    outputTokens?: number | undefined;
    reasoningTokens?: number | undefined;
    cachedInputTokens?: number | undefined;
    totalTokens?: number | undefined;
  }) {
    return {
      prompt_tokens: usage.inputTokens ?? 0,
      completion_tokens: usage.outputTokens ?? 0,
      reasoning_tokens: usage.reasoningTokens ?? 0,
      cached_input_tokens: usage.cachedInputTokens ?? 0,
      total_tokens: usage.totalTokens ?? 0,
    };
  }

  /**
   * Run one completion.
   *
   * When `options.response_model` is set, a structured object is generated
   * against its schema and returned as `{ data, usage }`. Otherwise a text
   * completion (optionally with tools) is generated and returned in a
   * chat-completion-shaped object.
   *
   * @param options - Messages, optional response schema, tools, tool choice,
   *   temperature and request id.
   * @returns The result cast to `T`.
   * @throws Rethrows any error from the AI SDK call; a `NoObjectGeneratedError`
   *   is logged with its details first.
   */
  async createChatCompletion<T = ChatCompletion>({
    options,
  }: CreateChatCompletionOptions): Promise<T> {
    // Log the request with image payloads replaced by a placeholder.
    this.logger?.({
      category: "aisdk",
      message: "creating chat completion",
      level: 2,
      auxiliary: {
        options: {
          value: JSON.stringify({
            ...options,
            image: undefined,
            messages: options.messages.map((msg) => ({
              ...msg,
              content: Array.isArray(msg.content)
                ? msg.content.map((c) =>
                    "image_url" in c
                      ? { ...c, image_url: { url: "[IMAGE_REDACTED]" } }
                      : c,
                  )
                : msg.content,
            })),
          }),
          type: "object",
        },
        modelName: {
          value: this.model.modelId,
          type: "string",
        },
      },
    });

    // Convert the incoming messages into AI SDK messages.
    const formattedMessages: ModelMessage[] = options.messages.map(
      (message) => {
        if (Array.isArray(message.content)) {
          if (message.role === "system") {
            // System content becomes one string: text parts joined by
            // newlines, non-text parts contributing an empty string.
            const systemMessage: CoreSystemMessage = {
              role: "system",
              content: message.content
                .map((c) => ("text" in c ? c.text : ""))
                .join("\n"),
            };
            return systemMessage;
          }

          const contentParts = message.content.map((content) => {
            if ("image_url" in content) {
              const imageContent: ImagePart = {
                type: "image",
                image: content.image_url.url,
              };
              return imageContent;
            } else {
              const textContent: TextPart = {
                type: "text",
                text: content.text,
              };
              return textContent;
            }
          });

          if (message.role === "user") {
            const userMessage: CoreUserMessage = {
              role: "user",
              content: contentParts,
            };
            return userMessage;
          } else {
            // Any other role is sent as an assistant message with text parts
            // only; images are replaced by an "[Image]" marker.
            const textOnlyParts = contentParts.map((part) => ({
              type: "text" as const,
              text: part.type === "image" ? "[Image]" : part.text,
            }));
            const assistantMessage: CoreAssistantMessage = {
              role: "assistant",
              content: textOnlyParts,
            };
            return assistantMessage;
          }
        }

        return {
          role: message.role,
          content: message.content,
        };
      },
    );

    let objectResponse: Awaited<ReturnType<typeof generateObject>>;
    // Model-family switches, all derived from substrings of the model id.
    const isGPT5 = this.model.modelId.includes("gpt-5");
    const isCodex = this.model.modelId.includes("codex");
    const usesLowReasoningEffort =
      (this.model.modelId.includes("gpt-5.1") ||
        this.model.modelId.includes("gpt-5.2")) &&
      !isCodex;
    const isDeepSeek = this.model.modelId.includes("deepseek");
    // Kimi models only support temperature=1
    const isKimi = this.model.modelId.includes("kimi");
    const temperature = isKimi ? 1 : options.temperature;
    if (options.response_model) {
      if (isDeepSeek || isKimi) {
        // For these models the JSON schema is additionally spelled out in a
        // trailing user message.
        const parsedSchema = JSON.stringify(
          toJsonSchema(options.response_model.schema),
        );

        formattedMessages.push({
          role: "user",
          content: `Respond in this zod schema format:\n${parsedSchema}\n
You must respond in JSON format. respond WITH JSON. Do not include any other text, formatting or markdown in your output. Do not include \`\`\` or \`\`\`json in your response. Only the JSON object itself.`,
        });
      }

      try {
        objectResponse = await generateObject({
          model: this.model,
          messages: formattedMessages,
          schema: options.response_model.schema,
          temperature,
          providerOptions: isGPT5
            ? {
                openai: {
                  textVerbosity: isCodex ? "medium" : "low", // codex models only support 'medium'
                  reasoningEffort: isCodex
                    ? "medium"
                    : usesLowReasoningEffort
                      ? "low"
                      : "minimal",
                },
              }
            : undefined,
        });
      } catch (err) {
        // Log the details of a failed object generation; every error is
        // rethrown to the caller either way.
        if (NoObjectGeneratedError.isInstance(err)) {
          this.logger?.({
            category: "AISDK error",
            message: err.message,
            level: 0,
            auxiliary: {
              cause: {
                value: JSON.stringify(err.cause ?? {}),
                type: "object",
              },
              text: {
                value: err.text ?? "",
                type: "string",
              },
              response: {
                value: JSON.stringify(err.response ?? {}),
                type: "object",
              },
              usage: {
                value: JSON.stringify(err.usage ?? {}),
                type: "object",
              },
              finishReason: {
                value: err.finishReason ?? "unknown",
                type: "string",
              },
              requestId: {
                value: options.requestId,
                type: "string",
              },
            },
          });
        }
        throw err;
      }

      const result = {
        data: objectResponse.object,
        usage: AISdkClientWrapped.toUsage(objectResponse.usage),
      } as T;

      this.logger?.({
        category: "aisdk",
        message: "response",
        level: 1,
        auxiliary: {
          response: {
            value: JSON.stringify({
              object: objectResponse.object,
              usage: objectResponse.usage,
              finishReason: objectResponse.finishReason,
              // Omit request and response properties that might contain images
            }),
            type: "object",
          },
          requestId: {
            value: options.requestId,
            type: "string",
          },
        },
      });

      return result;
    }

    // Text path: expose the caller's tools (description + input schema only).
    const tools: ToolSet = {};
    if (options.tools && options.tools.length > 0) {
      for (const tool of options.tools) {
        tools[tool.name] = {
          description: tool.description,
          inputSchema: tool.parameters,
        } as Tool;
      }
    }

    const hasTools = Object.keys(tools).length > 0;

    const textResponse = await generateText({
      model: this.model,
      messages: formattedMessages,
      tools: hasTools ? tools : undefined,
      // Only "required" and "none" are forwarded; anything else means "auto".
      toolChoice: hasTools
        ? options.tool_choice === "required"
          ? "required"
          : options.tool_choice === "none"
            ? "none"
            : "auto"
        : undefined,
      temperature,
    });

    // Transform AI SDK response to match LLMResponse format expected by operator handler
    const transformedToolCalls = (textResponse.toolCalls || []).map(
      (toolCall) => ({
        id: toolCall.toolCallId || AISdkClientWrapped.makeId("call"),
        type: "function",
        function: {
          name: toolCall.toolName,
          arguments: JSON.stringify(toolCall.input),
        },
      }),
    );

    const result = {
      id: AISdkClientWrapped.makeId("chatcmpl"),
      object: "chat.completion",
      created: Math.floor(Date.now() / 1000),
      model: this.model.modelId,
      choices: [
        {
          index: 0,
          message: {
            role: "assistant",
            content: textResponse.text || null,
            tool_calls: transformedToolCalls,
          },
          finish_reason: textResponse.finishReason || "stop",
        },
      ],
      usage: AISdkClientWrapped.toUsage(textResponse.usage),
    } as T;

    this.logger?.({
      category: "aisdk",
      message: "response",
      level: 2,
      auxiliary: {
        response: {
          value: JSON.stringify({
            text: textResponse.text,
            usage: textResponse.usage,
            finishReason: textResponse.finishReason,
            // Omit request and response properties that might contain images
          }),
          type: "object",
        },
        requestId: {
          value: options.requestId,
          type: "string",
        },
      },
    });

    return result;
  }
}


================================================
FILE: packages/evals/llm_clients/hn_aisdk.ts
================================================
// import { Stagehand } from "@browserbasehq/stagehand";
// import { EvalFunction } from "@/types/evals";
// import { z } from "zod";
//
// export const hn_aisdk: EvalFunction = async ({
//   debugUrl,
//   sessionUrl,
//   stagehandConfig,
//   logger,
// }) => {
//   const stagehand = new Stagehand({
//     ...stagehandConfig,
//     modelName: "openai/gpt-4o-mini",
//   });
//   await stagehand.init();
//   await stagehand.page.goto(
//     "https://browserbase.github.io/stagehand-eval-sites/sites/hackernews/",
//   );
//
//   let { story } = await stagehand.page.extract({
//     instruction: "extract the title of the top story on the page",
//     schema: z.object({
//       story: z.string().describe("the title of the top story on the page"),
//     }),
//   });
//   // remove the (url) part of the story title
//   story = story.split(" (")[0];
//
//   const expectedStoryElement = await stagehand.page.$(
//     "xpath=/html/body/center/table/tbody/tr[3]/td/table/tbody/tr[1]/td[3]/span/a",
//   );
//   // remove the (url) part of the story title
//   const expectedStory = (await expectedStoryElement?.textContent())?.split(
//     " (",
//   )?.[0];
//
//   if (!expectedStory) {
//     logger.error({
//       message: "Could not find expected story element",
//       level: 0,
//     });
//     return {
//       _success: false,
//       error: "Could not find expected story element",
//       debugUrl,
//       sessionUrl,
//       logs: logger.getLogs(),
//     };
//   }
//
//   if (story !== expectedStory) {
//     logger.error({
//       message: "Extracted story does not match expected story",
//       level: 0,
//       auxiliary: {
//         expected: {
//           value: expectedStory,
//           type: "string",
//         },
//         actual: {
//           value: story,
//           type: "string",
//         },
//       },
//     });
//     return {
//       _success: false,
//       error: "Extracted story does not match expected story",
//       expectedStory,
//       actualStory: story,
//       debugUrl,
//       sessionUrl,
//       logs: logger.getLogs(),
//     };
//   }
//
//   await stagehand.page.act("Click on the 'new' tab");
//
//   if (stagehand.page.url() !== "https://news.ycombinator.com/newest") {
//     logger.error({
//       message: "Page did not navigate to the 'new' tab",
//       level: 0,
//       auxiliary: {
//         expected: {
//           value: "https://news.ycombinator.com/newest",
//           type: "string",
//         },
//         actual: {
//           value: stagehand.page.url(),
//           type: "string",
//         },
//       },
//     });
//     return {
//       _success: false,
//       error: "Page did not navigate to the 'new' tab",
//       expectedUrl: "https://news.ycombinator.com/newest",
//       actualUrl: stagehand.page.url(),
//       debugUrl,
//       sessionUrl,
//       logs: logger.getLogs(),
//     };
//   }
//
//   await stagehand.close();
//
//   return {
//     _success: true,
//     expectedStory,
//     actualStory: story,
//     debugUrl,
//     sessionUrl,
//     logs: logger.getLogs(),
//   };
// };


================================================
FILE: packages/evals/llm_clients/hn_customOpenAI.ts
================================================
// import { EvalFunction } from "@/types/evals";
// import { z } from "zod";
// import { CustomOpenAIClient } from "@/examples/external_clients/customOpenAI";
// import OpenAI from "openai";
// import { Stagehand } from "@browserbasehq/stagehand";
//
// export const hn_customOpenAI: EvalFunction = async ({
//   logger,
//   stagehandConfig,
//   debugUrl,
//   sessionUrl,
// }) => {
//   const stagehand = new Stagehand({
//     ...stagehandConfig,
//     llmClient: new CustomOpenAIClient({
//       modelName: "gpt-4o-mini",
//       client: new OpenAI({
//         apiKey: process.env.OPENAI_API_KEY,
//       }),
//     }),
//   });
//
//   await stagehand.init();
//
//   await stagehand.page.goto(
//     "https://browserbase.github.io/stagehand-eval-sites/sites/hackernews/",
//   );
//
//   let { story } = await stagehand.page.extract({
//     instruction: "extract the title of the top story on the page",
//     schema: z.object({
//       story: z.string().describe("the title of the top story on the page"),
//     }),
//   });
//   // remove the (url) part of the story title
//   story = story.split(" (")[0];
//
//   const expectedStoryElement = await stagehand.page.$(
//     "xpath=/html/body/center/table/tbody/tr[3]/td/table/tbody/tr[1]/td[3]/span/a",
//   );
//   // remove the (url) part of the story title
//   const expectedStory = (await expectedStoryElement?.textContent())?.split(
//     " (",
//   )?.[0];
//
//   if (!expectedStory) {
//     logger.error({
//       message: "Could not find expected story element",
//       level: 0,
//     });
//     return {
//       _success: false,
//       error: "Could not find expected story element",
//       debugUrl,
//       sessionUrl,
//       logs: logger.getLogs(),
//     };
//   }
//
//   if (story !== expectedStory) {
//     logger.error({
//       message: "Extracted story does not match expected story",
//       level: 0,
//       auxiliary: {
//         expected: {
//           value: expectedStory,
//           type: "string",
//         },
//         actual: {
//           value: story,
//           type: "string",
//         },
//       },
//     });
//     return {
//       _success: false,
//       error: "Extracted story does not match expected story",
//       expectedStory,
//       actualStory: story,
//       debugUrl,
//       sessionUrl,
//       logs: logger.getLogs(),
//     };
//   }
//
//   await stagehand.page.act("Click on the 'new' tab");
//
//   if (stagehand.page.url() !== "https://news.ycombinator.com/newest") {
//     logger.error({
//       message: "Page did not navigate to the 'new' tab",
//       level: 0,
//       auxiliary: {
//         expected: {
//           value: "https://news.ycombinator.com/newest",
//           type: "string",
//         },
//         actual: {
//           value: stagehand.page.url(),
//           type: "string",
//         },
//       },
//     });
//     return {
//       _success: false,
//       error: "Page did not navigate to the 'new' tab",
//       expectedUrl: "https://news.ycombinator.com/newest",
//       actualUrl: stagehand.page.url(),
//       debugUrl,
//       sessionUrl,
//       logs: logger.getLogs(),
//     };
//   }
//
//   await stagehand.close();
//
//   return {
//     _success: true,
//     expectedStory,
//     actualStory: story,
//     debugUrl,
//     sessionUrl,
//     logs: logger.getLogs(),
//   };
// };


================================================
FILE: packages/evals/llm_clients/hn_langchain.ts
================================================
// import { EvalFunction } from "@/types/evals";
// import { z } from "zod";
// import { LangchainClient } from "@/examples/external_clients/langchain";
// import { ChatOpenAI } from "@langchain/openai";
// import { Stagehand } from "@browserbasehq/stagehand";
//
// export const hn_langchain: EvalFunction = async ({
//   logger,
//   stagehandConfig,
//   debugUrl,
//   sessionUrl,
// }) => {
//   const stagehand = new Stagehand({
//     ...stagehandConfig,
//     llmClient: new LangchainClient(
//       new ChatOpenAI({
//         model: "gpt-4o-mini",
//       }),
//     ),
//   });
//   await stagehand.init();
//
//   await stagehand.page.goto(
//     "https://browserbase.github.io/stagehand-eval-sites/sites/hackernews/",
//   );
//
//   let { story } = await stagehand.page.extract({
//     instruction: "extract the title of the top story on the page",
//     schema: z.object({
//       story: z.string().describe("the title of the top story on the page"),
//     }),
//   });
//   // remove the (url) part of the story title
//   story = story.split(" (")[0];
//
//   const expectedStoryElement = await stagehand.page.$(
//     "xpath=/html/body/center/table/tbody/tr[3]/td/table/tbody/tr[1]/td[3]/span/a",
//   );
//   // remove the (url) part of the story title
//   const expectedStory = (await expectedStoryElement?.textContent())?.split(
//     " (",
//   )?.[0];
//
//   if (!expectedStory) {
//     logger.error({
//       message: "Could not find expected story element",
//       level: 0,
//     });
//     return {
//       _success: false,
//       error: "Could not find expected story element",
//       debugUrl,
//       sessionUrl,
//       logs: logger.getLogs(),
//     };
//   }
//
//   if (story !== expectedStory) {
//     logger.error({
//       message: "Extracted story does not match expected story",
//       level: 0,
//       auxiliary: {
//         expected: {
//           value: expectedStory,
//           type: "string",
//         },
//         actual: {
//           value: story,
//           type: "string",
//         },
//       },
//     });
//     return {
//       _success: false,
//       error: "Extracted story does not match expected story",
//       expectedStory,
//       actualStory: story,
//       debugUrl,
//       sessionUrl,
//       logs: logger.getLogs(),
//     };
//   }
//
//   await stagehand.page.act("Click on the 'new' tab");
//
//   if (stagehand.page.url() !== "https://news.ycombinator.com/newest") {
//     logger.error({
//       message: "Page did not navigate to the 'new' tab",
//       level: 0,
//       auxiliary: {
//         expected: {
//           value: "https://news.ycombinator.com/newest",
//           type: "string",
//         },
//         actual: {
//           value: stagehand.page.url(),
//           type: "string",
//         },
//       },
//     });
//     return {
//       _success: false,
//       error: "Page did not navigate to the 'new' tab",
//       expectedUrl: "https://news.ycombinator.com/newest",
//       actualUrl: stagehand.page.url(),
//       debugUrl,
//       sessionUrl,
//       logs: logger.getLogs(),
//     };
//   }
//
//   await stagehand.close();
//
//   return {
//     _success: true,
//     expectedStory,
//     actualStory: story,
//     debugUrl,
//     sessionUrl,
//     logs: logger.getLogs(),
//   };
// };


================================================
FILE: packages/evals/logger.ts
================================================
/**
 * This file defines the `EvalLogger` class, which is used to capture and manage
 * log lines during the evaluation process. The logger supports different log
 * levels (info, error, warn), stores logs in memory for later retrieval, and
 * also prints them to the console for immediate feedback.
 *
 * The `parseLogLine` function helps transform raw `LogLine` objects into a more
 * structured format (`LogLineEval`), making auxiliary data easier to understand
 * and analyze. By associating an `EvalLogger` instance with a `Stagehand` object,
 * all logs emitted during the evaluation process can be captured, persisted, and
 * reviewed after the tasks complete.
 */
import { logLineToString } from "./utils.js";
import { LogLineEval } from "./types/evals.js";
import { LogLine } from "@browserbasehq/stagehand";
import type { V3 } from "@browserbasehq/stagehand";

/**
 * parseLogLine:
 * Converts a raw `LogLine` into a `LogLineEval` by decoding its `auxiliary`
 * entries into plain values stored under `parsedAuxiliary`.
 *
 * - Entries whose `type` is "object" are JSON-decoded; every other entry keeps
 *   its raw `value`.
 * - An entry that cannot be decoded is reported via `console.warn` and stored raw.
 * - The returned line has `auxiliary` set to `undefined`.
 * - If anything unexpected throws, the failure is printed and the original
 *   line is returned unchanged.
 */
function parseLogLine(logLine: LogLine): LogLineEval {
  try {
    const rawAuxiliary = logLine.auxiliary;
    let parsedAuxiliary: Record<string, unknown> | undefined;

    if (rawAuxiliary) {
      const decoded: Record<string, unknown> = {};

      Object.entries(rawAuxiliary).forEach(([name, field]) => {
        try {
          decoded[name] =
            field.type === "object" ? JSON.parse(field.value) : field.value;
        } catch (parseError) {
          console.warn(`Failed to parse auxiliary entry ${name}:`, parseError);
          // Decoding failed: keep the undecoded value so no data is lost.
          decoded[name] = field.value;
        }
      });

      parsedAuxiliary = decoded;
    }

    return { ...logLine, auxiliary: undefined, parsedAuxiliary } as LogLineEval;
  } catch (e) {
    console.log("Error parsing log line", logLine);
    console.error(e);
    return logLine;
  }
}

/**
 * EvalLogger:
 * Collects log lines emitted while an eval runs.
 *
 * Every line is printed to the console right away (via `logLineToString`) and
 * a parsed copy is kept in memory so it can be returned with the eval output.
 * A Stagehand instance may optionally be attached through `init`.
 */
export class EvalLogger {
  private logs: LogLineEval[] = [];
  stagehand?: V3;

  /**
   * init:
   * Attaches (or detaches, when called without an argument) the Stagehand
   * instance associated with this logger.
   */
  init(stagehand?: V3) {
    this.stagehand = stagehand;
  }

  /**
   * log:
   * Prints the line with `console.log` and stores its parsed form.
   */
  log(logLine: LogLine) {
    console.log(logLineToString(logLine));
    this.remember(logLine);
  }

  /**
   * error:
   * Prints the line with `console.error` and stores its parsed form.
   */
  error(logLine: LogLine) {
    console.error(logLineToString(logLine));
    this.remember(logLine);
  }

  /**
   * warn:
   * Prints the line with `console.warn` and stores its parsed form.
   */
  warn(logLine: LogLine) {
    console.warn(logLineToString(logLine));
    this.remember(logLine);
  }

  /**
   * getLogs:
   * Returns the stored log lines (an empty array if none are available).
   */
  getLogs(): LogLineEval[] {
    return this.logs ? this.logs : [];
  }

  /**
   * clear:
   * Drops every stored log line and detaches the Stagehand instance.
   */
  clear(): void {
    this.stagehand = undefined;
    this.logs = [];
  }

  /** Appends the parsed form of `logLine` to the in-memory buffer. */
  private remember(logLine: LogLine): void {
    this.logs.push(parseLogLine(logLine));
  }
}


================================================
FILE: packages/evals/package.json
================================================
{
  "name": "@browserbasehq/stagehand-evals",
  "version": "1.1.9",
  "private": true,
  "description": "Evaluation suite for Stagehand",
  "type": "module",
  "main": "./",
  "bin": {
    "evals": "./dist/cli/cli.js"
  },
  "scripts": {
    "typecheck": "pnpm -w --dir ../.. exec tsc -p packages/evals/tsconfig.json --noEmit",
    "build": "pnpm --filter @browserbasehq/stagehand-evals run --parallel \"/^build:(esm|cli)$/\"",
    "build:esm": "tsx scripts/build-esm.ts",
    "build:cli": "tsx scripts/build-cli.ts",
    "test": "pnpm -w --dir ../.. exec turbo run test:evals --filter=@browserbasehq/stagehand-evals --",
    "test:evals": "tsx scripts/test-evals.ts --cli packages/evals/dist/cli/cli.js",
    "lint": "pnpm -w --dir ../.. exec prettier --check packages/evals && pnpm -w --dir ../.. exec eslint packages/evals && pnpm run typecheck",
    "format": "prettier --write ."
  },
  "dependencies": {
    "@ai-sdk/provider": "^2.0.0",
    "@browserbasehq/stagehand": "workspace:*",
    "ai": "^5.0.133",
    "dotenv": "^17.3.1",
    "openai": "^4.87.1",
    "sharp": "^0.34.5",
    "zod": "^4.2.1"
  },
  "devDependencies": {
    "braintrust": "^0.4.7",
    "chalk": "^5.4.1",
    "string-comparison": "^1.3.0",
    "tsx": "*"
  }
}


================================================
FILE: packages/evals/run.ts
================================================
import { spawnSync } from "node:child_process";
import process from "node:process";
import { getCurrentDirPath } from "./runtimePaths.js";

// Everything after the script name is forwarded verbatim to the eval entry point.
const args: readonly string[] = process.argv.slice(2);
const moduleDir = getCurrentDirPath();

// `h` / `help` (and `man` below), optionally prefixed with `-` or `--`, case-insensitive.
const wantsHelp: boolean = args.some((a) => /^(?:--?)?(?:h|help)$/i.test(a));
const wantsMan: boolean = args.some((a) => /^(?:--?)?man$/i.test(a));

// Skip build if just showing help
if (!wantsHelp && !wantsMan) {
  const build = spawnSync("pnpm", ["run", "build"], {
    stdio: "inherit",
    // NOTE(review): this is resolved against the process working directory,
    // not this file's directory — confirm callers always launch from packages/evals.
    cwd: "../..",
  });
  if (build.error) {
    console.error(`Failed to start the build: ${build.error.message}`);
  }
  if (build.status !== 0) process.exit(build.status ?? 1);
}

const run = spawnSync("tsx", ["index.eval.ts", ...args], {
  stdio: "inherit",
  cwd: moduleDir,
});
if (run.error) {
  console.error(`Failed to start tsx: ${run.error.message}`);
}
// A null status means the child never exited normally (it could not be spawned
// or was terminated by a signal), so it must be reported as a failure, not as 0.
process.exit(run.status ?? 1);


================================================
FILE: packages/evals/runtimePaths.ts
================================================
/**
 * Keep this file in sync with:
 * - /packages/core/lib/v3/runtimePaths.ts
 * - /packages/server-v3/scripts/runtimePaths.ts
 * - /packages/server-v4/scripts/runtimePaths.ts
 * - /packages/evals/runtimePaths.ts
 * - /packages/docs/scripts/runtimePaths.js
 */
import path from "node:path";
import { fileURLToPath } from "node:url";
import { createRequire } from "node:module";

// Path fragment identifying files that belong to this package; used below to
// prefer caller frames from this package and to locate the repo root.
const PACKAGE_SEGMENT = "/packages/evals/";
// Raw frame "file names" that readCallsitePath treats as having no usable path.
const EVAL_FRAMES = new Set(["[eval]", "[eval]-wrapper"]);
// Function/method names that isInternalCallsite skips when searching the stack
// for the caller. These must match the helper names declared in this file.
const INTERNAL_FRAME_NAMES = new Set([
  "readCallsites",
  "readCallsitePath",
  "resolveCallerFilePath",
  "getCurrentFilePath",
  "getCurrentDirPath",
  "getRepoRootDir",
  "getPackageRootDir",
  "createRequireFromCaller",
  "isMainModule",
]);

/**
 * Turns a file path or `file://` URL into an absolute path that uses forward
 * slashes only.
 */
const normalizePath = (value: string): string => {
  let fsPath = value;
  if (value.startsWith("file://")) {
    fsPath = fileURLToPath(value);
  }
  const absolute = path.resolve(fsPath);
  return absolute.split("\\").join("/");
};

/**
 * Captures the current call stack as structured `CallSite` objects.
 *
 * Temporarily swaps `Error.prepareStackTrace` for a hook that hands back the
 * raw callsite array, reads `.stack` from a fresh `Error`, and then restores
 * the previous hook. Returns an empty array when no stack is available.
 */
const readCallsites = (): NodeJS.CallSite[] => {
  const previousPrepare = Error.prepareStackTrace;
  try {
    // Return the structured frames themselves instead of a formatted string.
    Error.prepareStackTrace = (_, stack) => stack;
    return (
      // `.stack` must be read while the override is still installed.
      (new Error().stack as unknown as NodeJS.CallSite[] | undefined) ?? []
    );
  } finally {
    // Always put back whatever hook (possibly undefined) was there before.
    Error.prepareStackTrace = previousPrepare;
  }
};

/** `CallSite` widened with an optional accessor that not every typing declares. */
type CallSiteWithScriptName = NodeJS.CallSite & {
  getScriptNameOrSourceURL?: () => string | null;
};

/**
 * Extracts a normalized file path from a stack frame.
 *
 * Prefers `getFileName()` and falls back to `getScriptNameOrSourceURL()` when
 * that accessor exists. Returns `null` for frames with no location, for
 * `node:` built-ins, and for the eval pseudo-frames listed in `EVAL_FRAMES`.
 */
const readCallsitePath = (callsite: NodeJS.CallSite): string | null => {
  const location =
    callsite.getFileName() ??
    (callsite as CallSiteWithScriptName).getScriptNameOrSourceURL?.();

  return !location ||
    location.startsWith("node:") ||
    EVAL_FRAMES.has(location)
    ? null
    : normalizePath(location);
};

/**
 * Tells whether a stack frame belongs to one of this module's own helpers
 * (the names listed in `INTERNAL_FRAME_NAMES`).
 *
 * The function name is checked first, then the method name, and finally the
 * frame's string rendering is scanned for `<name> (`.
 */
const isInternalCallsite = (callsite: NodeJS.CallSite): boolean => {
  const isInternalName = (name: string | null | undefined): boolean =>
    name != null && INTERNAL_FRAME_NAMES.has(name);

  if (isInternalName(callsite.getFunctionName())) return true;
  if (isInternalName(callsite.getMethodName())) return true;

  // Matching on `<name> (` also covers qualified renderings such as
  // `Object.<name> (`, because the qualified form contains the same substring.
  const rendered = callsite.toString();
  return [...INTERNAL_FRAME_NAMES].some((frameName) =>
    rendered.includes(`${frameName} (`),
  );
};

/**
 * Finds the file of the code that called into this module.
 *
 * Walks the stack from the innermost frame outwards, ignoring frames without
 * a usable path and frames of this module's own helpers. The first frame whose
 * path contains `PACKAGE_SEGMENT` wins; if there is none, the first remaining
 * frame is used instead.
 *
 * @throws Error when no frame qualifies.
 */
const resolveCallerFilePath = (): string => {
  let firstOutsidePackage: string | undefined;

  for (const frame of readCallsites()) {
    const framePath = readCallsitePath(frame);
    if (!framePath || isInternalCallsite(frame)) continue;

    // A frame inside the package always beats any fallback candidate.
    if (framePath.includes(PACKAGE_SEGMENT)) return framePath;

    if (firstOutsidePackage === undefined) {
      firstOutsidePackage = framePath;
    }
  }

  if (firstOutsidePackage) return firstOutsidePackage;

  throw new Error("Unable to resolve caller file path.");
};

/**
 * Returns the normalized path of the file that called this function, as
 * determined by inspecting the call stack.
 */
export const getCurrentFilePath = (): string => resolveCallerFilePath();

/** Returns the directory containing the calling file. */
export const getCurrentDirPath = (): string =>
  path.dirname(getCurrentFilePath());

/**
 * Returns the repository root: the part of the calling file's path that
 * precedes the last occurrence of `PACKAGE_SEGMENT`.
 *
 * @throws Error when the calling file's path does not contain `PACKAGE_SEGMENT`.
 */
export const getRepoRootDir = (): string => {
  const callerPath = getCurrentFilePath();
  const segmentStart = callerPath.lastIndexOf(PACKAGE_SEGMENT);
  if (segmentStart !== -1) {
    return callerPath.slice(0, segmentStart);
  }
  throw new Error(
    `Unable to determine repo root from ${callerPath} (missing ${PACKAGE_SEGMENT}).`,
  );
};

/**
 * Returns this package's root directory: the repo root followed by
 * `PACKAGE_SEGMENT` without its trailing slash.
 */
export const getPackageRootDir = (): string =>
  `${getRepoRootDir()}${PACKAGE_SEGMENT.slice(0, -1)}`;

/** Creates a `require` function anchored at the calling file's path. */
export const createRequireFromCaller = () =>
  createRequire(getCurrentFilePath());

/**
 * Reports whether the calling file is the script the process was started
 * with, by comparing the normalized `process.argv[1]` to the caller's path.
 * Returns `false` when there is no entry script argument.
 */
export const isMainModule = (): boolean => {
  const entryScript = process.argv.at(1);
  if (!entryScript) return false;
  return normalizePath(entryScript) === getCurrentFilePath();
};


================================================
FILE: packages/evals/scoring.ts
================================================
/**
 * This file implements scoring functions needed by braintrust.
 */

import { EvalArgs, EvalInput, EvalResult } from "./types/evals.js";

/**
 * Renders an arbitrary task result as a short string suitable for one log line.
 *
 * - Strings are used as-is.
 * - A top-level `Error` is shown as its stack, or `name: message` without one.
 * - Anything else is JSON-encoded, with nested `Error` values expanded to
 *   `{ name, message, stack }`; values JSON cannot encode fall back to `String()`.
 *
 * Results longer than 160 characters are cut to 157 characters plus "...".
 */
function formatTaskOutput(output: unknown): string {
  const MAX_LENGTH = 160;
  const ELLIPSIS = "...";

  // JSON replacer: Error instances otherwise serialize to "{}".
  const expandErrors = (_key: string, current: unknown): unknown =>
    current instanceof Error
      ? { name: current.name, message: current.message, stack: current.stack }
      : current;

  const render = (): string => {
    if (typeof output === "string") return output;
    if (output instanceof Error) {
      return output.stack ?? `${output.name}: ${output.message}`;
    }

    let json: string | undefined;
    try {
      json = JSON.stringify(output, expandErrors);
    } catch {
      json = undefined;
    }
    // JSON.stringify yields undefined for values such as `undefined` or functions.
    return json === undefined ? String(output) : json;
  };

  const text = render();
  return text.length > MAX_LENGTH
    ? `${text.slice(0, MAX_LENGTH - ELLIPSIS.length)}${ELLIPSIS}`
    : text;
}

/**
 * Scoring function: exactMatch
 * Scores 1 when the task output matches the expectation and 0 otherwise.
 *
 * - When `expected` is missing or `true`, the output counts as a match if it
 *   is the boolean `true`, or a value whose `_success` property is truthy.
 *   A `null`/`undefined` output (e.g. a task that produced nothing) scores 0
 *   instead of throwing.
 * - For any other `expected` value, the output must be strictly equal (`===`)
 *   to it.
 *
 * The task name and a shortened rendering of the output are logged first.
 *
 * @param args - Eval arguments carrying `input`, `output` and optional `expected`.
 * @returns A result named "Exact match" with a score of 0 or 1.
 */
export function exactMatch(
  args: EvalArgs<EvalInput, boolean | { _success: boolean }, unknown>,
): EvalResult {
  console.log(
    `Task "${args.input.name}" returned: ${formatTaskOutput(args.output)}`,
  );

  const expected = args.expected ?? true;
  if (expected === true) {
    // If we expect a success (true), then we check the output's _success flag.
    const output: unknown = args.output;
    const succeeded =
      typeof output === "boolean"
        ? output
        : // Guard against null/undefined before touching `_success`.
          output != null &&
          Boolean((output as { _success?: unknown })._success);

    return {
      name: "Exact match",
      score: succeeded ? 1 : 0,
    };
  }

  // If expected is not true, just directly compare the output to expected.
  return {
    name: "Exact match",
    score: args.output === expected ? 1 : 0,
  };
}

/**
 * Scoring function: errorMatch
 * Determines if an error occurred in the task.
 * Scores 1 when the output is a non-null object whose `error` property is
 * defined, otherwise 0.
 *
 * A `null` output scores 0: `typeof null` is "object", so it has to be
 * excluded explicitly before `error` is read.
 *
 * The task name and a shortened rendering of the output are logged first.
 *
 * @param args - Eval arguments carrying `input` and `output`.
 * @returns A result named "Error rate" with a score of 0 or 1.
 */
export function errorMatch(
  args: EvalArgs<
    EvalInput,
    boolean | { _success: boolean; error?: unknown },
    unknown
  >,
): EvalResult {
  console.log(
    `Task "${args.input.name}" returned: ${formatTaskOutput(args.output)}`,
  );

  const output: unknown = args.output;
  const hasError =
    typeof output === "object" &&
    output !== null &&
    (output as { error?: unknown }).error !== undefined;

  return {
    name: "Error rate",
    score: hasError ? 1 : 0,
  };
}


================================================
FILE: packages/evals/scripts/build-cli.ts
================================================
/**
 * Build the evals CLI (packages/evals/dist/cli/cli.js + config), including a node shebang.
 *
 * Prereqs: pnpm install.
 * Args: none.
 * Env: none.
 * Example: pnpm run build:cli
 */
import fs from "node:fs";
import { spawnSync } from "node:child_process";
import { getRepoRootDir } from "../runtimePaths.js";

const repoRoot = getRepoRootDir();
const evalsDir = `${repoRoot}/packages/evals`;
const cliOutDir = `${evalsDir}/dist/cli`;
const cliOutFile = `${cliOutDir}/cli.js`;

/** Runs `pnpm <args>` from the repo root; exits the process if it fails. */
const run = (args: string[]) => {
  const { status } = spawnSync("pnpm", args, {
    stdio: "inherit",
    cwd: repoRoot,
  });
  if (status === 0) return;
  process.exit(status ?? 1);
};

fs.mkdirSync(cliOutDir, { recursive: true });

// Bundle the CLI entry point into a single executable ESM file.
run([
  "exec",
  "esbuild",
  "packages/evals/cli.ts",
  "--bundle",
  "--platform=node",
  "--format=esm",
  `--outfile=${cliOutFile}`,
  "--sourcemap",
  "--packages=external",
  "--banner:js=#!/usr/bin/env node",
  "--log-level=warning",
]);

/* ── merge config: source wins for everything except user-edited `defaults` ── */
const sourceConfig = JSON.parse(
  fs.readFileSync(`${evalsDir}/evals.config.json`, "utf-8"),
);
const distConfigPath = `${cliOutDir}/evals.config.json`;

if (fs.existsSync(distConfigPath)) {
  try {
    const { defaults: userDefaults } = JSON.parse(
      fs.readFileSync(distConfigPath, "utf-8"),
    );
    if (userDefaults) {
      // Previously written defaults override the ones shipped in source.
      sourceConfig.defaults = { ...sourceConfig.defaults, ...userDefaults };
    }
  } catch {
    // invalid existing config – overwrite entirely
  }
}

fs.writeFileSync(distConfigPath, `${JSON.stringify(sourceConfig, null, 2)}\n`);
fs.writeFileSync(`${cliOutDir}/package.json`, '{\n  "type": "module"\n}\n');
fs.chmodSync(cliOutFile, 0o755);

/* ── auto-link the `evals` binary globally (best effort) ── */
const { status: linkStatus } = spawnSync("npm", ["link", "--force"], {
  stdio: "inherit",
  cwd: evalsDir,
});
if (linkStatus !== 0) {
  console.warn(
    "⚠  npm link failed (non-fatal) – you can run `npm link` manually from packages/evals",
  );
}


================================================
FILE: packages/evals/scripts/build-esm.ts
================================================
/**
 * Build canonical dist/esm output for evals (plus assets/config).
 *
 * Prereqs: pnpm install.
 * Args: none.
 * Env: none.
 * Example: pnpm run build:esm
 */
import fs from "node:fs";
import { spawnSync } from "node:child_process";
import { getRepoRootDir } from "../runtimePaths.js";

const repoRoot = getRepoRootDir();
const evalsDir = `${repoRoot}/packages/evals`;
const esmOutDir = `${evalsDir}/dist/esm`;

/** Runs `pnpm <args>` from the repo root; exits the process if it fails. */
const run = (args: string[]) => {
  const { status } = spawnSync("pnpm", args, {
    stdio: "inherit",
    cwd: repoRoot,
  });
  if (status === 0) return;
  process.exit(status ?? 1);
};

// Start from a clean output directory.
fs.rmSync(esmOutDir, { recursive: true, force: true });

// Evals run from dist/esm JS, but still need config/assets/datasets on disk.
run(["exec", "tsc", "-p", "packages/evals/tsconfig.json"]);

fs.mkdirSync(esmOutDir, { recursive: true });
fs.writeFileSync(`${esmOutDir}/package.json`, '{\n  "type": "module"\n}\n');

/** Copies one file from the package root into dist/esm, if it exists. */
const copyFile = (filename: string) => {
  const from = `${evalsDir}/${filename}`;
  if (!fs.existsSync(from)) return;
  fs.copyFileSync(from, `${esmOutDir}/${filename}`);
};

/** Recursively copies one directory from the package root into dist/esm, if it exists. */
const copyDir = (dirname: string) => {
  const from = `${evalsDir}/${dirname}`;
  if (!fs.existsSync(from)) return;
  fs.cpSync(from, `${esmOutDir}/${dirname}`, { recursive: true });
};

copyFile("evals.config.json");
copyDir("datasets");
copyDir("assets");


================================================
FILE: packages/evals/scripts/test-evals.ts
================================================
/**
 * Eval runs via the evals CLI from source or dist/esm.
 *
 * Prereqs: source mode uses tsx loader; dist mode requires compiled CLI output.
 * Args: [target] [options...] (passed to evals run) | --cli <path> [target] [options...] | --list (prints JSON matrix).
 * Env: STAGEHAND_BROWSER_TARGET=local|browserbase, NODE_V8_COVERAGE, NODE_OPTIONS;
 *      writes JUnit to ctrf/evals/<target>.xml and CTRF to ctrf/evals/<target>.json.
 * Example: STAGEHAND_BROWSER_TARGET=browserbase pnpm run test:evals -- act -t 3 -c 10
 */
import fs from "node:fs";
import path from "node:path";
import { spawnSync } from "node:child_process";
import { getCurrentFilePath, getRepoRootDir } from "../runtimePaths.js";

/** How the evals CLI is executed: TypeScript sources or the compiled dist output. */
type Runtime = "source" | "dist-esm";

/** One eval/model pair as listed in the eval summary file. */
type EvalSummaryEntry = {
  eval: string;
  model: string;
  categories?: string[];
};

/** Shape read from the eval summary JSON; either list may be absent. */
type EvalSummary = {
  passed?: EvalSummaryEntry[];
  failed?: EvalSummaryEntry[];
};

/** Replaces every `/` and `\` in `name` with `-` so it can be used as a file name. */
const toSafeName = (name: string) => name.split(/[\\/]/).join("-");

/**
 * Loads the eval summary JSON at `summaryPath`.
 *
 * Returns `null` when the file does not exist, and also when it cannot be
 * read or parsed (in which case a warning is printed).
 */
const readEvalSummary = (summaryPath: string): EvalSummary | null => {
  if (fs.existsSync(summaryPath)) {
    try {
      const raw = fs.readFileSync(summaryPath, "utf8");
      return JSON.parse(raw) as EvalSummary;
    } catch (error) {
      console.warn(
        `Failed to parse eval summary at ${summaryPath}: ${String(error)}`,
      );
    }
  }
  return null;
};

/** Escapes `&`, `<`, `>`, `"` and `'` so `value` is safe in XML text and attributes. */
const escapeXml = (value: string) => {
  const entities: Record<string, string> = {
    "&": "&amp;",
    "<": "&lt;",
    ">": "&gt;",
    '"': "&quot;",
    "'": "&apos;",
  };
  // One pass over the input, so already-produced entities are never re-escaped.
  return value.replace(/[&<>"']/g, (ch) => entities[ch] ?? ch);
};

/**
 * Writes a JUnit XML report for one eval category to `outputPath`.
 *
 * Each passed entry of the summary becomes a passing testcase and each failed
 * entry a testcase with a `<failure>` listing its categories. When the summary
 * cannot be loaded, the suite contains a single failing "summary missing"
 * testcase instead.
 */
const writeEvalJunit = (
  summaryPath: string,
  outputPath: string,
  category: string,
) => {
  const summary = readEvalSummary(summaryPath);
  const suiteName = `evals-${category}`;

  // Shared opening of a <testcase> element (without the closing `>` / ` />`).
  const openTestcase = (name: string) =>
    `    <testcase name="${escapeXml(name)}" classname="${escapeXml(suiteName)}" time="0"`;
  const failingCase = (name: string, message: string, detail: string) => [
    `${openTestcase(name)}>`,
    `      <failure message="${message}">${escapeXml(detail)}</failure>`,
    "    </testcase>",
  ];
  const entryName = (item: EvalSummaryEntry) =>
    `evals/${item.eval} [${item.model}]`;

  let cases: string[];
  let tests: number;
  let failures: number;

  if (summary === null) {
    cases = failingCase(
      `evals/${category} summary missing`,
      "eval summary missing",
      `Missing eval summary at ${summaryPath}`,
    );
    tests = 1;
    failures = 1;
  } else {
    const passed = summary.passed ?? [];
    const failed = summary.failed ?? [];
    cases = [
      ...passed.map((item) => `${openTestcase(entryName(item))} />`),
      ...failed.flatMap((item) =>
        failingCase(
          entryName(item),
          "eval failed",
          `categories=${(item.categories ?? []).join(",")}`,
        ),
      ),
    ];
    tests = passed.length + failed.length;
    failures = failed.length;
  }

  const lines = [
    '<?xml version="1.0" encoding="utf-8"?>',
    "<testsuites>",
    `  <testsuite name="${escapeXml(suiteName)}" tests="${tests}" failures="${failures}" errors="0" skipped="0" time="0">`,
    ...cases,
    "  </testsuite>",
    "</testsuites>",
    "",
  ];

  fs.writeFileSync(outputPath, lines.join("\n"));
};

/**
 * Writes a CTRF JSON report for one eval category to `outputPath`.
 *
 * With a loaded summary, every passed/failed entry becomes one test record.
 * Without one, the report holds a single failed "summary missing" record.
 * Durations and start/stop times are always written as 0.
 */
const writeEvalCtrf = (
  summaryPath: string,
  outputPath: string,
  category: string,
) => {
  const timestamp = new Date().toISOString();
  const summary = readEvalSummary(summaryPath);

  let tests: Array<{
    name: string;
    status: string;
    duration: number;
    suite: string[];
  }>;
  let passedCount: number;
  let failedCount: number;

  if (summary) {
    const passed = summary.passed ?? [];
    const failed = summary.failed ?? [];
    const toRecords = (entries: typeof passed, status: "passed" | "failed") =>
      entries.map((item) => ({
        name: `evals/${item.eval} [${item.model}]`,
        status,
        duration: 0,
        suite: ["evals", category, ...(item.categories ?? [])],
      }));

    tests = [...toRecords(passed, "passed"), ...toRecords(failed, "failed")];
    passedCount = passed.length;
    failedCount = failed.length;
  } else {
    // No usable summary: surface that as one failed test.
    tests = [
      {
        name: `evals/${category} summary missing`,
        status: "failed",
        duration: 0,
        suite: ["evals", category],
      },
    ];
    passedCount = 0;
    failedCount = 1;
  }

  const report = {
    reportFormat: "CTRF",
    specVersion: "0.0.0",
    generatedBy: "stagehand-evals",
    timestamp,
    results: {
      tool: { name: "evals" },
      summary: {
        tests: passedCount + failedCount,
        passed: passedCount,
        failed: failedCount,
        skipped: 0,
        pending: 0,
        other: 0,
        start: 0,
        stop: 0,
      },
      tests,
    },
  };

  fs.writeFileSync(outputPath, JSON.stringify(report, null, 2));
};

// Repository root, derived from this script's own location on disk.
const repoRoot = getRepoRootDir();
/** Converts every backslash in `value` to a forward slash. */
const toPosix = (value: string) => value.split("\\").join("/");
/** Returns absolute paths unchanged; resolves relative ones against the repo root. */
const resolveRepoRelative = (value: string) => {
  if (path.isAbsolute(value)) return value;
  return path.resolve(repoRoot, value);
};
/**
 * Returns "dist-esm" when the path points into a `dist/cli` or `dist/esm`
 * directory, and `null` when nothing can be inferred from it.
 */
const inferRuntimeFromPath = (value: string) => {
  const posixPath = toPosix(value);
  const pointsIntoDist = ["/dist/cli/", "/dist/esm/"].some((segment) =>
    posixPath.includes(segment),
  );
  return pointsIntoDist ? ("dist-esm" as const) : null;
};
// Infers the runtime from where this script itself lives, falling back to the
// current working directory; yields null when neither path points into dist.
const inferRuntimeFromExecution = () =>
  inferRuntimeFromPath(getCurrentFilePath()) ??
  inferRuntimeFromPath(process.cwd());
// Command-line arguments with every bare `--` separator removed.
const rawArgs = process.argv.slice(2).filter((arg) => arg !== "--");
// `--list` switches the script into "print the category matrix" mode.
const listRequested = rawArgs.includes("--list");
/**
 * Separates the `--cli <path>` / `--cli=<path>` option from the other arguments.
 *
 * Returns the remaining arguments in order, plus the CLI path:
 * - `null` when the option was not given,
 * - `""` when `--cli` had no usable value (nothing follows it, or the next
 *   argument starts with `--`, which is then kept as a regular argument),
 * - otherwise the supplied value. If the option repeats, the last one wins.
 */
const stripCliArg = (values: string[]) => {
  const inlinePrefix = "--cli=";
  const filtered: string[] = [];
  let cliPath: string | null = null;

  let index = 0;
  while (index < values.length) {
    const current = values[index];
    index += 1;

    if (current.startsWith(inlinePrefix)) {
      cliPath = current.slice(inlinePrefix.length);
      continue;
    }
    if (current !== "--cli") {
      filtered.push(current);
      continue;
    }

    // Bare `--cli`: consume the following argument only if it looks like a value.
    const candidate = values[index];
    if (candidate && !candidate.startsWith("--")) {
      cliPath = candidate;
      index += 1;
    } else {
      cliPath = "";
    }
  }

  return { filtered, cliPath };
};
// Pull the --cli option out of the arguments (with --list already removed).
const strippedCli = stripCliArg(rawArgs.filter((arg) => arg !== "--list"));
// An empty string (as opposed to null) means --cli was given without a usable value.
if (strippedCli.cliPath === "") {
  console.error("Missing value for --cli.");
  process.exit(1);
}
// Remaining arguments, forwarded to the eval CLI further down.
const args = strippedCli.filtered;

// --list: print one JSON entry per eval category and exit without running anything.
if (listRequested) {
  // EVAL_CATEGORIES (comma-separated) overrides the built-in category list.
  const rawCategories =
    process.env.EVAL_CATEGORIES ??
    "observe,act,combination,extract,targeted_extract,regression,agent";
  const entries = rawCategories.split(",").map((category) => {
    const safe_name = toSafeName(category);
    return { category, name: category, safe_name };
  });
  console.log(JSON.stringify(entries));
  process.exit(0);
}

// Reject an explicitly supplied CLI path that points into a dist/cjs build.
if (
  strippedCli.cliPath &&
  toPosix(resolveRepoRelative(strippedCli.cliPath)).includes("/dist/cjs/")
) {
  console.error("CJS eval runtime is not supported. Use source or dist/cli.");
  process.exit(1);
}

// Runtime selection, in priority order: inferred from the --cli path, inferred
// from where this script is executing, and finally the "source" default.
const runtime: Runtime =
  (strippedCli.cliPath
    ? inferRuntimeFromPath(resolveRepoRelative(strippedCli.cliPath))
    : null) ??
  inferRuntimeFromExecution() ??
  "source";

// Entry point of the eval CLI: the explicit --cli path when given, otherwise
// the TypeScript source for the "source" runtime or the built dist/cli file.
const cliPath = strippedCli.cliPath
  ? resolveRepoRelative(strippedCli.cliPath)
  : runtime === "source"
    ? `${repoRoot}/packages/evals/cli.ts`
    : `${repoRoot}/packages/evals/dist/cli/cli.js`;
// Fail early with a readable message instead of letting the child process fail.
if (!fs.existsSync(cliPath)) {
  console.error(`Missing ${cliPath}.`);
  process.exit(1);
}

// Help request (`--help`, `-h`, or a leading `help`): delegate to the eval CLI's
// own --help output and exit with its status (0 when no status is reported).
if (
  args[0] === "help" ||
  args.some((arg) => arg === "--help" || arg === "-h")
) {
  // The TypeScript source entry point needs the tsx loader; built output does not.
  const loaderArgs = runtime === "source" ? ["--import", "tsx"] : [];
  const helpRun = spawnSync(
    process.execPath,
    [...loaderArgs, cliPath, "--help"],
    {
      stdio: "inherit",
      cwd: repoRoot,
    },
  );
  process.exit(helpRun.status ?? 0);
}

// The eval CLI is always invoked through its `run` subcommand; add it when the
// caller did not.
const hasRun = args[0] === "run";
const argsAfterRun = hasRun ? args.slice(1) : args;
// The first non-flag argument names the eval target; "all" when none is given.
const target =
  argsAfterRun.find((arg) => !arg.startsWith("-"))?.trim() || "all";
const safeTarget = toSafeName(target);
const cliArgs = hasRun ? args : ["run", ...args];

// Append --enable-source-maps to whatever NODE_OPTIONS the caller already set.
const baseNodeOptions = "--enable-source-maps";
const nodeOptions = [process.env.NODE_OPTIONS, baseNodeOptions]
  .filter(Boolean)
  .join(" ");

// V8 coverage directory: NODE_V8_COVERAGE when set, otherwise a per-target
// directory under coverage/evals.
const coverageDir = resolveRepoRelative(
  process.env.NODE_V8_COVERAGE ?? `${repoRoot}/coverage/evals/${safeTarget}`,
);
fs.mkdirSync(coverageDir, { recursive: true });
// NOTE(review): this file is not removed before the run, so if the child exits
// without writing it, a summary left by an earlier run would still be present
// when the reports below are generated - confirm whether that is intended.
const summaryPath = `${repoRoot}/eval-summary.json`;
fs.mkdirSync(`${repoRoot}/ctrf/evals`, { recursive: true });
const junitPath = `${repoRoot}/ctrf/evals/${safeTarget}.xml`;
const ctrfPath = `${repoRoot}/ctrf/evals/${safeTarget}.json`;

const env = {
  ...process.env,
  NODE_OPTIONS: nodeOptions,
  NODE_V8_COVERAGE: coverageDir,
};

// Run the eval CLI synchronously; the tsx loader is only added for the
// TypeScript source entry point.
const result = spawnSync(
  process.execPath,
  [...(runtime === "source" ? ["--import", "tsx"] : []), cliPath, ...cliArgs],
  {
    stdio: "inherit",
    env,
    cwd: repoRoot,
  },
);

// Reports are written regardless of how the child exited.
writeEvalJunit(summaryPath, junitPath, safeTarget);
writeEvalCtrf(summaryPath, ctrfPath, safeTarget);

// Propagate the child's exit code; a missing status is treated as failure.
process.exit(result.status ?? 1);


================================================
FILE: packages/evals/suites/gaia.ts
================================================
import path from "path";
import type { Testcase, EvalInput } from "../types/evals.js";
import type { AvailableModel } from "@browserbasehq/stagehand";
import { tasksConfig } from "../taskConfig.js";
import { getCurrentDirPath } from "../runtimePaths.js";
import { readJsonlFile, parseJsonlRows, applySampling } from "../utils.js";

/**
 * Builds the GAIA benchmark testcases: one `agent/gaia` testcase for every
 * (model, dataset row) pair, models in the outer order and rows in the inner.
 *
 * Environment variables read:
 * - `EVAL_GAIA_FILE`: dataset path; defaults to `datasets/gaia/GAIA_web.jsonl`
 *   one level above the directory returned by `getCurrentDirPath()`.
 * - `EVAL_GAIA_LEVEL`: when it parses to a truthy number, only rows whose
 *   `Level` equals it are kept.
 * - `EVAL_MAX_K`, then `EVAL_GAIA_LIMIT`: case limit passed to `applySampling`
 *   (25 when neither is set).
 * - `EVAL_GAIA_SAMPLE`: sample count passed to `applySampling`.
 *
 * @param models Model names to generate testcases for.
 * @returns The generated testcases.
 */
export const buildGAIATestcases = (models: string[]): Testcase[] => {
  type GaiaRow = {
    id: string;
    Level?: number;
    web: string;
    ques: string;
    [key: string]: unknown;
  };

  // Unset or empty variables count as "not provided"; anything else goes
  // through Number() unchanged.
  const numberFromEnv = (name: string): number | undefined => {
    const raw = process.env[name];
    return raw ? Number(raw) : undefined;
  };

  // A usable row needs string `id`, `web` and `ques` fields.
  const isGaiaRow = (parsed: unknown): parsed is GaiaRow => {
    if (parsed === null || typeof parsed !== "object") return false;
    const { id, web, ques } = parsed as Record<string, unknown>;
    return [id, web, ques].every((field) => typeof field === "string");
  };

  const hereDir = getCurrentDirPath();
  const datasetPath =
    process.env.EVAL_GAIA_FILE ||
    path.join(hereDir, "..", "datasets", "gaia", "GAIA_web.jsonl");
  const rawLines = readJsonlFile(datasetPath);

  const levelFilter = numberFromEnv("EVAL_GAIA_LEVEL");
  const maxCases =
    numberFromEnv("EVAL_MAX_K") ?? numberFromEnv("EVAL_GAIA_LIMIT") ?? 25;
  const sampleCount = numberFromEnv("EVAL_GAIA_SAMPLE");

  const parsedRows = parseJsonlRows(rawLines, isGaiaRow);
  const eligibleRows = levelFilter
    ? parsedRows.filter((row) => row.Level === levelFilter)
    : parsedRows;
  const gaiaRows = applySampling(eligibleRows, sampleCount, maxCases);

  // Assembles the testcase for a single (model, row) pair.
  const toTestcase = (model: string, row: GaiaRow): Testcase => {
    // The expected answer is only forwarded when the dataset stores it as a string.
    const finalAnswer = row["Final answer"];
    const input: EvalInput = {
      name: "agent/gaia",
      modelName: model as AvailableModel,
      params: {
        id: row.id,
        level: row.Level,
        web: row.web,
        ques: row.ques,
        expected: typeof finalAnswer === "string" ? finalAnswer : undefined,
      },
    };
    const categoryTags = (
      tasksConfig.find((t) => t.name === input.name)?.categories || []
    ).map((x) => `category/${x}`);
    const levelTag = row.Level
      ? `gaia/level/${row.Level}`
      : "gaia/level/unknown";
    return {
      input,
      name: input.name,
      tags: [model, input.name, ...categoryTags, `gaia/id/${row.id}`, levelTag],
      metadata: {
        model: model as AvailableModel,
        test: `${input.name}:${row.id}`,
      },
      expected: true,
    };
  };

  const testcases: Testcase[] = [];
  for (const model of models) {
    for (const row of gaiaRows) {
      testcases.push(toTestcase(model, row));
    }
  }
  return testcases;
};


================================================
FILE: packages/evals/suites/onlineMind2Web.ts
================================================
import path from "path";
import type { Testcase, EvalInput } from "../types/evals.js";
import type { AvailableModel } from "@browserbasehq/stagehand";
import { tasksConfig } from "../taskConfig.js";
import { getCurrentDirPath } from "../runtimePaths.js";
import { readJsonlFile, parseJsonlRows, applySampling } from "../utils.js";

/**
 * Builds the Online-Mind2Web testcases: one `agent/onlineMind2Web` testcase for
 * every (model, dataset row) pair, models in the outer order and rows in the
 * inner.
 *
 * The dataset is read from `datasets/onlineMind2Web/onlineMind2Web.jsonl` one
 * level above the directory returned by `getCurrentDirPath()`.
 *
 * Environment variables read:
 * - `EVAL_MAX_K`, then `EVAL_ONLINEMIND2WEB_LIMIT`: case limit passed to
 *   `applySampling` (25 when neither is set).
 * - `EVAL_ONLINEMIND2WEB_SAMPLE`: sample count passed to `applySampling`.
 *
 * @param models Model names to generate testcases for.
 * @returns The generated testcases.
 */
export const buildOnlineMind2WebTestcases = (models: string[]): Testcase[] => {
  type Mind2WebRow = {
    task_id: string;
    confirmed_task: string;
    website: string;
    reference_length?: number;
    level?: string;
    [key: string]: unknown;
  };

  // Unset or empty variables count as "not provided"; anything else goes
  // through Number() unchanged.
  const numberFromEnv = (name: string): number | undefined => {
    const raw = process.env[name];
    return raw ? Number(raw) : undefined;
  };

  // A usable row needs string `task_id`, `confirmed_task` and `website` fields.
  const isMind2WebRow = (parsed: unknown): parsed is Mind2WebRow => {
    if (parsed === null || typeof parsed !== "object") return false;
    const { task_id, confirmed_task, website } = parsed as Record<
      string,
      unknown
    >;
    return [task_id, confirmed_task, website].every(
      (field) => typeof field === "string",
    );
  };

  const hereDir = getCurrentDirPath();
  const datasetPath = path.join(
    hereDir,
    "..",
    "datasets",
    "onlineMind2Web",
    "onlineMind2Web.jsonl",
  );
  const rawLines = readJsonlFile(datasetPath);

  const maxCases =
    numberFromEnv("EVAL_MAX_K") ??
    numberFromEnv("EVAL_ONLINEMIND2WEB_LIMIT") ??
    25;
  const sampleCount = numberFromEnv("EVAL_ONLINEMIND2WEB_SAMPLE");

  const parsedRows = parseJsonlRows(rawLines, isMind2WebRow);
  const rows = applySampling(parsedRows, sampleCount, maxCases);

  // Assembles the testcase for a single (model, row) pair.
  const toTestcase = (model: string, row: Mind2WebRow): Testcase => {
    const input: EvalInput = {
      name: "agent/onlineMind2Web",
      modelName: model as AvailableModel,
      params: {
        task_id: row.task_id,
        confirmed_task: row.confirmed_task,
        website: row.website,
        reference_length: row.reference_length,
        level: row.level,
      },
    };
    const taskCategories =
      tasksConfig.find((t) => t.name === input.name)?.categories || [];
    return {
      input,
      name: input.name,
      // Only the model and a plain dataset tag are attached.
      tags: [model, "mind2web"],
      metadata: {
        model: model as AvailableModel,
        test: `${input.name}:${row.task_id}`,
        category: taskCategories[0] || "agent",
        categories: taskCategories,
        dataset: "onlineMind2Web",
        task_id: row.task_id,
        difficulty: row.level,
        website: row.website,
      },
      expected: true,
    };
  };

  const testcases: Testcase[] = [];
  for (const model of models) {
    for (const row of rows) {
      testcases.push(toTestcase(model, row));
    }
  }
  return testcases;
};


================================================
FILE: packages/evals/suites/webtailbench.ts
================================================
import type { Testcase, EvalInput } from "../types/evals.js";
import type { AvailableModel } from "@browserbasehq/stagehand";
import { tasksConfig } from "../taskConfig.js";
import { getCurrentDirPath } from "../runtimePaths.js";
import { readJsonlFile, parseJsonlRows, applySampling } from "../utils.js";

/**
 * Builds the WebTailBench testcases: one `agent/webtailbench` testcase for
 * every (model, dataset row) pair, models in the outer order and rows in the
 * inner.
 *
 * The dataset is read from `datasets/webtailbench/WebTailBench_data.jsonl` one
 * level above the directory returned by `getCurrentDirPath()`.
 *
 * Environment variables read:
 * - `EVAL_MAX_K`, then `EVAL_WEBTAILBENCH_LIMIT`: case limit passed to
 *   `applySampling` (25 when neither is set).
 * - `EVAL_WEBTAILBENCH_SAMPLE`: sample count passed to `applySampling`.
 *
 * @param models Model names to generate testcases for.
 * @returns The generated testcases.
 */
export const buildWebTailBenchTestcases = (models: string[]): Testcase[] => {
  type WebTailBenchRow = {
    id: string;
    ques: string;
    category?: string;
    web?: string;
    [key: string]: unknown;
  };

  // Unset or empty variables count as "not provided"; anything else goes
  // through Number() unchanged.
  const numberFromEnv = (name: string): number | undefined => {
    const raw = process.env[name];
    return raw ? Number(raw) : undefined;
  };

  // A usable row needs string `id` and `ques` fields; the rest is optional.
  const isWebTailBenchRow = (parsed: unknown): parsed is WebTailBenchRow => {
    if (parsed === null || typeof parsed !== "object") return false;
    const { id, ques } = parsed as Record<string, unknown>;
    return [id, ques].every((field) => typeof field === "string");
  };

  const hereDir = getCurrentDirPath();
  const datasetPath = `${hereDir}/../datasets/webtailbench/WebTailBench_data.jsonl`;
  const rawLines = readJsonlFile(datasetPath);

  const maxCases =
    numberFromEnv("EVAL_MAX_K") ??
    numberFromEnv("EVAL_WEBTAILBENCH_LIMIT") ??
    25;
  const sampleCount = numberFromEnv("EVAL_WEBTAILBENCH_SAMPLE");

  const parsedRows = parseJsonlRows(rawLines, isWebTailBenchRow);
  const rows = applySampling(parsedRows, sampleCount, maxCases);

  // Assembles the testcase for a single (model, row) pair.
  const toTestcase = (model: string, row: WebTailBenchRow): Testcase => {
    const input: EvalInput = {
      name: "agent/webtailbench",
      modelName: model as AvailableModel,
      params: {
        id: row.id,
        category: row.category,
        ques: row.ques,
        web: row.web,
      },
    };
    const taskCategories =
      tasksConfig.find((t) => t.name === input.name)?.categories || [];
    return {
      input,
      name: input.name,
      tags: [model, "webtailbench"],
      metadata: {
        model: model as AvailableModel,
        test: `${input.name}:${row.id}`,
        category: taskCategories[0] || "agent",
        categories: taskCategories,
        dataset: "webtailbench",
        task_id: row.id,
        task_category: row.category,
      },
      expected: true,
    };
  };

  const testcases: Testcase[] = [];
  for (const model of models) {
    for (const row of rows) {
      testcases.push(toTestcase(model, row));
    }
  }
  return testcases;
};


================================================
FILE: packages/evals/suites/webvoyager.ts
================================================
import path from "path";
import type { Testcase, EvalInput } from "../types/evals.js";
import type { AvailableModel } from "@browserbasehq/stagehand";
import { tasksConfig } from "../taskConfig.js";
import { getCurrentDirPath } from "../runtimePaths.js";
import { readJsonlFile, parseJsonlRows, applySampling } from "../utils.js";

/**
 * Builds the WebVoyager testcases: one `agent/webvoyager` testcase for every
 * (model, dataset row) pair, models in the outer order and rows in the inner.
 *
 * The dataset is read from `datasets/webvoyager/WebVoyager_data.jsonl` one
 * level above the directory returned by `getCurrentDirPath()`.
 *
 * Environment variables read:
 * - `EVAL_MAX_K`, then `EVAL_WEBVOYAGER_LIMIT`: case limit passed to
 *   `applySampling` (25 when neither is set).
 * - `EVAL_WEBVOYAGER_SAMPLE`: sample count passed to `applySampling`.
 *
 * @param models Model names to generate testcases for.
 * @returns The generated testcases.
 */
export const buildWebVoyagerTestcases = (models: string[]): Testcase[] => {
  type VoyagerRow = {
    id: string;
    web: string;
    ques: string;
    web_name?: string;
    [key: string]: unknown;
  };

  // Unset or empty variables count as "not provided"; anything else goes
  // through Number() unchanged.
  const numberFromEnv = (name: string): number | undefined => {
    const raw = process.env[name];
    return raw ? Number(raw) : undefined;
  };

  // A usable row needs string `id`, `web` and `ques` fields.
  const isVoyagerRow = (parsed: unknown): parsed is VoyagerRow => {
    if (parsed === null || typeof parsed !== "object") return false;
    const { id, web, ques } = parsed as Record<string, unknown>;
    return [id, web, ques].every((field) => typeof field === "string");
  };

  const hereDir = getCurrentDirPath();
  const datasetPath = path.join(
    hereDir,
    "..",
    "datasets",
    "webvoyager",
    "WebVoyager_data.jsonl",
  );
  const rawLines = readJsonlFile(datasetPath);

  const maxCases =
    numberFromEnv("EVAL_MAX_K") ??
    numberFromEnv("EVAL_WEBVOYAGER_LIMIT") ??
    25;
  const sampleCount = numberFromEnv("EVAL_WEBVOYAGER_SAMPLE");

  const parsedRows = parseJsonlRows(rawLines, isVoyagerRow);
  const rows = applySampling(parsedRows, sampleCount, maxCases);

  // Assembles the testcase for a single (model, row) pair.
  const toTestcase = (model: string, row: VoyagerRow): Testcase => {
    const input: EvalInput = {
      name: "agent/webvoyager",
      modelName: model as AvailableModel,
      params: {
        id: row.id,
        web: row.web,
        ques: row.ques,
        web_name: row.web_name,
      },
    };
    const taskCategories =
      tasksConfig.find((t) => t.name === input.name)?.categories || [];
    return {
      input,
      name: input.name,
      // Only the model and a plain dataset tag are attached.
      tags: [model, "webvoyager"],
      metadata: {
        model: model as AvailableModel,
        test: `${input.name}:${row.id}`,
        category: taskCategories[0] || "agent",
        categories: taskCategories,
        dataset: "webvoyager",
        task_id: row.id,
        // Prefer the readable site name; fall back to the raw `web` value.
        website: row.web_name || row.web,
      },
      expected: true,
    };
  };

  const testcases: Testcase[] = [];
  for (const model of models) {
    for (const row of rows) {
      testcases.push(toTestcase(model, row));
    }
  }
  return testcases;
};


================================================
FILE: packages/evals/summary.ts
================================================
import fs from "fs";
import { tasksByName } from "./taskConfig.js";
import type { SummaryResult } from "./types/evals.js";
import { getRepoRootDir } from "./runtimePaths.js";

// Repository root as reported by getRepoRootDir(); the summary file is written directly under it.
const repoRoot = getRepoRootDir();

/**
 * Aggregates eval results and writes them to `eval-summary.json` in the
 * repository root.
 *
 * The written object contains:
 * - `experimentName`: passed through unchanged.
 * - `passed` / `failed`: one `{ eval, model, categories }` entry per result,
 *   split on `output._success`.
 * - `categories`: success percentage (rounded) per category.
 * - `models`: success percentage (rounded) per model that has results.
 *
 * Every category of every configured task receives an entry in `categories`,
 * including categories with no results in this run. For those the percentage
 * is 0/0 = NaN, which `JSON.stringify` writes as `null`.
 *
 * @param results Individual eval results to summarize.
 * @param experimentName Name recorded in the summary.
 */
export const generateSummary = async (
  results: SummaryResult[],
  experimentName: string,
) => {
  // A result whose task is missing from the config contributes no categories
  // instead of throwing and losing the whole summary.
  const categoriesOf = (taskName: string): string[] =>
    tasksByName[taskName]?.categories ?? [];

  const toEntry = (r: SummaryResult) => ({
    eval: r.input.name,
    model: r.input.modelName,
    categories: categoriesOf(r.input.name),
  });

  const passed = results.filter((r) => r.output._success).map(toEntry);
  const failed = results.filter((r) => !r.output._success).map(toEntry);

  // Tally totals and successes per category, driven by the configured tasks.
  const categorySuccessCounts: Record<
    string,
    { total: number; success: number }
  > = {};
  for (const taskName of Object.keys(tasksByName)) {
    const taskCategories = tasksByName[taskName].categories;
    const taskResults = results.filter((r) => r.input.name === taskName);
    const successCount = taskResults.filter((r) => r.output._success).length;

    for (const cat of taskCategories) {
      if (!categorySuccessCounts[cat]) {
        categorySuccessCounts[cat] = { total: 0, success: 0 };
      }
      categorySuccessCounts[cat].total += taskResults.length;
      categorySuccessCounts[cat].success += successCount;
    }
  }

  const categories: Record<string, number> = {};
  for (const [cat, counts] of Object.entries(categorySuccessCounts)) {
    categories[cat] = Math.round((counts.success / counts.total) * 100);
  }

  // Models are taken from the results themselves, so each has at least one result.
  const models: Record<string, number> = {};
  const allModels = [...new Set(results.map((r) => r.input.modelName))];
  for (const model of allModels) {
    const modelResults = results.filter((r) => r.input.modelName === model);
    const successCount = modelResults.filter((r) => r.output._success).length;
    models[model] = Math.round((successCount / modelResults.length) * 100);
  }

  const formattedSummary = {
    experimentName,
    passed,
    failed,
    categories,
    models,
  };

  const summaryPath = `${repoRoot}/eval-summary.json`;
  fs.writeFileSync(summaryPath, JSON.stringify(formattedSummary, null, 2));
  console.log(`Evaluation summary written to ${summaryPath}`);
};


================================================
FILE: packages/evals/taskConfig.ts
================================================
/**
 * This file is responsible for:
 * - Loading and parsing the `evals.config.json` file, which defines tasks (evaluations) and their associated categories.
 * - Building a lookup structure (`tasksByName`) to map each task name to its categories.
 * - Filtering tasks based on command-line arguments (e.g., `filterByEvalName`) and ensuring that requested tasks exist.
 * - Determining which models to use for evaluations, depending on the category and environment variables.
 * - Validating that the chosen models are supported.
 *
 * The exported bindings (`tasksByName`, `MODELS`, `tasksConfig`, `getModelList`, `getAgentModelEntries`) are used by the
 * main evaluation script and other modules to know which tasks and models are available, and to configure the evaluations accordingly.
 */

import fs from "fs";
import path from "path";
import { AvailableModel } from "@browserbasehq/stagehand";
import { filterByEvalName } from "./args.js";
import { AgentModelEntry } from "./types/evals.js";
import { getCurrentDirPath } from "./runtimePaths.js";

// Pool of model names grouped by provider. In this file it is only read by
// getModelList, which filters it by provider when EVAL_PROVIDER is set.
const ALL_EVAL_MODELS = [
  // GOOGLE
  "gemini-2.0-flash",
  "gemini-2.0-flash-lite",
  "gemini-1.5-flash",
  "gemini-2.5-pro-exp-03-25",
  "gemini-1.5-pro",
  "gemini-1.5-flash-8b",
  "gemini-2.5-flash-preview-04-17",
  "gemini-2.5-pro-preview-03-25",
  // ANTHROPIC
  "claude-sonnet-4-6",
  // OPENAI
  "gpt-4o-mini",
  "gpt-4o",
  "gpt-4.5-preview",
  "o3",
  "o3-mini",
  "o4-mini",
  // TOGETHER - META
  "meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo",
  "meta-llama/Llama-3.3-70B-Instruct-Turbo",
  "meta-llama/Llama-4-Scout-17B-16E-Instruct",
  "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8",
  // TOGETHER - DEEPSEEK
  "deepseek-ai/DeepSeek-V3",
  "Qwen/Qwen2.5-7B-Instruct-Turbo",
  // GROQ
  "groq/meta-llama/llama-4-scout-17b-16e-instruct",
  "groq/llama-3.3-70b-versatile",
  "groq/llama3-70b-8192",
  "groq/qwen-qwq-32b",
  "groq/qwen-2.5-32b",
  "groq/deepseek-r1-distill-qwen-32b",
  "groq/deepseek-r1-distill-llama-70b",
  // CEREBRAS
  "cerebras/llama3.3-70b",
];

// The configuration file `evals.config.json` contains a list of tasks and their associated categories.
// It is read synchronously at module load from the directory returned by getCurrentDirPath().
const moduleDir = getCurrentDirPath();
const configPath = path.join(moduleDir, "evals.config.json");
// NOTE: JSON.parse returns `any`, so the `satisfies` clause below documents the
// expected shape but does not validate the file contents.
const config = JSON.parse(fs.readFileSync(configPath, "utf-8")) satisfies {
  tasks: {
    name: string;
    categories: string[];
  }[];
};

/**
 * Shape of one entry in the `tasks` array of the config file: a task name plus
 * the categories it belongs to.
 */
type TaskConfig = {
  name: string;
  categories: string[];
};

/** Every task declared in the config file, as listed there. */
const tasksConfig = config.tasks as TaskConfig[];

/**
 * Lookup from task name to its categories. When the same name appears more
 * than once, the later entry replaces the earlier one.
 */
const tasksByName: Record<string, { categories: string[] }> = {};
for (const { name, categories } of tasksConfig) {
  tasksByName[name] = { categories };
}

/**
 * Abort at load time when a specific eval was requested by name but no task
 * with that name is configured.
 */
if (filterByEvalName) {
  const requestedTask = tasksByName[filterByEvalName];
  if (!requestedTask) {
    console.error(`Error: Evaluation "${filterByEvalName}" does not exist.`);
    process.exit(1);
  }
}

/**
 * Reads a comma-separated model list from an environment variable.
 * Returns undefined when the variable is unset or empty; entries are not trimmed.
 */
const readModelListEnv = (name: string): string[] | undefined => {
  const raw = process.env[name];
  return raw ? raw.split(",") : undefined;
};

/**
 * Models used for non-agent categories when no provider filter is active.
 * Overridable through EVAL_MODELS.
 */
const DEFAULT_EVAL_MODELS = readModelListEnv("EVAL_MODELS") ?? [
  "google/gemini-2.0-flash",
  "openai/gpt-4.1-mini",
  "anthropic/claude-haiku-4-5",
];

// Standard agent models - these run with stagehand.agent().
// Overridable through EVAL_AGENT_MODELS.
const AGENT_MODELS = readModelListEnv("EVAL_AGENT_MODELS") ?? [
  "anthropic/claude-sonnet-4-20250514",
];

// CUA agent models - these run with stagehand.agent({ cua: true }).
// Overridable through EVAL_AGENT_MODELS_CUA.
const AGENT_MODELS_CUA = readModelListEnv("EVAL_AGENT_MODELS_CUA") ?? [
  "openai/computer-use-preview-2025-03-11",
  "anthropic/claude-sonnet-4-20250514",
  "google/gemini-2.5-computer-use-preview-10-2025",
];

// Pairs each model name with the CUA flag of the list it came from.
const toAgentEntries = (modelNames: string[], cua: boolean) =>
  modelNames.map((modelName) => ({ modelName, cua }));

// Standard entries first, then CUA entries; a model present in both lists
// appears twice, once per mode.
const AGENT_MODEL_ENTRIES: AgentModelEntry[] = [
  ...toAgentEntries(AGENT_MODELS, false),
  ...toAgentEntries(AGENT_MODELS_CUA, true),
];

// Model names of all agent entries, in entry order (duplicates preserved).
const DEFAULT_AGENT_MODELS = AGENT_MODEL_ENTRIES.map(
  ({ modelName }) => modelName,
);

/**
 * getModelList:
 * Returns the model names to evaluate for the given category.
 *
 * - "agent" and "external_agent_benchmarks" always get DEFAULT_AGENT_MODELS,
 *   regardless of EVAL_PROVIDER.
 * - Otherwise, when EVAL_PROVIDER is set (compared in lower case), the result
 *   is ALL_EVAL_MODELS filtered by that provider; DEFAULT_EVAL_MODELS is not
 *   consulted in that case.
 * - Otherwise DEFAULT_EVAL_MODELS is returned.
 *
 * @param category Optional eval category.
 */
const getModelList = (category?: string): string[] => {
  const isAgentCategory =
    category === "agent" || category === "external_agent_benchmarks";
  if (isAgentCategory) {
    return DEFAULT_AGENT_MODELS;
  }

  const provider = process.env.EVAL_PROVIDER?.toLowerCase();
  if (!provider) {
    // No agent category and no provider filter: fall back to the default eval models.
    return DEFAULT_EVAL_MODELS;
  }

  return ALL_EVAL_MODELS.filter((model) =>
    filterModelByProvider(model, provider),
  );
};

/**
 * Decides whether a model name belongs to the given provider, based on the
 * model name's lower-cased prefix.
 *
 * @param model Model name as listed in ALL_EVAL_MODELS.
 * @param provider Lower-case provider name: "openai", "anthropic", "google",
 *   "together", "groq" or "cerebras".
 * @returns true when the model matches the provider. An unrecognized provider
 *   logs a warning and yields false.
 */
const filterModelByProvider = (model: string, provider: string): boolean => {
  const modelLower = model.toLowerCase();
  switch (provider) {
    case "openai":
      // OpenAI's o-series models (o3, o3-mini, o4-mini) carry no "gpt" prefix,
      // so they are matched separately as "o" followed by a digit.
      return modelLower.startsWith("gpt") || /^o\d/.test(modelLower);
    case "anthropic":
      return modelLower.startsWith("claude");
    case "google":
      return modelLower.startsWith("gemini");
    case "together":
      return ["meta-llama", "llama", "deepseek", "qwen"].some((prefix) =>
        modelLower.startsWith(prefix),
      );
    case "groq":
      return modelLower.startsWith("groq");
    case "cerebras":
      return modelLower.startsWith("cerebras");
    default:
      console.warn(
        `Unknown provider specified or model doesn't match: ${provider}`,
      );
      return false;
  }
};

// Models for the default (no category) case, computed once at module load and
// copied into a new array typed as AvailableModel.
const MODELS: AvailableModel[] = Array.from(
  getModelList(),
  (model) => model as AvailableModel,
);

/**
 * Returns the agent model entries, each carrying the `cua` flag used for test
 * case generation. The module-level array itself is returned, not a copy.
 */
const getAgentModelEntries = (): AgentModelEntry[] => {
  return AGENT_MODEL_ENTRIES;
};

export { tasksByName, MODELS, tasksConfig, getModelList, getAgentModelEntries };
export type { AgentModelEntry };


================================================
FILE: packages/evals/tasks/agent/alibaba_supplier_search.ts
================================================
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";
import { ScreenshotCollector } from "../../utils/ScreenshotCollector.js";

/**
 * Agent eval: search Alibaba for solar panels and report three suppliers.
 *
 * Flow: open alibaba.com, start periodic screenshot collection, run the agent
 * (max steps from AGENT_EVAL_MAX_STEPS, default 30), stop the collector, then
 * ask a V3Evaluator whether the task was completed, giving it the screenshots
 * and the agent's final message. The eval passes only on a "YES" verdict.
 * The browser session is closed in every case.
 */
export const alibaba_supplier_search: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  try {
    const [page] = v3.context.pages();
    await page.goto("https://www.alibaba.com/");

    // Screenshots taken during the agent run are the evidence for the evaluator.
    // NOTE(review): if agent.execute() rejects, stop() is never called on this
    // collector - confirm it does not keep running past v3.close().
    const collector = new ScreenshotCollector(v3, {
      interval: 3000,
      maxScreenshots: 15,
    });
    collector.start();

    const instruction =
      "Search for 'solar panels' on Alibaba and find 3 suppliers. For each supplier, tell me their company name, minimum order quantity, and price range if available.";
    const maxSteps = Number(process.env.AGENT_EVAL_MAX_STEPS) || 30;
    const agentResult = await agent.execute({ instruction, maxSteps });

    // Stopping the collector yields everything captured during the run.
    const screenshots = await collector.stop();

    logger.log({
      category: "evaluation",
      message: `Collected ${screenshots.length} screenshots for evaluation`,
      level: 1,
    });

    const judge = new V3Evaluator(v3);
    const verdict = await judge.ask({
      question: `did the agent complete this task successfully? ${instruction}`,
      screenshot: screenshots,
      agentReasoning: agentResult.message,
    });

    console.log(`reasoning: ${verdict.reasoning}`);

    if (verdict.evaluation === "YES") {
      return {
        _success: true,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }
    // Any other verdict is a failure; surface the evaluator's reasoning.
    return {
      _success: false,
      message: verdict.reasoning,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      message: error instanceof Error ? error.message : String(error),
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/all_recipes.ts
================================================
import { V3Evaluator } from "@browserbasehq/stagehand";
import { EvalFunction } from "../../types/evals.js";

/**
 * Agent eval: find a well-reviewed Beef Wellington recipe on Allrecipes.
 *
 * Flow: open allrecipes.com, create the evaluator, run the agent (max steps
 * from AGENT_EVAL_MAX_STEPS, default 30), then ask the evaluator whether a
 * Beef Wellington recipe was found. The eval passes only on a "YES" verdict.
 * A thrown error is returned in the `error` field. The browser session is
 * closed in every case.
 */
export const all_recipes: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  try {
    const [page] = v3.context.pages();
    await page.goto("https://www.allrecipes.com/");
    const judge = new V3Evaluator(v3);

    const instruction =
      "Search for a recipe for Beef Wellington on Allrecipes that has at least 200 reviews and an average rating of 4.5 stars or higher. List the main ingredients required for the dish.";
    const maxSteps = Number(process.env.AGENT_EVAL_MAX_STEPS) || 30;
    const agentResult = await agent.execute({ instruction, maxSteps });

    const verdict = await judge.ask({
      question: "Did the agent find a recipe for Beef Wellington",
    });

    logger.log(agentResult);

    if (verdict.evaluation === "YES") {
      return {
        _success: true,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }

    // Any other verdict is a failure; surface the evaluator's reasoning.
    return {
      _success: false,
      message: verdict.reasoning,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      error,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/amazon_shoes_cart.ts
================================================
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";
import { ScreenshotCollector } from "../../utils/ScreenshotCollector.js";

/**
 * Agent eval: add size-14 black running shoes to the Amazon cart and stop at
 * the login page.
 *
 * Flow: open amazon.com, start periodic screenshot collection, run the agent
 * (max steps from AGENT_EVAL_MAX_STEPS, default 40), stop the collector, then
 * ask a V3Evaluator whether the task was completed, giving it the screenshots
 * and the agent's final message. The eval passes only on a "YES" verdict.
 * The browser session is closed in every case.
 */
export const amazon_shoes_cart: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  try {
    const [page] = v3.context.pages();
    await page.goto("https://www.amazon.com");

    // Screenshots taken during the agent run are the evidence for the evaluator.
    // NOTE(review): if agent.execute() rejects, stop() is never called on this
    // collector - confirm it does not keep running past v3.close().
    const collector = new ScreenshotCollector(v3, {
      interval: 3000,
      maxScreenshots: 15,
    });
    collector.start();

    const instruction =
      "go to amazon, and add a pair of black running shoes to cart in size 14. stop after you add the item to cart, and reach the login page";
    const maxSteps = Number(process.env.AGENT_EVAL_MAX_STEPS) || 40;
    const agentResult = await agent.execute({ instruction, maxSteps });

    // Stopping the collector yields everything captured during the run.
    const screenshots = await collector.stop();

    logger.log({
      category: "evaluation",
      message: `Collected ${screenshots.length} screenshots for evaluation`,
      level: 1,
    });

    const judge = new V3Evaluator(v3);
    const verdict = await judge.ask({
      question: `did the agent complete this task successfully? ${instruction}`,
      screenshot: screenshots,
      agentReasoning: agentResult.message,
    });

    console.log(`reasoning: ${verdict.reasoning}`);

    if (verdict.evaluation === "YES") {
      return {
        _success: true,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }
    // Any other verdict is a failure; surface the evaluator's reasoning.
    return {
      _success: false,
      message: verdict.reasoning,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      message: error instanceof Error ? error.message : String(error),
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/apple_trade_in.ts
================================================
//this eval is expected to fail due to issues scrolling within the trade in dialog
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";

/**
 * Agent eval: look up the trade-in value of an iPhone 13 Pro Max in good
 * condition on apple.com.
 *
 * Flow: open the Apple trade-in page, run the agent (max steps from
 * AGENT_EVAL_MAX_STEPS, default 30), then ask a V3Evaluator - with screenshots
 * disabled and "360" supplied as the answer - whether the value was found.
 * The eval passes only on a "YES" verdict. The browser session is closed in
 * every case.
 */
export const apple_trade_in: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto("https://www.apple.com/shop/trade-in");
    const evaluator = new V3Evaluator(v3);
    await agent.execute({
      instruction:
        "Find out the trade-in value for an iPhone 13 Pro Max in good condition on the Apple website.",
      maxSteps: Number(process.env.AGENT_EVAL_MAX_STEPS) || 30,
    });

    const { evaluation, reasoning } = await evaluator.ask({
      question:
        "Did the agent find the trade-in value for an iPhone 13 Pro Max in good condition on the Apple website?",
      screenshot: false,
      answer: "360",
    });

    const success = evaluation === "YES";

    if (!success) {
      return {
        _success: false,
        message: reasoning,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }
    return {
      _success: true,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    // Thrown values are not guaranteed to be Error instances; normalize them so
    // the failure message is never undefined.
    const errorMessage = error instanceof Error ? error.message : String(error);
    return {
      _success: false,
      message: errorMessage,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/apple_tv.ts
================================================
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";

/**
 * Agent eval: find the Apple TV 4K dimensions and Siri Remote features on
 * apple.com.
 *
 * Flow: open apple.com, run the agent (max steps from AGENT_EVAL_MAX_STEPS,
 * default 50), then ask a V3Evaluator whether the agent's final message
 * contains the expected height and width (1.2 and 3.66). The eval passes only
 * on a "YES" verdict; on failure the agent's own message is returned. The
 * browser session is closed in every case.
 */
export const apple_tv: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto("https://www.apple.com/");

    const agentResult = await agent.execute({
      instruction:
        "Identify the size and weight for the Apple TV 4K and list the Siri Remote features introduced.",
      maxSteps: Number(process.env.AGENT_EVAL_MAX_STEPS) || 50,
    });

    const evaluator = new V3Evaluator(v3);
    const result = await evaluator.ask({
      question:
        "did the agent find the height and width of the Apple TV 4K in its reasoning which is 1.2 and 3.66?",
      answer: agentResult.message,
    });

    const success = result.evaluation === "YES";
    if (!success) {
      return {
        _success: false,
        message: agentResult.message,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }
    return {
      _success: true,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    // Thrown values are not guaranteed to be Error instances; normalize them so
    // the failure message is never undefined.
    const errorMessage = error instanceof Error ? error.message : String(error);
    return {
      _success: false,
      message: errorMessage,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/arxiv_gpt_report.ts
================================================
// The agent often fails on this one.
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";
import { ScreenshotCollector } from "../../utils/ScreenshotCollector.js";

/**
 * Agent eval: from arxiv.org, the agent must find when v3 of the
 * 'GPT-4 Technical Report' was submitted. Screenshots gathered while the agent
 * runs, plus the agent's final message, are handed to a V3Evaluator.
 *
 * Resolves to `{ _success, debugUrl, sessionUrl, logs }`; on failure a `message`
 * carries the evaluator's reasoning or the thrown error's text. `v3` is closed
 * on every path.
 */
export const arxiv_gpt_report: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  // Session identifiers repeated on every result object.
  const session = { debugUrl, sessionUrl };

  try {
    const [startPage] = v3.context.pages();
    await startPage.goto("https://arxiv.org/");

    // Capture periodic screenshots for the duration of the agent run.
    const collector = new ScreenshotCollector(v3, {
      interval: 3000,
      maxScreenshots: 15,
    });
    collector.start();

    const task =
      "Find the paper 'GPT-4 Technical Report', when was v3 submitted?";
    const stepBudget = Number(process.env.AGENT_EVAL_MAX_STEPS) || 25;
    const outcome = await agent.execute({
      instruction: task,
      maxSteps: stepBudget,
    });

    const frames = await collector.stop();
    logger.log({
      category: "evaluation",
      message: `Collected ${frames.length} screenshots for evaluation`,
      level: 1,
    });

    // Expected answer noted by the task author: Mon, 27 Mar 2023 17:46:54 UTC
    const verdict = await new V3Evaluator(v3).ask({
      question: `Did the agent complete this task successfully? ${task}, the correct answer the agent should have provided is '03-27-2023'`,
      screenshot: frames,
      agentReasoning: outcome.message,
    });

    console.log(`reasoning: ${verdict.reasoning}`);

    if (verdict.evaluation === "YES") {
      return { _success: true, ...session, logs: logger.getLogs() };
    }
    return {
      _success: false,
      message: verdict.reasoning,
      ...session,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      message: error instanceof Error ? error.message : String(error),
      ...session,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/columbia_tuition.ts
================================================
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";
import { ScreenshotCollector } from "../../utils/ScreenshotCollector.js";

/**
 * Agent eval: from columbia.edu, the agent must use site search to find and
 * extract undergraduate tuition fee information without leaving the site.
 * Screenshots taken during the run and the agent's final message are judged by
 * a V3Evaluator.
 *
 * Resolves to `{ _success, debugUrl, sessionUrl, logs }`; on failure a `message`
 * carries the evaluator's reasoning or the thrown error's text. `v3` is closed
 * on every path.
 */
export const columbia_tuition: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  // Session identifiers repeated on every result object.
  const session = { debugUrl, sessionUrl };

  try {
    const [homePage] = v3.context.pages();
    await homePage.goto("https://columbia.edu/");

    // Record the agent's journey as periodic screenshots.
    const recorder = new ScreenshotCollector(v3, {
      interval: 3000,
      maxScreenshots: 15,
    });
    recorder.start();

    const task =
      "Use the search functionality to locate pages detailing tuition and fees, then extract the published tuition fee information for undergraduate programs. Only use http://columbia.edu to achieve the task. Don't go to any other site. The task is achievable with just navigation from this site.";
    const stepBudget = Number(process.env.AGENT_EVAL_MAX_STEPS) || 50;
    const outcome = await agent.execute({
      instruction: task,
      maxSteps: stepBudget,
    });

    // The run is over: stop recording and take everything captured so far.
    const frames = await recorder.stop();
    logger.log({
      category: "evaluation",
      message: `Collected ${frames.length} screenshots for evaluation`,
      level: 1,
    });

    const verdict = await new V3Evaluator(v3).ask({
      question: `did the agent complete this task successfully? ${task}`,
      screenshot: frames,
      agentReasoning: outcome.message,
    });

    console.log(`reasoning: ${verdict.reasoning}`);

    if (verdict.evaluation === "YES") {
      return { _success: true, ...session, logs: logger.getLogs() };
    }
    return {
      _success: false,
      message: verdict.reasoning,
      ...session,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      message: error instanceof Error ? error.message : String(error),
      ...session,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/flipkart_laptops.ts
================================================
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";
import { ScreenshotCollector } from "../../utils/ScreenshotCollector.js";

/**
 * Agent eval: on flipkart.com, the agent must filter the 'Laptops' section by
 * 'Dell' and report the average discount of the first three results without
 * leaving the site. Screenshots taken during the run and the agent's final
 * message are judged by a V3Evaluator.
 *
 * Resolves to `{ _success, debugUrl, sessionUrl, logs }`; on failure a `message`
 * carries the evaluator's reasoning or the thrown error's text. `v3` is closed
 * on every path.
 */
export const flipkart_laptops: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  // Session identifiers repeated on every result object.
  const session = { debugUrl, sessionUrl };

  try {
    const [storefront] = v3.context.pages();
    await storefront.goto("https://www.flipkart.com/");

    // Record the agent's journey as periodic screenshots.
    const recorder = new ScreenshotCollector(v3, {
      interval: 3000,
      maxScreenshots: 15,
    });
    recorder.start();

    const task =
      "In the 'Laptops' section, apply the filter for 'Dell' and extract the average discount percentage on the first 3 Dell laptops displayed. Only use http://flipkart.com to achieve the task. Don't go to any other site. The task is achievable with just navigation from this site.";
    const stepBudget = Number(process.env.AGENT_EVAL_MAX_STEPS) || 50;
    const outcome = await agent.execute({
      instruction: task,
      maxSteps: stepBudget,
    });

    // The run is over: stop recording and take everything captured so far.
    const frames = await recorder.stop();
    logger.log({
      category: "evaluation",
      message: `Collected ${frames.length} screenshots for evaluation`,
      level: 1,
    });

    const verdict = await new V3Evaluator(v3).ask({
      question: `did the agent complete this task successfully? ${task}`,
      screenshot: frames,
      agentReasoning: outcome.message,
    });

    console.log(`reasoning: ${verdict.reasoning}`);

    if (verdict.evaluation === "YES") {
      return { _success: true, ...session, logs: logger.getLogs() };
    }
    return {
      _success: false,
      message: verdict.reasoning,
      ...session,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      message: error instanceof Error ? error.message : String(error),
      ...session,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/gaia.ts
================================================
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";

/**
 * Data-driven GAIA agent eval
 * - Expects per-test params injected via eval runner: { id, level, web, ques, expected }
 * - Starts at `web`, runs the agent with `ques` as instruction
 * - The system prompt asks the agent to finish with a line like: "Final Answer: <value>"
 * - Marks success when a V3Evaluator answers "YES" to whether the agent's final
 *   message provides the `expected` answer (no screenshot is used)
 * - Returns early with an `error` string when `web` or `ques` is missing
 * - Closes `v3` on every path, like the other agent tasks in this directory
 */
export const gaia: EvalFunction = async ({
  v3,
  logger,
  debugUrl,
  sessionUrl,
  modelName,
  input,
}) => {
  try {
    const params = ((input && input.params) || {}) as {
      id?: string;
      level?: number;
      web?: string;
      ques?: string;
      expected?: string;
    };

    if (!params.web || !params.ques) {
      logger.error({
        category: "gaia",
        level: 0,
        message: `Missing GAIA params (web, ques).`,
        auxiliary: {
          params: { value: JSON.stringify(params), type: "object" },
        },
      });
      return {
        _success: false,
        error: `Missing GAIA params (web, ques). Got: ${JSON.stringify(params)}`,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }
    const page = v3.context.pages()[0];
    await page.goto(params.web);

    // This task builds its own agent so the system prompt can include the
    // title of the page the run starts on.
    const agent = v3.agent({
      model: modelName,
      systemPrompt: `You are a helpful assistant that must solve the task by browsing. You must produce a single line at the end like: "Final Answer: <answer>". Do not ask follow up questions. Current page: ${await page.title()}`,
    });

    const result = await agent.execute({
      instruction: params.ques,
      maxSteps: Number(process.env.AGENT_EVAL_MAX_STEPS) || 50,
    });

    const expected = params.expected;
    const evaluator = new V3Evaluator(v3);
    const evalResult = await evaluator.ask({
      question: `Did the agent provide the expected answer: "${expected}"?`,
      answer: result?.message || "",
      screenshot: false,
    });

    return {
      _success: evalResult.evaluation === "YES",
      reasoning: evalResult.reasoning,
      expectedAnswer: expected,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    logger.error({
      category: "gaia",
      level: 0,
      message: `Unhandled error in GAIA task`,
      auxiliary: {
        error: {
          value: error instanceof Error ? error.message : String(error),
          type: "string",
        },
        trace: {
          value: error instanceof Error && error.stack ? error.stack : "",
          type: "string",
        },
      },
    });
    return {
      _success: false,
      error,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    // Release the browser session whether the run passed, failed or threw.
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/github.ts
================================================
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";

/**
 * Agent eval: from github.com, the agent must find a Ruby repository updated in
 * the past 3 days with at least 1000 stars. After the run, a V3Evaluator is
 * asked whether the page shows such a repository.
 *
 * Resolves to `{ _success, debugUrl, sessionUrl, logs }`; a failed evaluation
 * adds `message` (the evaluator's reasoning) and a thrown error is returned
 * as-is under `error`. `v3` is closed on every path.
 */
export const github: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto("https://github.com/");
    const evaluator = new V3Evaluator(v3);
    const agentResult = await agent.execute({
      instruction:
        "Find a Ruby repository on GitHub that has been updated in the past 3 days and has at least 1000 stars.",
      maxSteps: Number(process.env.AGENT_EVAL_MAX_STEPS) || 20,
    });
    logger.log(agentResult);

    // Phrase the check as an explicit yes/no question (as the sibling tasks
    // do) so the evaluator is not handed a bare sentence fragment to judge.
    const { evaluation, reasoning } = await evaluator.ask({
      question:
        "Does the page show a Ruby repository on GitHub that has been updated in the past 3 days and has at least 1000 stars?",
    });

    if (evaluation !== "YES") {
      return {
        _success: false,
        message: reasoning,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }

    return {
      _success: true,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      error,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/github_react_version.ts
================================================
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";
import { ScreenshotCollector } from "../../utils/ScreenshotCollector.js";

/**
 * Agent eval: from github.com, the agent must report React's latest release
 * version and its publication date. Screenshots taken during the run and the
 * agent's final message are judged by a V3Evaluator.
 *
 * Resolves to `{ _success, debugUrl, sessionUrl, logs }`; on failure a `message`
 * carries the evaluator's reasoning or the thrown error's text. `v3` is closed
 * on every path.
 */
export const github_react_version: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  v3,
  agent,
}) => {
  // Session identifiers repeated on every result object.
  const session = { debugUrl, sessionUrl };

  try {
    const [landing] = v3.context.pages();
    await landing.goto("https://github.com/");

    // Capture periodic screenshots for the duration of the agent run.
    const collector = new ScreenshotCollector(v3, {
      interval: 3000,
      maxScreenshots: 15,
    });
    collector.start();

    const task =
      "Check the latest release version of React and the date it was published.";
    const stepBudget = Number(process.env.AGENT_EVAL_MAX_STEPS) || 20;
    const outcome = await agent.execute({
      instruction: task,
      maxSteps: stepBudget,
    });

    // The run is over: stop capturing and take everything gathered so far.
    const frames = await collector.stop();
    logger.log({
      category: "evaluation",
      message: `Collected ${frames.length} screenshots for evaluation`,
      level: 1,
    });

    const verdict = await new V3Evaluator(v3).ask({
      question: `Did the agent complete this task successfully? ${task}`,
      screenshot: frames,
      agentReasoning: outcome.message,
    });

    console.log(`reasoning: ${verdict.reasoning}`);

    if (verdict.evaluation === "YES") {
      return { _success: true, ...session, logs: logger.getLogs() };
    }
    return {
      _success: false,
      message: verdict.reasoning,
      ...session,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      message: error instanceof Error ? error.message : String(error),
      ...session,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/google_flights.ts
================================================
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";

/**
 * Agent eval: on Google Flights, the agent must search for flights from San
 * Francisco to New York for next weekend. Afterwards a V3Evaluator is asked
 * whether the page shows actual flight results.
 *
 * Resolves to `{ _success, observations, debugUrl, sessionUrl, logs }`, where
 * `observations` is the evaluator's reasoning (or a fixed notice when the
 * evaluator answered neither "YES" nor "NO"). A thrown error is returned as-is
 * under `error`. `v3` is closed on every path.
 */
export const google_flights: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  // Session identifiers repeated on every result object.
  const session = { debugUrl, sessionUrl };

  try {
    const [flightsPage] = v3.context.pages();
    await flightsPage.goto("https://google.com/travel/flights");

    const stepBudget = Number(process.env.AGENT_EVAL_MAX_STEPS) || 30;
    const outcome = await agent.execute({
      instruction:
        "Search for flights from San Francisco to New York for next weekend",
      maxSteps: stepBudget,
    });
    logger.log(outcome);

    const { evaluation, reasoning } = await new V3Evaluator(v3).ask({
      question:
        "Does the page show flights (options, available flights, not a search form) from San Francisco to New York?",
    });

    switch (evaluation) {
      case "YES":
        return {
          _success: true,
          observations: reasoning,
          ...session,
          logs: logger.getLogs(),
        };
      case "NO":
        return {
          _success: false,
          observations: reasoning,
          ...session,
          logs: logger.getLogs(),
        };
      default:
        // Anything other than a clear YES/NO counts as a failed evaluation.
        return {
          _success: false,
          observations: "Evaluator provided an invalid response",
          ...session,
          logs: logger.getLogs(),
        };
    }
  } catch (error) {
    return {
      _success: false,
      error,
      ...session,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/google_maps.ts
================================================
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";
import { ScreenshotCollector } from "../../utils/ScreenshotCollector.js";

/**
 * Agent eval: on Google Maps, the agent must find the driving time from San
 * Francisco to New York. Screenshots taken during the run and the agent's final
 * message are judged by a V3Evaluator.
 *
 * Resolves to `{ _success, debugUrl, sessionUrl, logs }`; on failure a `message`
 * carries the evaluator's reasoning or the thrown error's text. `v3` is closed
 * on every path.
 */
export const google_maps: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  // Session identifiers repeated on every result object.
  const session = { debugUrl, sessionUrl };

  try {
    const [mapPage] = v3.context.pages();
    await mapPage.goto("https://maps.google.com");

    // Capture periodic screenshots for the duration of the agent run.
    const collector = new ScreenshotCollector(v3, {
      interval: 3000,
      maxScreenshots: 15,
    });
    collector.start();

    const task =
      "How long does it take to get from San Francisco to New York driving?";
    const stepBudget = Number(process.env.AGENT_EVAL_MAX_STEPS) || 15;
    const outcome = await agent.execute({
      instruction: task,
      maxSteps: stepBudget,
    });

    const frames = await collector.stop();
    logger.log({
      category: "evaluation",
      message: `Collected ${frames.length} screenshots for evaluation`,
      level: 1,
    });

    const verdict = await new V3Evaluator(v3).ask({
      question: `Did the agent complete this task successfully? ${task}`,
      screenshot: frames,
      agentReasoning: outcome.message,
    });

    console.log(`reasoning: ${verdict.reasoning}`);

    if (verdict.evaluation === "YES") {
      return { _success: true, ...session, logs: logger.getLogs() };
    }
    return {
      _success: false,
      message: verdict.reasoning,
      ...session,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      message: error instanceof Error ? error.message : String(error),
      ...session,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/google_maps_2.ts
================================================
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";
import { ScreenshotCollector } from "../../utils/ScreenshotCollector.js";

/**
 * Agent eval: on Google Maps, the agent must search for the fastest walking
 * route from La Puerta de Alcalá to La Puerta del Sol. Screenshots taken during
 * the run and the agent's final message are judged by a V3Evaluator.
 *
 * Resolves to `{ _success, debugUrl, sessionUrl, logs }`; on failure a `message`
 * carries the evaluator's reasoning or the thrown error's text. `v3` is closed
 * on every path.
 */
export const google_maps_2: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  // Session identifiers repeated on every result object.
  const session = { debugUrl, sessionUrl };

  try {
    const [mapPage] = v3.context.pages();
    await mapPage.goto("https://maps.google.com");

    // Capture periodic screenshots for the duration of the agent run.
    const collector = new ScreenshotCollector(v3, {
      interval: 3000,
      maxScreenshots: 15,
    });
    collector.start();

    const task =
      "Search for the fastest walking route from La Puerta de Alcalá to La Puerta del Sol";
    const stepBudget = Number(process.env.AGENT_EVAL_MAX_STEPS) || 20;
    const outcome = await agent.execute({
      instruction: task,
      maxSteps: stepBudget,
    });

    const frames = await collector.stop();
    logger.log({
      category: "evaluation",
      message: `Collected ${frames.length} screenshots for evaluation`,
      level: 1,
    });

    const verdict = await new V3Evaluator(v3).ask({
      question: `Did the agent complete this task successfully? ${task}`,
      screenshot: frames,
      agentReasoning: outcome.message,
    });

    console.log(`reasoning: ${verdict.reasoning}`);

    const passed = verdict.evaluation === "YES";
    if (passed) {
      return { _success: true, ...session, logs: logger.getLogs() };
    }

    return {
      _success: false,
      message: verdict.reasoning,
      ...session,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      message: error instanceof Error ? error.message : String(error),
      ...session,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/google_maps_3.ts
================================================
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";

/**
 * Agent eval: on Google Maps, the agent must search for locksmiths in Texas
 * City that are open now but not open 24 hours. Afterwards a V3Evaluator is
 * asked whether the page shows such a result.
 *
 * Resolves to `{ _success, debugUrl, sessionUrl, logs }`; on failure a `message`
 * carries the evaluator's reasoning or the thrown error's text. `v3` is closed
 * on every path.
 */
export const google_maps_3: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto("https://maps.google.com/");
    const evaluator = new V3Evaluator(v3);
    await agent.execute({
      instruction:
        "Search for locksmiths open now but not open 24 hours in Texas City.",
      maxSteps: Number(process.env.AGENT_EVAL_MAX_STEPS) || 35,
    });

    const { evaluation, reasoning } = await evaluator.ask({
      question:
        "Does the page show a locksmiths open now but not open 24 hours in Texas City?",
    });

    if (evaluation !== "YES") {
      return {
        _success: false,
        message: reasoning,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }
    return {
      _success: true,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    // A thrown value is not guaranteed to be an Error, so narrow before reading
    // `.message` (matches the handling used by the sibling agent tasks).
    const errorMessage = error instanceof Error ? error.message : String(error);
    return {
      _success: false,
      message: errorMessage,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/google_shopping.ts
================================================
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";

/**
 * Agent eval: on Google Shopping, the agent must find a black drip coffee maker
 * that is on sale for $25-60. Afterwards a V3Evaluator is asked whether the
 * page shows such a product.
 *
 * Resolves to `{ _success, debugUrl, sessionUrl, logs }`; a failed evaluation
 * adds `message` (the evaluator's reasoning) and a thrown error is returned
 * as-is under `error`. `v3` is closed on every path.
 */
export const google_shopping: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  // Session identifiers repeated on every result object.
  const session = { debugUrl, sessionUrl };

  try {
    const [shopPage] = v3.context.pages();
    await shopPage.goto("https://www.google.com/shopping");

    const stepBudget = Number(process.env.AGENT_EVAL_MAX_STEPS) || 20;
    const outcome = await agent.execute({
      instruction:
        "Find a drip coffee maker that is on sale and within $25-60 and has a black finish",
      maxSteps: stepBudget,
    });
    logger.log(outcome);

    const verdict = await new V3Evaluator(v3).ask({
      question:
        "Does the page show a drip coffee maker that is on sale and within $25-60 and has a black finish?",
    });

    if (verdict.evaluation === "YES") {
      return { _success: true, ...session, logs: logger.getLogs() };
    }

    return {
      _success: false,
      message: verdict.reasoning,
      ...session,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      error,
      ...session,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/hotel_booking.ts
================================================
//this eval is expected to fail.
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";

/**
 * Agent eval: on booking.com, the agent must find a Sydney hotel rated 8 or
 * higher with free Wi-Fi and parking for a four-night stay starting
 * December 10, 2025. Afterwards a V3Evaluator is asked whether the page shows
 * such a hotel.
 *
 * Resolves to `{ _success, debugUrl, sessionUrl, logs }`; a failed evaluation
 * adds `message` (the evaluator's reasoning) and a thrown error is returned
 * as-is under `error`. `v3` is closed on every path.
 */
export const hotel_booking: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  // Session identifiers repeated on every result object.
  const session = { debugUrl, sessionUrl };

  try {
    const [bookingPage] = v3.context.pages();
    await bookingPage.goto("https://www.booking.com/");

    const stepBudget = Number(process.env.AGENT_EVAL_MAX_STEPS) || 20;
    const outcome = await agent.execute({
      instruction:
        "Find a hotel in Sydney with a rating of 8 or higher, providing free Wi-Fi and parking, available for a four-night stay starting on December 10, 2025.",
      maxSteps: stepBudget,
    });
    logger.log(outcome);

    const verdict = await new V3Evaluator(v3).ask({
      question:
        "Does the page show a hotel in Sydney with a rating of 8 or higher, providing free Wi-Fi and parking, available for a four-night stay starting on December 10, 2025?",
    });

    if (verdict.evaluation === "YES") {
      return { _success: true, ...session, logs: logger.getLogs() };
    }

    return {
      _success: false,
      message: verdict.reasoning,
      ...session,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      error,
      ...session,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/hotels_paris_amenities.ts
================================================
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";
import { ScreenshotCollector } from "../../utils/ScreenshotCollector.js";

/**
 * Agent eval: on hotels.com, the agent must filter Paris properties available
 * next month that offer spa amenities and bars, then list the amenities of the
 * first three hotels without leaving the site. Screenshots taken during the run
 * and the agent's final message are judged by a V3Evaluator.
 *
 * Resolves to `{ _success, debugUrl, sessionUrl, logs }`; on failure a `message`
 * carries the evaluator's reasoning or the thrown error's text. `v3` is closed
 * on every path.
 */
export const hotels_paris_amenities: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  // Session identifiers repeated on every result object.
  const session = { debugUrl, sessionUrl };

  try {
    const [hotelsPage] = v3.context.pages();
    await hotelsPage.goto("https://www.hotels.com/");

    // Record the agent's journey as periodic screenshots.
    const recorder = new ScreenshotCollector(v3, {
      interval: 3000,
      maxScreenshots: 15,
    });
    recorder.start();

    const task =
      "Filter search results for properties in Paris available next month that offer spa amenities and bars, and list the amenities of the first three hotels. Only use http://hotels.com to achieve the task. Don't go to any other site. The task is achievable with just navigation from this site.";
    const stepBudget = Number(process.env.AGENT_EVAL_MAX_STEPS) || 40;
    const outcome = await agent.execute({
      instruction: task,
      maxSteps: stepBudget,
    });

    // The run is over: stop recording and take everything captured so far.
    const frames = await recorder.stop();
    logger.log({
      category: "evaluation",
      message: `Collected ${frames.length} screenshots for evaluation`,
      level: 1,
    });

    const verdict = await new V3Evaluator(v3).ask({
      question: `did the agent complete this task successfully? ${task}`,
      screenshot: frames,
      agentReasoning: outcome.message,
    });

    console.log(`reasoning: ${verdict.reasoning}`);

    if (verdict.evaluation === "YES") {
      return { _success: true, ...session, logs: logger.getLogs() };
    }
    return {
      _success: false,
      message: verdict.reasoning,
      ...session,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      message: error instanceof Error ? error.message : String(error),
      ...session,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/hugging_face.ts
================================================
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";

/**
 * Agent eval: on huggingface.co, the agent must find the most-liked model with
 * an Apache-2.0 license. A V3Evaluator then checks, without a screenshot,
 * whether the agent's final message names the expected model.
 *
 * Resolves to `{ _success, debugUrl, sessionUrl, logs }`; on failure a `message`
 * carries the evaluator's reasoning or the thrown error's text. `v3` is closed
 * on every path.
 */
export const hugging_face: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  try {
    const evaluator = new V3Evaluator(v3);
    const page = v3.context.pages()[0];
    await page.goto("https://huggingface.co/");
    const agentResult = await agent.execute({
      instruction:
        "Search for a model on Hugging Face with an Apache-2.0 license that has received the highest number of likes.",
      maxSteps: Number(process.env.AGENT_EVAL_MAX_STEPS) || 20,
    });
    console.log(`agentResult: ${agentResult.message}`);
    const { evaluation, reasoning } = await evaluator.ask({
      question:
        "Does the message mention 'kokoro-82m' or 'hexgrad/Kokoro-82M'?",
      answer: agentResult.message || "",
      screenshot: false,
    });

    const success = evaluation === "YES";

    console.log(`reasoning: ${reasoning}`);
    if (!success) {
      return {
        _success: false,
        message: reasoning,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }
    return {
      _success: true,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    // A thrown value is not guaranteed to be an Error, so narrow before reading
    // `.message` (matches the handling used by the sibling agent tasks).
    const errorMessage = error instanceof Error ? error.message : String(error);
    return {
      _success: false,
      message: errorMessage,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/iframe_form.ts
================================================
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";

/**
 * Agent eval: on the iframe form-filling test site, the agent fills the name
 * field and then the email field in two separate runs. A V3Evaluator checks
 * each field after its run; the page is scrolled before the second check.
 *
 * Resolves to `{ _success, observations, debugUrl, sessionUrl, logs }`. The run
 * succeeds only when both checks answer "YES"; an answer that is neither "YES"
 * nor "NO" ends the eval immediately as a failure. A thrown error is returned
 * as-is under `error`. `v3` is closed on every path.
 */
export const iframe_form: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  // Session identifiers repeated on every result object.
  const session = { debugUrl, sessionUrl };
  // True when the evaluator produced one of the two recognised verdicts.
  const isClearVerdict = (value: unknown) => value === "YES" || value === "NO";

  try {
    const [formPage] = v3.context.pages();
    await formPage.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/iframe-form-filling/",
    );

    // Step 1: name field.
    const nameRun = await agent.execute({
      instruction: "Fill in the form name with 'John Smith'",
      maxSteps: Number(process.env.AGENT_EVAL_MAX_STEPS) || 5,
    });
    logger.log(nameRun);

    const judge = new V3Evaluator(v3);
    const nameCheck = await judge.ask({
      question: "Is the form name input filled with 'John Smith'?",
    });

    if (!isClearVerdict(nameCheck.evaluation)) {
      return {
        _success: false,
        observations: "Evaluator provided an invalid response",
        ...session,
        logs: logger.getLogs(),
      };
    }

    // Step 2: email field.
    const emailRun = await agent.execute({
      instruction: "Fill in the form email with 'john.smith@example.com'",
      maxSteps: Number(process.env.AGENT_EVAL_MAX_STEPS) || 3,
    });
    logger.log(emailRun);

    await formPage.scroll(0, 0, 0, -1000);
    const emailCheck = await judge.ask({
      question: "Is the form email input filled with 'john.smith@example.com'?",
      screenshot: true,
    });

    if (!isClearVerdict(emailCheck.evaluation)) {
      return {
        _success: false,
        observations: "Evaluator provided an invalid response",
        ...session,
        logs: logger.getLogs(),
      };
    }

    const bothFilled =
      nameCheck.evaluation === "YES" && emailCheck.evaluation === "YES";
    return {
      _success: bothFilled,
      observations: bothFilled
        ? "All fields were filled correctly"
        : "One or more fields were not filled correctly",
      ...session,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      error,
      ...session,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/iframe_form_multiple.ts
================================================
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";
import { ScreenshotCollector } from "../../utils/ScreenshotCollector.js";

/**
 * Agent eval: fill several fields of a form hosted on the iframe
 * form-filling test site.
 *
 * The agent is asked to fill in the first name, last name and email and to
 * select the email radio button. Screenshots collected while the agent runs,
 * together with the agent's final message, are handed to a V3Evaluator which
 * decides whether the task succeeded.
 *
 * @returns An object with `_success`, `debugUrl`, `sessionUrl` and `logs`.
 * Failures also carry `message`: the evaluator's reasoning, or the text of
 * the error that was caught.
 */
export const iframe_form_multiple: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  // Tracks a collector that has been started but not yet stopped, so that
  // `finally` can stop it when the agent (or anything after it) throws.
  let activeCollector: ScreenshotCollector | null = null;

  try {
    const page = v3.context.pages()[0];
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/iframe-form-filling/",
    );

    // Start collecting screenshots throughout the agent's journey
    const collector = new ScreenshotCollector(v3, {
      interval: 3000,
      maxScreenshots: 15,
    });
    activeCollector = collector;
    collector.start();

    const instruction =
      "Fill in the first name with 'John', the last name with 'Smith', the email with 'john.smith@example.com', and select the email radio button as preferred contact method";
    const agentResult = await agent.execute({
      instruction,
      maxSteps: Number(process.env.AGENT_EVAL_MAX_STEPS) || 10,
    });

    // Stop and collect all screenshots from the journey
    const screenshots = await collector.stop();
    // Stopped cleanly; nothing is left for `finally` to clean up.
    activeCollector = null;

    logger.log({
      category: "evaluation",
      message: `Collected ${screenshots.length} screenshots for evaluation`,
      level: 1,
    });

    const evaluator = new V3Evaluator(v3);
    const { evaluation, reasoning } = await evaluator.ask({
      question: `Did the agent complete this task successfully? ${instruction}. The form should have: first name = 'John', last name = 'Smith', email = 'john.smith@example.com', and the email radio button selected as preferred contact method.`,
      screenshot: screenshots,
      agentReasoning: agentResult.message,
    });

    console.log(`reasoning: ${reasoning}`);

    if (evaluation !== "YES") {
      return {
        _success: false,
        message: reasoning,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }
    return {
      _success: true,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    const errorMessage = error instanceof Error ? error.message : String(error);
    return {
      _success: false,
      message: errorMessage,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    // Stop a still-running collector before the session is closed.
    if (activeCollector) {
      try {
        await activeCollector.stop();
      } catch {
        // Best-effort cleanup; the eval result has already been decided.
      }
    }
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/instacart_organic_bananas.ts
================================================
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";
import { ScreenshotCollector } from "../../utils/ScreenshotCollector.js";

/**
 * Agent eval: search Instacart for organic bananas and list the top three
 * prices with their retailers.
 *
 * Screenshots collected while the agent runs, together with the agent's
 * final message, are handed to a V3Evaluator which decides whether the task
 * succeeded.
 *
 * @returns An object with `_success`, `debugUrl`, `sessionUrl` and `logs`.
 * Failures also carry `message`: the evaluator's reasoning, or the text of
 * the error that was caught.
 */
export const instacart_organic_bananas: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  // Tracks a collector that has been started but not yet stopped, so that
  // `finally` can stop it when the agent (or anything after it) throws.
  let activeCollector: ScreenshotCollector | null = null;

  try {
    const page = v3.context.pages()[0];
    await page.goto("https://www.instacart.com");

    // Start collecting screenshots throughout the agent's journey
    const collector = new ScreenshotCollector(v3, {
      interval: 3000,
      maxScreenshots: 15,
    });
    activeCollector = collector;
    collector.start();

    const instruction =
      "Search for organic bananas on Instacart and list the top 3 prices along with their retailer names. Only use http://instacart.com to achieve the task. Don't go to any other site. The task is achievable with just navigation from this site.";
    const agentResult = await agent.execute({
      instruction,
      maxSteps: Number(process.env.AGENT_EVAL_MAX_STEPS) || 30,
    });

    // Stop and collect all screenshots from the journey
    const screenshots = await collector.stop();
    // Stopped cleanly; nothing is left for `finally` to clean up.
    activeCollector = null;

    logger.log({
      category: "evaluation",
      message: `Collected ${screenshots.length} screenshots for evaluation`,
      level: 1,
    });

    const evaluator = new V3Evaluator(v3);
    const { evaluation, reasoning } = await evaluator.ask({
      question: `did the agent complete this task successfully? ${instruction}`,
      screenshot: screenshots,
      agentReasoning: agentResult.message,
    });

    console.log(`reasoning: ${reasoning}`);

    if (evaluation !== "YES") {
      return {
        _success: false,
        message: reasoning,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }
    return {
      _success: true,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    const errorMessage = error instanceof Error ? error.message : String(error);
    return {
      _success: false,
      message: errorMessage,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    // Stop a still-running collector before the session is closed.
    if (activeCollector) {
      try {
        await activeCollector.stop();
      } catch {
        // Best-effort cleanup; the eval result has already been decided.
      }
    }
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/kayak.ts
================================================
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";

/**
 * Agent eval: search Kayak for flights and sort the results by price.
 *
 * The agent runs two instructions in sequence (find flights, then sort by
 * price). The eval fails early unless the context holds exactly two pages
 * afterwards; otherwise a V3Evaluator is asked whether the results are
 * sorted by price.
 *
 * @returns An object with `_success`, `debugUrl`, `sessionUrl` and `logs`.
 * Failures also carry `message`: a fixed string for the page-count check,
 * the evaluator's reasoning, or the text of the error that was caught.
 */
export const kayak: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  try {
    const evaluator = new V3Evaluator(v3);
    const page = v3.context.pages()[0];
    await page.goto("https://www.kayak.com");

    await agent.execute({
      instruction: "Find flights from San Francisco to Tokyo next week",
      maxSteps: Number(process.env.AGENT_EVAL_MAX_STEPS) || 25,
    });
    await agent.execute({
      instruction: "Sort the flights by price",
      maxSteps: Number(process.env.AGENT_EVAL_MAX_STEPS) || 8,
    });

    if (v3.context.pages().length !== 2) {
      return {
        _success: false,
        message: "No new pages were opened",
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }

    const { evaluation, reasoning } = await evaluator.ask({
      question:
        "Are the flights shown sorted by price? Check the sort button in the top left corner of the page. It should show cheapest first; use this as the success criteria since the page might promote other flights and not show the list in order.",
    });

    if (evaluation !== "YES") {
      return {
        _success: false,
        message: reasoning,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }
    return {
      _success: true,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    // A thrown value is not guaranteed to be an Error; narrow it before
    // reading `.message` so non-Error throws still produce a usable message.
    const errorMessage = error instanceof Error ? error.message : String(error);
    return {
      _success: false,
      message: errorMessage,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/kfc_tenders_combo.ts
================================================
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";
import { ScreenshotCollector } from "../../utils/ScreenshotCollector.js";

/**
 * Agent eval: add a configured 5-piece Tenders Combo to the bag on kfc.com
 * for pick-up at the store closest to a given zip code.
 *
 * Screenshots collected while the agent runs, together with the agent's
 * final message, are handed to a V3Evaluator which decides whether the task
 * succeeded.
 *
 * @returns An object with `_success`, `debugUrl`, `sessionUrl` and `logs`.
 * Failures also carry `message`: the evaluator's reasoning, or the text of
 * the error that was caught.
 */
export const kfc_tenders_combo: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  // Tracks a collector that has been started but not yet stopped, so that
  // `finally` can stop it when the agent (or anything after it) throws.
  let activeCollector: ScreenshotCollector | null = null;

  try {
    const page = v3.context.pages()[0];
    await page.goto("https://www.kfc.com/");

    // Start collecting screenshots throughout the agent's journey
    const collector = new ScreenshotCollector(v3, {
      interval: 3000,
      maxScreenshots: 15,
    });
    activeCollector = collector;
    collector.start();

    const instruction =
      "Add a 5-piece Tenders Combo to my bag with Sweet Corn as the side, Sweet Tea as the drink, and both Honey BBQ and Honey Mustard sauces. Select the store closest to Zip code 10001 for pick-up tomorrow at 12:00 PM.";
    const agentResult = await agent.execute({
      instruction,
      maxSteps: Number(process.env.AGENT_EVAL_MAX_STEPS) || 40,
    });

    // Stop and collect all screenshots from the journey
    const screenshots = await collector.stop();
    // Stopped cleanly; nothing is left for `finally` to clean up.
    activeCollector = null;

    logger.log({
      category: "evaluation",
      message: `Collected ${screenshots.length} screenshots for evaluation`,
      level: 1,
    });

    const evaluator = new V3Evaluator(v3);
    const { evaluation, reasoning } = await evaluator.ask({
      question: `did the agent complete this task successfully? ${instruction}`,
      screenshot: screenshots,
      agentReasoning: agentResult.message,
    });

    console.log(`reasoning: ${reasoning}`);

    if (evaluation !== "YES") {
      return {
        _success: false,
        message: reasoning,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }
    return {
      _success: true,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    const errorMessage = error instanceof Error ? error.message : String(error);
    return {
      _success: false,
      message: errorMessage,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    // Stop a still-running collector before the session is closed.
    if (activeCollector) {
      try {
        await activeCollector.stop();
      } catch {
        // Best-effort cleanup; the eval result has already been decided.
      }
    }
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/kith.ts
================================================
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";

/**
 * Agent eval: two-stage checkout flow on kith.com.
 *
 * Stage one asks the agent to add the shoes to the cart, go to checkout and
 * fill the delivery information; a V3Evaluator then checks that the delivery
 * information was filled. Only if that passes does stage two ask the agent
 * to fill placeholder credit-card details, which the evaluator checks again.
 *
 * @returns An object with `_success`, `debugUrl`, `sessionUrl` and `logs`.
 * Failures also carry `message`: the evaluator's reasoning for the stage
 * that failed, or the text of the error that was caught.
 */
export const kith: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  try {
    const evaluator = new V3Evaluator(v3);
    const page = v3.context.pages()[0];
    await page.goto(
      "https://kith.com/collections/nike-air-force-1/products/nkcw2288-111?variant=19439468707968",
    );

    await agent.execute({
      instruction:
        "add the shoes to cart, go to checkout, and fill the delivery information. Don't fill the payment information",
      maxSteps: Number(process.env.AGENT_EVAL_MAX_STEPS) || 25,
    });

    const delivery = await evaluator.ask({
      question: "Did the agent fill the delivery information",
    });

    // Skip the payment stage entirely when delivery details were not filled.
    if (delivery.evaluation !== "YES") {
      return {
        _success: false,
        message: delivery.reasoning,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }

    await agent.execute({
      instruction:
        "fill the credit card information, do not submit the order just add placeholders",
      maxSteps: Number(process.env.AGENT_EVAL_MAX_STEPS) || 10,
    });

    const payment = await evaluator.ask({
      question: "Did the agent fill the payment information",
    });

    if (payment.evaluation !== "YES") {
      return {
        _success: false,
        message: payment.reasoning,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }

    return {
      _success: true,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    // A thrown value is not guaranteed to be an Error; narrow it before
    // reading `.message` so non-Error throws still produce a usable message.
    const errorMessage = error instanceof Error ? error.message : String(error);
    return {
      _success: false,
      message: errorMessage,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/made_in_china_supplier.ts
================================================
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";
import { ScreenshotCollector } from "../../utils/ScreenshotCollector.js";

/**
 * Agent eval: on made-in-china.com, find a verified supplier of electronic
 * components and extract the certification details from their profile.
 *
 * Screenshots collected while the agent runs, together with the agent's
 * final message, are handed to a V3Evaluator which decides whether the task
 * succeeded.
 *
 * @returns An object with `_success`, `debugUrl`, `sessionUrl` and `logs`.
 * Failures also carry `message`: the evaluator's reasoning, or the text of
 * the error that was caught.
 */
export const made_in_china_supplier: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  // Tracks a collector that has been started but not yet stopped, so that
  // `finally` can stop it when the agent (or anything after it) throws.
  let activeCollector: ScreenshotCollector | null = null;

  try {
    const page = v3.context.pages()[0];
    await page.goto("https://www.made-in-china.com");

    // Start collecting screenshots throughout the agent's journey
    const collector = new ScreenshotCollector(v3, {
      interval: 3000,
      maxScreenshots: 15,
    });
    activeCollector = collector;
    collector.start();

    const instruction =
      "Navigate to the suppliers profiles section, select a verified supplier offering 'electronic components', and extract the certification details provided on their profile. Only use http://made-in-china.com to achieve the task. Don't go to any other site. The task is achievable with just navigation from this site.";
    const agentResult = await agent.execute({
      instruction,
      maxSteps: Number(process.env.AGENT_EVAL_MAX_STEPS) || 30,
    });

    // Stop and collect all screenshots from the journey
    const screenshots = await collector.stop();
    // Stopped cleanly; nothing is left for `finally` to clean up.
    activeCollector = null;

    logger.log({
      category: "evaluation",
      message: `Collected ${screenshots.length} screenshots for evaluation`,
      level: 1,
    });

    const evaluator = new V3Evaluator(v3);
    const { evaluation, reasoning } = await evaluator.ask({
      question: `did the agent complete this task successfully? ${instruction}`,
      screenshot: screenshots,
      agentReasoning: agentResult.message,
    });

    console.log(`reasoning: ${reasoning}`);

    if (evaluation !== "YES") {
      return {
        _success: false,
        message: reasoning,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }
    return {
      _success: true,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    const errorMessage = error instanceof Error ? error.message : String(error);
    return {
      _success: false,
      message: errorMessage,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    // Stop a still-running collector before the session is closed.
    if (activeCollector) {
      try {
        await activeCollector.stop();
      } catch {
        // Best-effort cleanup; the eval result has already been decided.
      }
    }
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/nba_trades.ts
================================================
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";

/**
 * Agent eval: starting from espn.com, find the latest NBA team transaction.
 *
 * After the agent finishes, its result is logged and a V3Evaluator is asked
 * whether the agent reached the NBA transactions page.
 *
 * @returns An object with `_success`, `debugUrl`, `sessionUrl` and `logs`.
 * A negative verdict adds `message` (the evaluator's reasoning); a caught
 * exception adds `error` (the thrown value as-is).
 */
export const nba_trades: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  try {
    const page = v3.context.pages()[0];
    const evaluator = new V3Evaluator(v3);
    await page.goto("https://www.espn.com/");

    const agentResult = await agent.execute({
      instruction:
        "Find the latest Team transaction in the NBA within the past week.",
      maxSteps: Number(process.env.AGENT_EVAL_MAX_STEPS) || 25,
    });
    logger.log(agentResult);

    const { evaluation: verdict, reasoning: explanation } =
      await evaluator.ask({
        question: "Did the agent make it to the nba transactions page?",
      });

    if (verdict === "YES") {
      return {
        _success: true,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }

    return {
      _success: false,
      message: explanation,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      error,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/nvidia_hgx_driver.ts
================================================
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";
import { ScreenshotCollector } from "../../utils/ScreenshotCollector.js";

/**
 * Agent eval: on nvidia.com, find the HGX H100 driver for Ubuntu 22.04 on
 * an AMD64 CPU.
 *
 * Screenshots collected while the agent runs, together with the agent's
 * final message, are handed to a V3Evaluator which decides whether the task
 * succeeded.
 *
 * @returns An object with `_success`, `debugUrl`, `sessionUrl` and `logs`.
 * Failures also carry `message`: the evaluator's reasoning, or the text of
 * the error that was caught.
 */
export const nvidia_hgx_driver: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  // Tracks a collector that has been started but not yet stopped, so that
  // `finally` can stop it when the agent (or anything after it) throws.
  let activeCollector: ScreenshotCollector | null = null;

  try {
    const page = v3.context.pages()[0];
    await page.goto("https://nvidia.com/");

    // Start collecting screenshots throughout the agent's journey
    const collector = new ScreenshotCollector(v3, {
      interval: 3000,
      maxScreenshots: 15,
    });
    activeCollector = collector;
    collector.start();

    const instruction =
      "Find the HGX H100 driver for Ubuntu 22.04 on AMD64 CPU. use https://nvidia.com/ to achieve the task. Don't go to any other site. The task is achievable with just navigation from this site.";
    const agentResult = await agent.execute({
      instruction,
      maxSteps: Number(process.env.AGENT_EVAL_MAX_STEPS) || 40,
    });

    // Stop and collect all screenshots from the journey
    const screenshots = await collector.stop();
    // Stopped cleanly; nothing is left for `finally` to clean up.
    activeCollector = null;

    logger.log({
      category: "evaluation",
      message: `Collected ${screenshots.length} screenshots for evaluation`,
      level: 1,
    });

    const evaluator = new V3Evaluator(v3);
    const { evaluation, reasoning } = await evaluator.ask({
      question: `did the agent complete this task successfully? ${instruction}`,
      screenshot: screenshots,
      agentReasoning: agentResult.message,
    });

    console.log(`reasoning: ${reasoning}`);

    if (evaluation !== "YES") {
      return {
        _success: false,
        message: reasoning,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }
    return {
      _success: true,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    const errorMessage = error instanceof Error ? error.message : String(error);
    return {
      _success: false,
      message: errorMessage,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    // Stop a still-running collector before the session is closed.
    if (activeCollector) {
      try {
        await activeCollector.stop();
      } catch {
        // Best-effort cleanup; the eval result has already been decided.
      }
    }
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/oed_word_search.ts
================================================
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";
import { ScreenshotCollector } from "../../utils/ScreenshotCollector.js";

/**
 * Agent eval: on oed.com, filter search results to words first used between
 * 1500 and 1600 and list the headwords of the first ten results.
 *
 * Screenshots collected while the agent runs, together with the agent's
 * final message, are handed to a V3Evaluator which decides whether the task
 * succeeded.
 *
 * @returns An object with `_success`, `debugUrl`, `sessionUrl` and `logs`.
 * Failures also carry `message`: the evaluator's reasoning, or the text of
 * the error that was caught.
 */
export const oed_word_search: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  // Tracks a collector that has been started but not yet stopped, so that
  // `finally` can stop it when the agent (or anything after it) throws.
  let activeCollector: ScreenshotCollector | null = null;

  try {
    const page = v3.context.pages()[0];
    await page.goto("https://www.oed.com");

    // Start collecting screenshots throughout the agent's journey
    const collector = new ScreenshotCollector(v3, {
      interval: 3000,
      maxScreenshots: 15,
    });
    activeCollector = collector;
    collector.start();

    const instruction =
      "Filter search results to show only entries for words first used from 1500 to 1600 and list the headwords of the first 10 results. Only use http://oed.com/ to achieve the task. Don't go to any other site. The task is achievable with just navigation from this site.";
    const agentResult = await agent.execute({
      instruction,
      maxSteps: Number(process.env.AGENT_EVAL_MAX_STEPS) || 30,
    });

    // Stop and collect all screenshots from the journey
    const screenshots = await collector.stop();
    // Stopped cleanly; nothing is left for `finally` to clean up.
    activeCollector = null;

    logger.log({
      category: "evaluation",
      message: `Collected ${screenshots.length} screenshots for evaluation`,
      level: 1,
    });

    const evaluator = new V3Evaluator(v3);
    const { evaluation, reasoning } = await evaluator.ask({
      question: `did the agent complete this task successfully? ${instruction}`,
      screenshot: screenshots,
      agentReasoning: agentResult.message,
    });

    console.log(`reasoning: ${reasoning}`);

    if (evaluation !== "YES") {
      return {
        _success: false,
        message: reasoning,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }
    return {
      _success: true,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    const errorMessage = error instanceof Error ? error.message : String(error);
    return {
      _success: false,
      message: errorMessage,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    // Stop a still-running collector before the session is closed.
    if (activeCollector) {
      try {
        await activeCollector.stop();
      } catch {
        // Best-effort cleanup; the eval result has already been decided.
      }
    }
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/onlineMind2Web.ts
================================================
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";
import { ScreenshotCollector } from "../../utils/ScreenshotCollector.js";
import { imageResize } from "../../utils/imageResize.js";

/**
 * Agent eval driven by an Online-Mind2Web task description.
 *
 * Reads `website` and `confirmed_task` from `input.params`, opens the
 * website, creates its own agent via `v3.agent` (the page title is embedded
 * in the system prompt) and runs the task. Screenshots collected during the
 * run are passed through `imageResize` and handed, together with the
 * agent's final message, to a V3Evaluator.
 *
 * @returns An object with `_success`, `debugUrl`, `sessionUrl` and `logs`.
 * A completed run adds `reasoning` and `task_level`; missing params or a
 * caught exception add `error` instead.
 */
export const onlineMind2Web: EvalFunction = async ({
  v3,
  logger,
  debugUrl,
  sessionUrl,
  modelName,
  input,
}) => {
  type Mind2WebParams = {
    task_id?: string;
    confirmed_task?: string;
    website?: string;
    reference_length?: number;
    level?: string;
  };

  // Kept outside `try` so `finally` can always stop the collector.
  let screenshotCollector: ScreenshotCollector | null = null;

  try {
    const params = (input?.params || {}) as Mind2WebParams;
    const { website, confirmed_task: task, level } = params;

    if (!website || !task) {
      return {
        _success: false,
        error: `Missing onlineMind2Web params (website, confirmed_task). Got: ${JSON.stringify(params)}`,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }

    const page = v3.context.pages()[0];
    await page.goto(website, {
      timeoutMs: 120_000,
    });

    const pageTitle = await page.title();
    const agent = v3.agent({
      cua: true,
      model: modelName,
      systemPrompt: `You are a helpful assistant that must solve the task by browsing. At the end, produce a single line: "Final Answer: <answer>" summarizing the requested result (e.g., score, list, or text). Current page: ${pageTitle}. ALWAYS OPERATE WITHIN THE PAGE OPENED BY THE USER, WHICHEVER TASK YOU ARE ATTEMPTING TO COMPLETE CAN BE ACCOMPLISHED WITHIN THE PAGE.`,
    });

    screenshotCollector = new ScreenshotCollector(v3, {
      interval: 3000,
      maxScreenshots: 7,
    });
    screenshotCollector.start();

    const agentResult = await agent.execute({
      instruction: task,
      maxSteps: Number(process.env.AGENT_EVAL_MAX_STEPS) || 50,
    });

    // Gather everything captured during the run, then resize each image
    // (factor 0.7) before it is sent to the evaluator.
    let screenshots = await screenshotCollector.stop();
    if (screenshots.length > 0) {
      const resizeJobs = screenshots.map(async (shot) =>
        imageResize(shot, 0.7),
      );
      screenshots = await Promise.all(resizeJobs);
    }

    logger.log({
      category: "evaluation",
      message: `Collected ${screenshots.length} screenshots for evaluation`,
      level: 1,
    });

    const evaluator = new V3Evaluator(v3);
    const agentReasoning =
      agentResult.message ||
      "no reasoning available, agent potentially hit step limit";
    const verdict = await evaluator.ask({
      question: `Did the agent successfully complete this task: "${task}"?`,
      screenshot: screenshots,
      agentReasoning,
    });

    // Drop the screenshot buffers so they can be reclaimed.
    screenshots.length = 0;

    return {
      _success: verdict.evaluation === "YES",
      reasoning: verdict.reasoning,
      task_level: level,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      error,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    if (screenshotCollector) {
      try {
        await screenshotCollector.stop();
      } catch {
        // Cleanup is best-effort; failures here are deliberately ignored.
      }
    }
  }
};


================================================
FILE: packages/evals/tasks/agent/radiotimes_tv_schedule.ts
================================================
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";
import { ScreenshotCollector } from "../../utils/ScreenshotCollector.js";

/**
 * Agent eval: on radiotimes.com, locate tonight's featured TV schedule and
 * list the shows airing on both BBC and ITV.
 *
 * Screenshots collected while the agent runs, together with the agent's
 * final message, are handed to a V3Evaluator which decides whether the task
 * succeeded.
 *
 * @returns An object with `_success`, `debugUrl`, `sessionUrl` and `logs`.
 * Failures also carry `message`: the evaluator's reasoning, or the text of
 * the error that was caught.
 */
export const radiotimes_tv_schedule: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  // Tracks a collector that has been started but not yet stopped, so that
  // `finally` can stop it when the agent (or anything after it) throws.
  let activeCollector: ScreenshotCollector | null = null;

  try {
    const page = v3.context.pages()[0];
    await page.goto("https://radiotimes.com");

    // Start collecting screenshots throughout the agent's journey
    const collector = new ScreenshotCollector(v3, {
      interval: 3000,
      maxScreenshots: 15,
    });
    activeCollector = collector;
    collector.start();

    const instruction =
      "Locate tonight's featured TV schedule on Radiotimes, and list the titles of shows airing on both BBC and ITV. Only use http://radiotimes.com to achieve the task. Don't go to any other site. The task is achievable with just navigation from this site.";
    const agentResult = await agent.execute({
      instruction,
      maxSteps: Number(process.env.AGENT_EVAL_MAX_STEPS) || 40,
    });

    // Stop and collect all screenshots from the journey
    const screenshots = await collector.stop();
    // Stopped cleanly; nothing is left for `finally` to clean up.
    activeCollector = null;

    logger.log({
      category: "evaluation",
      message: `Collected ${screenshots.length} screenshots for evaluation`,
      level: 1,
    });

    const evaluator = new V3Evaluator(v3);
    const { evaluation, reasoning } = await evaluator.ask({
      question: `did the agent complete this task successfully? ${instruction}`,
      screenshot: screenshots,
      agentReasoning: agentResult.message,
    });

    console.log(`reasoning: ${reasoning}`);

    if (evaluation !== "YES") {
      return {
        _success: false,
        message: reasoning,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }
    return {
      _success: true,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    const errorMessage = error instanceof Error ? error.message : String(error);
    return {
      _success: false,
      message: errorMessage,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    // Stop a still-running collector before the session is closed.
    if (activeCollector) {
      try {
        await activeCollector.stop();
      } catch {
        // Best-effort cleanup; the eval result has already been decided.
      }
    }
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/redfin_apartment_rental.ts
================================================
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";
import { ScreenshotCollector } from "../../utils/ScreenshotCollector.js";

/**
 * Agent eval: on redfin.com, find a 2 bed / 1.5+ bath rental in New York
 * with a move-in date 30 days from the moment the eval runs.
 *
 * Screenshots collected while the agent runs, together with the agent's
 * final message, are handed to a V3Evaluator which decides whether the task
 * succeeded.
 *
 * @returns An object with `_success`, `debugUrl`, `sessionUrl` and `logs`.
 * Failures also carry `message`: the evaluator's reasoning, or the text of
 * the error that was caught.
 */
export const redfin_apartment_rental: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  // Tracks a collector that has been started but not yet stopped, so that
  // `finally` can stop it when the agent (or anything after it) throws.
  let activeCollector: ScreenshotCollector | null = null;

  try {
    const page = v3.context.pages()[0];
    await page.goto("https://redfin.com/");

    // Start collecting screenshots throughout the agent's journey
    const collector = new ScreenshotCollector(v3, {
      interval: 3000,
      maxScreenshots: 15,
    });
    activeCollector = collector;
    collector.start();

    // Calculate move-in date as 30 days from now
    const moveInDate = new Date();
    moveInDate.setDate(moveInDate.getDate() + 30);
    const moveInDateFormatted = moveInDate.toLocaleDateString("en-US", {
      year: "numeric",
      month: "long",
      day: "numeric",
    });

    const instruction = `Find a 2 bed and 1.5+ bath apartment listing for rent in New York, with a move in date of ${moveInDateFormatted}. use https://redfin.com/ to achieve the task. Don't go to any other site. The task is achievable with just navigation from this site.`;
    const agentResult = await agent.execute({
      instruction,
      maxSteps: Number(process.env.AGENT_EVAL_MAX_STEPS) || 40,
    });

    // Stop and collect all screenshots from the journey
    const screenshots = await collector.stop();
    // Stopped cleanly; nothing is left for `finally` to clean up.
    activeCollector = null;

    logger.log({
      category: "evaluation",
      message: `Collected ${screenshots.length} screenshots for evaluation`,
      level: 1,
    });

    const evaluator = new V3Evaluator(v3);
    const { evaluation, reasoning } = await evaluator.ask({
      question: `did the agent complete this task successfully? ${instruction}`,
      screenshot: screenshots,
      agentReasoning: agentResult.message,
    });

    console.log(`reasoning: ${reasoning}`);

    if (evaluation !== "YES") {
      return {
        _success: false,
        message: reasoning,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }
    return {
      _success: true,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    const errorMessage = error instanceof Error ? error.message : String(error);
    return {
      _success: false,
      message: errorMessage,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    // Stop a still-running collector before the session is closed.
    if (activeCollector) {
      try {
        await activeCollector.stop();
      } catch {
        // Best-effort cleanup; the eval result has already been decided.
      }
    }
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/sf_library_card.ts
================================================
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";

/**
 * Agent eval: fill the street address field on the SFPL self-registration
 * form.
 *
 * After the agent runs, its result is logged and a V3Evaluator is asked
 * whether the field shows the expected address.
 *
 * @returns An object with `_success`, `debugUrl`, `sessionUrl` and `logs`.
 * `observations` holds the evaluator's reasoning, or a fixed notice when
 * the verdict is neither "YES" nor "NO"; a caught exception is returned
 * under `error` instead.
 */
export const sf_library_card: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto("https://sflib1.sfpl.org/selfreg");

    const agentResult = await agent.execute({
      instruction: "Fill in the 'street Address' field with '166 Geary St'",
      maxSteps: Number(process.env.AGENT_EVAL_MAX_STEPS) || 1,
    });
    logger.log(agentResult);

    const evaluator = new V3Evaluator(v3);
    const { evaluation, reasoning } = await evaluator.ask({
      question:
        "Does the page show the 'street Address' field filled with '166 Geary St'?",
    });

    // Anything other than a plain YES/NO counts as an evaluator failure.
    const isRecognisedVerdict = evaluation === "YES" || evaluation === "NO";

    return {
      _success: evaluation === "YES",
      observations: isRecognisedVerdict
        ? reasoning
        : "Evaluator provided an invalid response",
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      error: error,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/sf_library_card_multiple.ts
================================================
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";

/**
 * Agent eval: fill every required field of the SFPL self-registration form
 * with mock data, without submitting it.
 *
 * After the agent runs, its result is logged and a V3Evaluator is asked
 * whether all required fields appear filled.
 *
 * @returns An object with `_success`, `debugUrl`, `sessionUrl` and `logs`.
 * `observations` holds the evaluator's reasoning, or a fixed notice when
 * the verdict is neither "YES" nor "NO"; a caught exception is returned
 * under `error` instead.
 */
export const sf_library_card_multiple: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto("https://sflib1.sfpl.org/selfreg");

    const agentResult = await agent.execute({
      instruction:
        "Fill in ALL the required fields with mock data. DO NOT submit the form",
      maxSteps: Number(process.env.AGENT_EVAL_MAX_STEPS) || 20,
    });
    logger.log(agentResult);

    const evaluator = new V3Evaluator(v3);
    const { evaluation, reasoning } = await evaluator.ask({
      question: "Does the page show all the required fields filled?",
    });

    // Anything other than a plain YES/NO counts as an evaluator failure.
    const isRecognisedVerdict = evaluation === "YES" || evaluation === "NO";

    return {
      _success: evaluation === "YES",
      observations: isRecognisedVerdict
        ? reasoning
        : "Evaluator provided an invalid response",
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      error: error,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/sign_in.ts
================================================
import { EvalFunction } from "../../types/evals.js";

/**
 * Agent eval: opens the demo login flow and asks the agent to sign in with a
 * fixed email/password pair.
 *
 * The run succeeds only when the page URL afterwards is exactly the
 * `/authorized` route. The final URL is always reported in `observations`.
 * Thrown errors are returned in `error`, and `v3` is closed in every case.
 */
export const sign_in: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  try {
    const loginPage = v3.context.pages()[0];
    await loginPage.goto("https://v0-modern-login-flow.vercel.app/");

    const stepBudget = Number(process.env.AGENT_EVAL_MAX_STEPS) || 15;
    const agentResult = await agent.execute({
      instruction:
        "Sign in with the email address 'test@browserbaser.com' and the password 'stagehand=goated' ",
      maxSteps: stepBudget,
    });
    logger.log(agentResult);

    const landedUrl = loginPage.url();
    const isAuthorized =
      landedUrl === "https://v0-modern-login-flow.vercel.app/authorized";

    return {
      _success: isAuthorized,
      observations: landedUrl,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      error,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/steam_games.ts
================================================
import { EvalFunction } from "../../types/evals.js";

/**
 * Agent eval: opens the Steam store and asks the agent to show the most played
 * games and report the current player count.
 *
 * Success is decided purely by the final URL still containing the Steam store
 * origin. On failure the agent's own message is returned in `message`.
 * If anything throws, the thrown value is reported as a string in `message`:
 * `Error` instances contribute their `.message`, anything else is stringified.
 * `v3` is closed in every case.
 */
export const steam_games: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto("https://store.steampowered.com/");

    const agentResult = await agent.execute({
      instruction:
        "Show most played games in Steam. And tell me the number of players in game at this time",
      maxSteps: Number(process.env.AGENT_EVAL_MAX_STEPS) || 30,
    });

    //strictly used url check and no extract as the top games / players can vary
    const success = page.url().includes("https://store.steampowered.com/");

    if (!success) {
      return {
        _success: false,
        message: agentResult.message,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }
    return {
      _success: true,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    // A caught value is not guaranteed to be an Error; narrow before reading
    // `.message` so non-Error throws still produce a useful message.
    const errorMessage = error instanceof Error ? error.message : String(error);
    return {
      _success: false,
      message: errorMessage,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/thegamer_opinion_article.ts
================================================
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";
import { ScreenshotCollector } from "../../utils/ScreenshotCollector.js";

/**
 * Agent eval: starting from thegamer.com, asks the agent to locate an opinion
 * or cultural-commentary article and summarise its central argument.
 *
 * Screenshots are collected while the agent runs and handed, together with the
 * agent's final message, to a `V3Evaluator`. The run succeeds only when the
 * evaluator answers "YES"; otherwise the evaluator's reasoning is returned in
 * `message`. Thrown errors are reported as a string in `message`.
 *
 * Cleanup: the screenshot collector is stopped even when a step throws after
 * it was started, and `v3` is closed in every case.
 */
export const thegamer_opinion_article: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  // Declared outside `try` so `finally` can stop a collector that was started
  // but never reached its normal `stop()` call.
  let screenshotCollector: ScreenshotCollector | null = null;

  try {
    const page = v3.context.pages()[0];
    await page.goto("https://www.thegamer.com");

    // Start collecting screenshots throughout the agent's journey
    screenshotCollector = new ScreenshotCollector(v3, {
      interval: 3000,
      maxScreenshots: 15,
    });
    screenshotCollector.start();

    const instruction =
      "Locate an Opinion or Cultural Commentary article discussing modern gaming culture and summarize its central argument in one or two sentences. Only use http://thegamer.com to achieve the task. Don't go to any other site. The task is achievable with just navigation from this site.";
    const agentResult = await agent.execute({
      instruction,
      maxSteps: Number(process.env.AGENT_EVAL_MAX_STEPS) || 30,
    });

    // Stop and collect all screenshots from the journey
    const screenshots = await screenshotCollector.stop();
    // Stopped normally; nothing left for `finally` to clean up.
    screenshotCollector = null;

    logger.log({
      category: "evaluation",
      message: `Collected ${screenshots.length} screenshots for evaluation`,
      level: 1,
    });

    const evaluator = new V3Evaluator(v3);
    const { evaluation, reasoning } = await evaluator.ask({
      question: `did the agent complete this task successfully? ${instruction}`,
      screenshot: screenshots,
      agentReasoning: agentResult.message,
    });

    console.log(`reasoning: ${reasoning}`);

    const success = evaluation === "YES";

    if (!success) {
      return {
        _success: false,
        message: reasoning,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }
    return {
      _success: true,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    const errorMessage = error instanceof Error ? error.message : String(error);
    return {
      _success: false,
      message: errorMessage,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    if (screenshotCollector) {
      try {
        await screenshotCollector.stop();
      } catch {
        // Best-effort cleanup: a failing stop() must not prevent v3.close().
      }
    }
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/trailhead_superbadge.ts
================================================
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";
import { ScreenshotCollector } from "../../utils/ScreenshotCollector.js";

/**
 * Agent eval: starting from trailhead.salesforce.com, asks the agent to find
 * the tasks needed for the "Assess Your Access & Security Skills" category.
 *
 * Screenshots are collected while the agent runs and handed, together with the
 * agent's final message, to a `V3Evaluator`. The run succeeds only when the
 * evaluator answers "YES"; otherwise the evaluator's reasoning is returned in
 * `message`. Thrown errors are reported as a string in `message`.
 *
 * Cleanup: the screenshot collector is stopped even when a step throws after
 * it was started, and `v3` is closed in every case.
 */
export const trailhead_superbadge: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  // Declared outside `try` so `finally` can stop a collector that was started
  // but never reached its normal `stop()` call.
  let screenshotCollector: ScreenshotCollector | null = null;

  try {
    const page = v3.context.pages()[0];
    await page.goto("https://trailhead.salesforce.com/");

    // Start collecting screenshots throughout the agent's journey
    screenshotCollector = new ScreenshotCollector(v3, {
      interval: 3000,
      maxScreenshots: 15,
    });
    screenshotCollector.start();

    const instruction =
      "Find the tasks needed to complete the Assess Your Access & Security Skills category in the secure your app trailhead";
    const agentResult = await agent.execute({
      instruction,
      maxSteps: Number(process.env.AGENT_EVAL_MAX_STEPS) || 40,
    });

    // Stop and collect all screenshots from the journey
    const screenshots = await screenshotCollector.stop();
    // Stopped normally; nothing left for `finally` to clean up.
    screenshotCollector = null;

    logger.log({
      category: "evaluation",
      message: `Collected ${screenshots.length} screenshots for evaluation`,
      level: 1,
    });

    const evaluator = new V3Evaluator(v3);
    const { evaluation, reasoning } = await evaluator.ask({
      question: `did the agent complete this task successfully? ${instruction}`,
      screenshot: screenshots,
      agentReasoning: agentResult.message,
    });

    console.log(`reasoning: ${reasoning}`);

    const success = evaluation === "YES";

    if (!success) {
      return {
        _success: false,
        message: reasoning,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }
    return {
      _success: true,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    const errorMessage = error instanceof Error ? error.message : String(error);
    return {
      _success: false,
      message: errorMessage,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    if (screenshotCollector) {
      try {
        await screenshotCollector.stop();
      } catch {
        // Best-effort cleanup: a failing stop() must not prevent v3.close().
      }
    }
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/trivago.ts
================================================
import { EvalFunction } from "../../types/evals.js";

/**
 * Agent eval: opens trivago.com and asks the agent to find the cheapest room
 * at the H10 Tribeca hotel in Madrid for next weekend.
 *
 * Success is judged from the final URL alone: it must contain both the hotel
 * slug and the trivago domain. The final URL is always reported in
 * `observations`. Thrown errors are returned in `error`, and `v3` is closed in
 * every case.
 */
export const trivago: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  try {
    const searchPage = v3.context.pages()[0];
    await searchPage.goto("https://www.trivago.com/");

    const stepBudget = Number(process.env.AGENT_EVAL_MAX_STEPS) || 13;
    const agentResult = await agent.execute({
      instruction:
        "Find the cheapest room in the hotel H10 Tribeca in Madrid next weekend. Stop at the trivago page showing the results",
      maxSteps: stepBudget,
    });
    logger.log(agentResult);

    const finalUrl = searchPage.url();
    const onHotelResults =
      finalUrl.includes("hotel-h10-tribeca-madrid") &&
      finalUrl.includes("trivago.com");

    return {
      _success: onHotelResults,
      observations: finalUrl,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      error,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/trustpilot_hr_companies.ts
================================================
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";
import { ScreenshotCollector } from "../../utils/ScreenshotCollector.js";

/**
 * Agent eval: starting from trustpilot.com, asks the agent to filter HR &
 * Recruiting companies in London and list review summaries for the first
 * three rated above 4.5 stars.
 *
 * Screenshots are collected while the agent runs and handed, together with the
 * agent's final message, to a `V3Evaluator`. The run succeeds only when the
 * evaluator answers "YES"; otherwise the evaluator's reasoning is returned in
 * `message`. Thrown errors are reported as a string in `message`.
 *
 * Cleanup: the screenshot collector is stopped even when a step throws after
 * it was started, and `v3` is closed in every case.
 */
export const trustpilot_hr_companies: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  // Declared outside `try` so `finally` can stop a collector that was started
  // but never reached its normal `stop()` call.
  let screenshotCollector: ScreenshotCollector | null = null;

  try {
    const page = v3.context.pages()[0];
    await page.goto("https://trustpilot.com");

    // Start collecting screenshots throughout the agent's journey
    screenshotCollector = new ScreenshotCollector(v3, {
      interval: 3000,
      maxScreenshots: 15,
    });
    screenshotCollector.start();

    const instruction =
      "Use Trustpilot's search function to filter HR & Recruiting located in 'London', then list the review summaries for the first three companies listed above 4.5 stars. Only use http://trustpilot.com to achieve the task. Don't go to any other site. The task is achievable with just navigation from this site.";
    const agentResult = await agent.execute({
      instruction,
      maxSteps: Number(process.env.AGENT_EVAL_MAX_STEPS) || 40,
    });

    // Stop and collect all screenshots from the journey
    const screenshots = await screenshotCollector.stop();
    // Stopped normally; nothing left for `finally` to clean up.
    screenshotCollector = null;

    logger.log({
      category: "evaluation",
      message: `Collected ${screenshots.length} screenshots for evaluation`,
      level: 1,
    });

    const evaluator = new V3Evaluator(v3);
    const { evaluation, reasoning } = await evaluator.ask({
      question: `did the agent complete this task successfully? ${instruction}`,
      screenshot: screenshots,
      agentReasoning: agentResult.message,
    });

    console.log(`reasoning: ${reasoning}`);

    const success = evaluation === "YES";

    if (!success) {
      return {
        _success: false,
        message: reasoning,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }
    return {
      _success: true,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    const errorMessage = error instanceof Error ? error.message : String(error);
    return {
      _success: false,
      message: errorMessage,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    if (screenshotCollector) {
      try {
        await screenshotCollector.stop();
      } catch {
        // Best-effort cleanup: a failing stop() must not prevent v3.close().
      }
    }
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/ubereats.ts
================================================
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";

/**
 * Agent eval: opens ubereats.com and asks the agent to order a pizza to a
 * fixed address, stopping once the login page is shown.
 *
 * Success requires both that a `V3Evaluator` answers "YES" to "Did the agent
 * make it to the login page?" and that the final URL contains the Uber auth
 * origin. On failure the evaluator's reasoning is returned in `message`.
 * If anything throws, the thrown value is reported as a string in `message`:
 * `Error` instances contribute their `.message`, anything else is stringified.
 * `v3` is closed in every case.
 */
export const ubereats: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  try {
    const evaluator = new V3Evaluator(v3);
    const page = v3.context.pages()[0];
    await page.goto("https://www.ubereats.com/");

    await agent.execute({
      instruction:
        "Order a pizza from ubereats to 639 geary st in sf, call the task complete once the login page is shown after adding pizza and viewing the cart",
      maxSteps: Number(process.env.AGENT_EVAL_MAX_STEPS) || 35,
    });

    const { evaluation, reasoning } = await evaluator.ask({
      question: "Did the agent make it to the login page?",
    });

    const success =
      evaluation === "YES" && page.url().includes("https://auth.uber.com/");
    if (!success) {
      return {
        _success: false,
        message: reasoning,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }
    return {
      _success: true,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    // A caught value is not guaranteed to be an Error; narrow before reading
    // `.message` so non-Error throws still produce a useful message.
    const errorMessage = error instanceof Error ? error.message : String(error);
    return {
      _success: false,
      message: errorMessage,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/uniqlo_mens_blazers.ts
================================================
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";
import { ScreenshotCollector } from "../../utils/ScreenshotCollector.js";

/**
 * Agent eval: starting from uniqlo.com, asks the agent to show the list of
 * men's blazers in black, size M.
 *
 * Screenshots are collected while the agent runs and handed, together with the
 * agent's final message, to a `V3Evaluator`. The run succeeds only when the
 * evaluator answers "YES"; otherwise the evaluator's reasoning is returned in
 * `message`. Thrown errors are reported as a string in `message`.
 *
 * Cleanup: the screenshot collector is stopped even when a step throws after
 * it was started, and `v3` is closed in every case.
 */
export const uniqlo_mens_blazers: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  // Declared outside `try` so `finally` can stop a collector that was started
  // but never reached its normal `stop()` call.
  let screenshotCollector: ScreenshotCollector | null = null;

  try {
    const page = v3.context.pages()[0];
    await page.goto("https://www.uniqlo.com");

    // Start collecting screenshots throughout the agent's journey
    screenshotCollector = new ScreenshotCollector(v3, {
      interval: 3000,
      maxScreenshots: 15,
    });
    screenshotCollector.start();

    const instruction =
      "Show me the list of Men's Blazers, Black, Size M on Uniqlo.";
    const agentResult = await agent.execute({
      instruction,
      maxSteps: Number(process.env.AGENT_EVAL_MAX_STEPS) || 40,
    });

    // Stop and collect all screenshots from the journey
    const screenshots = await screenshotCollector.stop();
    // Stopped normally; nothing left for `finally` to clean up.
    screenshotCollector = null;

    logger.log({
      category: "evaluation",
      message: `Collected ${screenshots.length} screenshots for evaluation`,
      level: 1,
    });

    const evaluator = new V3Evaluator(v3);
    const { evaluation, reasoning } = await evaluator.ask({
      question: `did the agent complete this task successfully? ${instruction}`,
      screenshot: screenshots,
      agentReasoning: agentResult.message,
    });

    console.log(`reasoning: ${reasoning}`);

    const success = evaluation === "YES";

    if (!success) {
      return {
        _success: false,
        message: reasoning,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }
    return {
      _success: true,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    const errorMessage = error instanceof Error ? error.message : String(error);
    return {
      _success: false,
      message: errorMessage,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    if (screenshotCollector) {
      try {
        await screenshotCollector.stop();
      } catch {
        // Best-effort cleanup: a failing stop() must not prevent v3.close().
      }
    }
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/webmd_audiologist_search.ts
================================================
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";
import { ScreenshotCollector } from "../../utils/ScreenshotCollector.js";

/**
 * Agent eval: starting from doctor.webmd.com, asks the agent to find the best
 * audiologist within 50 miles of New York, NY with a rating of 4 or above.
 *
 * Screenshots are collected while the agent runs and handed, together with the
 * agent's final message, to a `V3Evaluator`. The run succeeds only when the
 * evaluator answers "YES"; otherwise the evaluator's reasoning is returned in
 * `message`. Thrown errors are reported as a string in `message`.
 *
 * Cleanup: the screenshot collector is stopped even when a step throws after
 * it was started, and `v3` is closed in every case.
 */
export const webmd_audiologist_search: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  // Declared outside `try` so `finally` can stop a collector that was started
  // but never reached its normal `stop()` call.
  let screenshotCollector: ScreenshotCollector | null = null;

  try {
    const page = v3.context.pages()[0];
    await page.goto("https://doctor.webmd.com/");

    // Start collecting screenshots throughout the agent's journey
    screenshotCollector = new ScreenshotCollector(v3, {
      interval: 3000,
      maxScreenshots: 15,
    });
    screenshotCollector.start();

    const instruction =
      "Find the best Audiologist within 50 miles of New York, NY, with a rating of 4 and above. use https://doctor.webmd.com/ to achieve the task. Don't go to any other site. The task is achievable with just navigation from this site.";
    const agentResult = await agent.execute({
      instruction,
      maxSteps: Number(process.env.AGENT_EVAL_MAX_STEPS) || 40,
    });

    // Stop and collect all screenshots from the journey
    const screenshots = await screenshotCollector.stop();
    // Stopped normally; nothing left for `finally` to clean up.
    screenshotCollector = null;

    logger.log({
      category: "evaluation",
      message: `Collected ${screenshots.length} screenshots for evaluation`,
      level: 1,
    });

    const evaluator = new V3Evaluator(v3);
    const { evaluation, reasoning } = await evaluator.ask({
      question: `did the agent complete this task successfully? ${instruction}`,
      screenshot: screenshots,
      agentReasoning: agentResult.message,
    });

    console.log(`reasoning: ${reasoning}`);

    const success = evaluation === "YES";

    if (!success) {
      return {
        _success: false,
        message: reasoning,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }
    return {
      _success: true,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    const errorMessage = error instanceof Error ? error.message : String(error);
    return {
      _success: false,
      message: errorMessage,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    if (screenshotCollector) {
      try {
        await screenshotCollector.stop();
      } catch {
        // Best-effort cleanup: a failing stop() must not prevent v3.close().
      }
    }
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/webmd_ovulation_calculator.ts
================================================
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";
import { ScreenshotCollector } from "../../utils/ScreenshotCollector.js";

/**
 * Agent eval: starting from webmd.com, asks the agent to find the ovulation
 * calculator, enter Mar 1 as the first day of the period, and compute the
 * ovulation date and pregnancy test day.
 *
 * Screenshots are collected while the agent runs and handed, together with the
 * agent's final message, to a `V3Evaluator`. The run succeeds only when the
 * evaluator answers "YES"; otherwise the evaluator's reasoning is returned in
 * `message`. Thrown errors are reported as a string in `message`.
 *
 * Cleanup: the screenshot collector is stopped even when a step throws after
 * it was started, and `v3` is closed in every case.
 */
export const webmd_ovulation_calculator: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  logger,
  agent,
  v3,
}) => {
  // Declared outside `try` so `finally` can stop a collector that was started
  // but never reached its normal `stop()` call.
  let screenshotCollector: ScreenshotCollector | null = null;

  try {
    const page = v3.context.pages()[0];
    await page.goto("https://www.webmd.com/");

    // Start collecting screenshots throughout the agent's journey
    screenshotCollector = new ScreenshotCollector(v3, {
      interval: 3000,
      maxScreenshots: 15,
    });
    screenshotCollector.start();

    const instruction =
      "Search for the ovulation calculator and enter Mar 1 as the first date of the period and calculate the date of ovulation and pregnancy test day. use https://www.webmd.com/ to achieve the task. Don't go to any other site. The task is achievable with just navigation from this site.";
    const agentResult = await agent.execute({
      instruction,
      maxSteps: Number(process.env.AGENT_EVAL_MAX_STEPS) || 40,
    });

    // Stop and collect all screenshots from the journey
    const screenshots = await screenshotCollector.stop();
    // Stopped normally; nothing left for `finally` to clean up.
    screenshotCollector = null;

    logger.log({
      category: "evaluation",
      message: `Collected ${screenshots.length} screenshots for evaluation`,
      level: 1,
    });

    const evaluator = new V3Evaluator(v3);
    const { evaluation, reasoning } = await evaluator.ask({
      question: `did the agent complete this task successfully? ${instruction}`,
      screenshot: screenshots,
      agentReasoning: agentResult.message,
    });

    console.log(`reasoning: ${reasoning}`);

    const success = evaluation === "YES";

    if (!success) {
      return {
        _success: false,
        message: reasoning,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }
    return {
      _success: true,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    const errorMessage = error instanceof Error ? error.message : String(error);
    return {
      _success: false,
      message: errorMessage,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    if (screenshotCollector) {
      try {
        await screenshotCollector.stop();
      } catch {
        // Best-effort cleanup: a failing stop() must not prevent v3.close().
      }
    }
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/agent/webtailbench.ts
================================================
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";
import { ScreenshotCollector } from "../../utils/ScreenshotCollector.js";
import { imageResize } from "../../utils/imageResize.js";

/**
 * WebTailBench eval: runs one benchmark question (`input.params.ques`) with a
 * CUA agent created from `modelName`, then asks a `V3Evaluator` whether the
 * task was completed, based on collected screenshots and the agent's message.
 *
 * - Returns `_success: false` with an `error` string when `ques` is missing.
 * - Starts from `params.web` when provided, otherwise from Google.
 * - Screenshots are resized by a factor of 0.7 before evaluation.
 * - `_success` is true only when the evaluator answers "YES"; the evaluator's
 *   reasoning is returned in `reasoning`.
 * - Thrown errors are returned in `error`.
 *
 * The screenshot collector is stopped in `finally` (errors ignored). This task
 * does not close `v3` itself.
 */
export const webtailbench: EvalFunction = async ({
  v3,
  logger,
  debugUrl,
  sessionUrl,
  modelName,
  input,
}) => {
  type WebTailBenchParams = {
    id?: string;
    category?: string;
    ques?: string;
    web?: string;
  };

  let screenshotCollector: ScreenshotCollector | null = null;

  try {
    const params = (input?.params || {}) as WebTailBenchParams;
    const question = params.ques;

    if (!question) {
      return {
        _success: false,
        error: `Missing webtailbench params (ques). Got: ${JSON.stringify(params)}`,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }

    const page = v3.context.pages()[0];
    // web field is always empty in WebTailBench; start from Google
    await page.goto(params.web || "https://www.google.com", {
      timeoutMs: 120_000,
    });

    // Resolve the title first so it can be embedded in the system prompt.
    const pageTitle = await page.title();
    const cuaAgent = v3.agent({
      cua: true,
      model: modelName,
      systemPrompt: `You are a helpful assistant that must solve the task by browsing. At the end, produce a single line: "Final Answer: <answer>" summarizing the requested result (e.g., score, list, or text). Current page: ${pageTitle}. You will need to navigate to the appropriate website to complete the task.`,
    });

    const collector = new ScreenshotCollector(v3, {
      interval: 3000,
      maxScreenshots: 8,
    });
    screenshotCollector = collector;
    collector.start();

    const agentResult = await cuaAgent.execute({
      instruction: question,
      maxSteps: Number(process.env.AGENT_EVAL_MAX_STEPS) || 50,
    });

    // Stop collecting and get all screenshots
    let shots = await collector.stop();

    // Downscale only when something was captured
    if (shots.length > 0) {
      shots = await Promise.all(
        shots.map(async (shot) => await imageResize(shot, 0.7)),
      );
    }

    logger.log({
      category: "evaluation",
      message: `Collected ${shots.length} screenshots for evaluation`,
      level: 1,
    });

    const verdict = await new V3Evaluator(v3).ask({
      question: `Did the agent successfully complete this task: "${question}"? Note that the agent does not have purchasing/booking capabilities; mark as pass if the agent has successfully performed all necessary steps for the task up to the point of purchasing/booking/entering payment/user information`,
      screenshot: shots,
      agentReasoning:
        agentResult.message ||
        "no reasoning available, agent potentially hit step limit",
    });

    // Clear screenshot buffers to free memory
    shots.length = 0;

    return {
      _success: verdict.evaluation === "YES",
      reasoning: verdict.reasoning,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      error,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    if (screenshotCollector) {
      try {
        await screenshotCollector.stop();
      } catch {
        // Ignore errors during cleanup
      }
    }
  }
};


================================================
FILE: packages/evals/tasks/agent/webvoyager.ts
================================================
import { EvalFunction } from "../../types/evals.js";
import { V3Evaluator } from "@browserbasehq/stagehand";
import { ScreenshotCollector } from "../../utils/ScreenshotCollector.js";
import { imageResize } from "../../utils/imageResize.js";

/**
 * WebVoyager eval: opens `input.params.web`, runs the benchmark question
 * (`input.params.ques`) with an agent created from `modelName`, then asks a
 * `V3Evaluator` whether the task was completed, based on collected screenshots
 * and the agent's message.
 *
 * - Returns `_success: false` with an `error` string when `web` or `ques` is
 *   missing.
 * - Screenshots are resized by a factor of 0.7 before evaluation.
 * - `_success` is true only when the evaluator answers "YES"; the evaluator's
 *   reasoning is returned in `reasoning`.
 * - Thrown errors are returned in `error`.
 *
 * The screenshot collector is stopped in `finally` (errors ignored). This task
 * does not close `v3` itself.
 */
export const webvoyager: EvalFunction = async ({
  v3,
  logger,
  debugUrl,
  sessionUrl,
  modelName,
  input,
}) => {
  type WebVoyagerParams = {
    id?: string;
    web?: string;
    ques?: string;
    web_name?: string;
  };

  let screenshotCollector: ScreenshotCollector | null = null;

  try {
    const params = (input?.params || {}) as WebVoyagerParams;
    const startUrl = params.web;
    const question = params.ques;

    if (!startUrl || !question) {
      return {
        _success: false,
        error: `Missing WebVoyager params (web, ques). Got: ${JSON.stringify(params)}`,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }

    const page = v3.context.pages()[0];
    await page.goto(startUrl, {
      timeoutMs: 120_000,
    });

    // Resolve the title first so it can be embedded in the system prompt.
    const pageTitle = await page.title();
    const browsingAgent = v3.agent({
      model: modelName,
      systemPrompt: `You are a helpful assistant that must solve the task by browsing. At the end, produce a single line: "Final Answer: <answer>" summarizing the requested result (e.g., score, list, or text). Current page: ${pageTitle}`,
    });

    const collector = new ScreenshotCollector(v3, {
      interval: 3000,
      maxScreenshots: 7,
    });
    screenshotCollector = collector;
    collector.start();

    const agentResult = await browsingAgent.execute({
      instruction: question,
      maxSteps: Number(process.env.AGENT_EVAL_MAX_STEPS) || 50,
    });

    // Stop collecting and get all screenshots
    let shots = await collector.stop();

    // Downscale only when something was captured
    if (shots.length > 0) {
      shots = await Promise.all(
        shots.map(async (shot) => await imageResize(shot, 0.7)),
      );
    }

    logger.log({
      category: "evaluation",
      message: `Collected ${shots.length} screenshots for evaluation`,
      level: 1,
    });

    const verdict = await new V3Evaluator(v3).ask({
      question: `Did the agent successfully complete this task: "${question}"?`,
      screenshot: shots,
      agentReasoning:
        agentResult.message ||
        "no reasoning available, agent potentially hit step limit",
    });

    // Clear screenshot buffers to free memory
    shots.length = 0;

    return {
      _success: verdict.evaluation === "YES",
      reasoning: verdict.reasoning,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      error,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    if (screenshotCollector) {
      try {
        await screenshotCollector.stop();
      } catch {
        // Ignore errors during cleanup
      }
    }
  }
};


================================================
FILE: packages/evals/tasks/allrecipes.ts
================================================
import { EvalFunction } from "../types/evals.js";
import { z } from "zod";

/**
 * Eval: searches allrecipes.com for "chocolate chip cookies" and extracts the
 * first recipe's title and total rating count.
 *
 * The run succeeds when the title equals the expected title exactly and the
 * parsed rating count is within 1000 of the expected count. On a mismatch the
 * individual validation errors are logged via `logger.error` and a fixed
 * `error` string is returned. Thrown errors are returned in `error` alongside
 * a fixed `message`. `v3` is closed in every case.
 */
export const allrecipes: EvalFunction = async ({
  logger,
  debugUrl,
  sessionUrl,
  v3,
}) => {
  const expectedTitle = "Best Chocolate Chip Cookies";
  const expectedRatings = 19164;
  const ratingsTolerance = 1000;

  try {
    const page = v3.context.pages()[0];
    await page.goto("https://www.allrecipes.com/", {
      waitUntil: "domcontentloaded",
    });

    const searchSteps = [
      'Type "chocolate chip cookies" in the search bar',
      "press enter",
    ];
    for (const step of searchSteps) {
      await v3.act(step);
    }

    const recipeSchema = z.object({
      title: z.string().describe("Title of the recipe"),
      total_ratings: z
        .string()
        .describe("Total number of ratings for the recipe"),
    });
    const { title, total_ratings } = await v3.extract(
      "Extract the title of the first recipe and the total number of ratings it has received.",
      recipeSchema,
    );

    // Strip everything but digits (e.g. thousands separators) before parsing.
    const extractedRatings = Number.parseInt(
      total_ratings.replace(/\D/g, ""),
      10,
    );

    const titleMatches = title === expectedTitle;
    // NaN (no digits extracted) fails this comparison and counts as out of range.
    const ratingsInRange =
      Math.abs(extractedRatings - expectedRatings) <= ratingsTolerance;

    if (titleMatches && ratingsInRange) {
      return {
        _success: true,
        recipeDetails: {
          title,
          total_ratings: extractedRatings,
        },
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
      };
    }

    const errors = [
      ...(titleMatches
        ? []
        : [
            {
              message: "Extracted title does not match the expected title",
              expected: expectedTitle,
              actual: title,
            },
          ]),
      ...(ratingsInRange
        ? []
        : [
            {
              message: "Extracted ratings are not within the expected range",
              expected: `${expectedRatings} ± ${ratingsTolerance}`,
              actual: extractedRatings.toString(),
            },
          ]),
    ];

    logger.error({
      message: "Failed to extract correct recipe details",
      level: 0,
      auxiliary: {
        errors: {
          value: JSON.stringify(errors),
          type: "object",
        },
      },
    });

    return {
      _success: false,
      error: "Recipe details extraction validation failed",
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } catch (error) {
    return {
      _success: false,
      message: "Recipe details extraction validation failed",
      error,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/amazon_add_to_cart.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: on the hosted Amazon replica, clicks "Add to Cart" and then "Proceed
 * to checkout", and checks that the page ends up on the sign-in URL.
 *
 * `_success` is true only when the final URL equals the expected sign-in URL
 * exactly; the final URL is returned in `currentUrl`. Thrown errors are
 * returned in `error`, and `v3` is closed in every case.
 */
export const amazon_add_to_cart: EvalFunction = async ({
  logger,
  debugUrl,
  sessionUrl,
  v3,
}) => {
  const expectedUrl =
    "https://browserbase.github.io/stagehand-eval-sites/sites/amazon/sign-in.html";

  try {
    const page = v3.context.pages()[0];
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/amazon/",
    );

    const checkoutSteps = [
      "click the 'Add to Cart' button",
      "click the 'Proceed to checkout' button",
    ];
    for (const step of checkoutSteps) {
      await v3.act(step);
    }

    const currentUrl = page.url();

    console.log("currentUrl", currentUrl);
    console.log("expectedUrl", expectedUrl);

    const reachedSignIn = currentUrl === expectedUrl;
    return {
      _success: reachedSignIn,
      currentUrl,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      error,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/apple.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: walks the iPhone 16 Pro purchase flow on apple.com (model, colour,
 * storage, trade-in of an iPhone 13 mini in good condition) through a fixed
 * sequence of `v3.act` instructions.
 *
 * `_success` reflects whether the trade-in confirmation text is visible at the
 * end. Thrown errors are returned in `error`, and `v3` is closed in every case.
 */
export const apple: EvalFunction = async ({
  logger,
  debugUrl,
  sessionUrl,
  v3,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto("https://www.apple.com/iphone-16-pro/");

    // Executed strictly in order; each step depends on the previous one.
    const purchaseSteps = [
      "click on the buy button",
      "select the Pro Max model",
      "select the natural titanium color",
      "select the 256GB storage option",
      "click on the 'select a smartphone' trade-in option",
      "select the iPhone 13 mini model from the dropdown",
      "select the iPhone 13 mini is in good condition",
    ];
    for (const step of purchaseSteps) {
      await v3.act(step);
    }

    const tradeInConfirmed = await page
      .locator('text="Good News. Your iPhone 13 mini qualifies for credit."')
      .isVisible();

    return {
      _success: tradeInConfirmed,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      error,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/arxiv.ts
================================================
import { EvalFunction } from "../types/evals.js";
import { z } from "zod";

/**
 * Eval: searches arXiv, extracts the titles and links of two result papers,
 * then visits each link and extracts a structured summary of its abstract.
 *
 * Passes only when exactly two papers were summarized and every one of them
 * has a non-empty `problem` and `methodology`. On success the summaries are
 * returned under `papers`. Errors are logged and reported as a failed result;
 * the session is closed on every exit path.
 */
export const arxiv: EvalFunction = async ({
  logger,
  debugUrl,
  sessionUrl,
  v3,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto("https://arxiv.org/search/");

    await v3.act("type web agents with multimodal models in the search bar");
    await v3.act("hit enter");

    const searchResults = await v3.extract(
      "extract the titles and links for two papers",
      z.object({
        papers: z
          .array(
            z.object({
              title: z.string().describe("the title of the paper"),
              link: z.string().url().describe("the link to the paper"),
            }),
          )
          .describe("list of papers"),
      }),
    );

    // Treat a missing result, a missing list, and an empty list the same way.
    const candidates =
      searchResults && searchResults.papers ? searchResults.papers : [];
    if (candidates.length === 0) {
      return {
        _success: false,
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
      };
    }

    // Every summary field except `category` is a nullable one-sentence string.
    const optionalText = (hint: string) => z.string().describe(hint).nullable();
    const abstractSchema = z.object({
      category: z
        .string()
        .describe(
          "the category of the paper. one of {'Benchmark', 'Dataset', 'Model', 'Framework', 'System', 'Other'}",
        ),
      problem: optionalText(
        "summarize the problem that the paper is trying to solve in one sentence",
      ),
      methodology: optionalText(
        "summarize the methodology of the paper in one sentence",
      ),
      results: optionalText(
        "summarize the results of the paper in one sentence",
      ),
      conclusion: optionalText(
        "summarize the conclusion of the paper in one sentence",
      ),
      code: optionalText(
        "if provided, extract only the link to the code repository, without additional text. this is often optional and not always provided.",
      ),
    });

    const summaries = [];
    for (const entry of candidates) {
      // Entries without a usable link are skipped rather than visited.
      if (!entry.link) continue;

      await page.goto(entry.link);
      const details = await v3.extract(
        "extract details of the paper from the abstract",
        abstractSchema,
      );
      summaries.push({ title: entry.title, link: entry.link, ...details });
    }

    if (summaries.length === 0) {
      return {
        _success: false,
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
      };
    }

    if (summaries.length !== 2) {
      logger.error({
        message: "incorrect number of papers extracted",
        level: 0,
        auxiliary: {
          expected: { value: "2", type: "integer" },
          actual: { value: summaries.length.toString(), type: "integer" },
        },
      });

      return {
        _success: false,
        error: "Incorrect number of papers extracted",
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
      };
    }

    // The first summary lacking a problem or methodology fails the eval.
    const incomplete = summaries.find(
      (summary) => !summary.problem || !summary.methodology,
    );
    if (incomplete !== undefined) {
      logger.error({
        message: `paper missing problem or methodology`,
        level: 0,
        auxiliary: {
          paper: { value: JSON.stringify(incomplete), type: "object" },
        },
      });

      return {
        _success: false,
        error: "Incomplete paper information",
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
      };
    }

    return {
      _success: true,
      papers: summaries,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } catch (error) {
    logger.error({
      message: `error in arxiv function`,
      level: 0,
      auxiliary: {
        error: { value: error.message, type: "string" },
        trace: { value: error.stack, type: "string" },
      },
    });

    return {
      _success: false,
      error,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/bidnet.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: on bidnetdirect.com, asks `act` to click the "Construction" keyword
 * and passes when the resulting page URL starts with the open-solicitations
 * URL filtered by that keyword.
 *
 * A thrown error is reported as a failed result; the session is closed on
 * every exit path.
 */
export const bidnet: EvalFunction = async ({
  logger,
  debugUrl,
  sessionUrl,
  v3,
}) => {
  // Prefix match only: anything appended after the keyword is accepted.
  const targetPrefix =
    "https://www.bidnetdirect.com/public/solicitations/open?keywords=Construction";

  try {
    const [page] = v3.context.pages();
    await page.goto("https://www.bidnetdirect.com/");

    await v3.act('Click on the "Construction" keyword');

    const landedOn = page.url();
    const reachedTarget = landedOn.startsWith(targetPrefix);

    return {
      _success: reachedTarget,
      currentUrl: landedOn,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      error,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/checkboxes.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: asks `act` to click the 'baseball' and 'netball' options on the
 * checkboxes test site, then passes when both `sports` checkboxes report
 * themselves as checked.
 *
 * A thrown error is reported as a failed result; the session is closed on
 * every exit path.
 */
export const checkboxes: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const [page] = v3.context.pages();
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/checkboxes/",
    );

    await v3.act("click the 'baseball' option");
    await v3.act("click the 'netball' option");

    // Reads the checked state of one checkbox by CSS selector.
    const readChecked = (selector: string) =>
      page.locator(selector).isChecked();

    const baseballTicked = await readChecked(
      'input[type="checkbox"][name="sports"][value="baseball"]',
    );
    const netballTicked = await readChecked(
      'input[type="checkbox"][name="sports"][value="netball"]',
    );

    return {
      _success: baseballTicked && netballTicked,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (e) {
    return {
      _success: false,
      error: e,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/combination_sauce.ts
================================================
import { EvalFunction } from "../types/evals.js";
import { z } from "zod";

/**
 * Eval: exercises extract, act and observe together on the saucedemo.com
 * login flow.
 *
 * Steps: extract the accepted usernames and the password from the login page,
 * log in as 'standard_user' with the extracted password, then observe the
 * 'add to cart' buttons. Passes when six usernames were extracted, the page
 * URL is the inventory page, and six observations came back.
 *
 * A thrown error is reported as a failed result whose `error` field is a
 * plain, JSON-safe value; the session is closed on every exit path.
 */
export const combination_sauce: EvalFunction = async ({
  logger,
  debugUrl,
  sessionUrl,
  v3,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto("https://www.saucedemo.com/");

    const { usernames, password } = await v3.extract(
      "extract the accepted usernames and the password for login",
      z.object({
        usernames: z.array(z.string()).describe("the accepted usernames"),
        password: z.string().describe("the password for login"),
      }),
    );

    // The username is fixed; only the password comes from the extraction.
    await v3.act(`enter username 'standard_user'`);

    await v3.act(`enter password '${password}'`);

    await v3.act("click on 'login'");

    const observations = await v3.observe("find all the 'add to cart' buttons");

    const url = page.url();

    const usernamesCheck = usernames.length === 6;
    const urlCheck = url === "https://www.saucedemo.com/inventory.html";
    const observationsCheck = observations.length === 6;

    return {
      _success: usernamesCheck && urlCheck && observationsCheck,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    // Reduce the thrown value to plain JSON-safe data. JSON.stringify returns
    // undefined for values it cannot represent and throws on cycles/BigInt;
    // neither may escape this handler, so fall back to the string form.
    let plain: unknown;
    try {
      const json = JSON.stringify(error);
      plain = json === undefined ? String(error) : JSON.parse(json);
    } catch {
      plain = String(error);
    }

    // JSON.stringify only emits enumerable own properties, so an Error
    // round-trips to `{}` and the failure reason is lost. Copy the
    // diagnostic fields across explicitly.
    const serialized =
      error instanceof Error
        ? {
            ...(plain !== null && typeof plain === "object" ? plain : {}),
            name: error.name,
            message: error.message,
            stack: error.stack,
          }
        : plain;

    return {
      _success: false,
      error: serialized,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/costar.ts
================================================
import { EvalFunction } from "../types/evals.js";
import { z } from "zod";

/**
 * Eval: on costar.com, clicks the first article, clicks the "learn more"
 * button for the first job, then extracts the article title.
 *
 * Passes when the extracted title is non-null and longer than five
 * characters. The title (or `null` on error) is returned alongside the
 * verdict. Errors are logged and reported as a failed result.
 *
 * The session is closed exactly once, in `finally`, which covers both the
 * success and the error path.
 */
export const costar: EvalFunction = async ({
  logger,
  debugUrl,
  sessionUrl,
  v3,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto("https://www.costar.com/");

    await v3.act("click on the first article");

    await v3.act("click on the learn more button for the first job");

    const articleTitle = await v3.extract(
      "extract the title of the article",
      z.object({
        title: z.string().describe("the title of the article").nullable(),
      }),
    );

    logger.log({
      message: "got article title",
      level: 1,
      auxiliary: {
        articleTitle: {
          value: JSON.stringify(articleTitle),
          type: "object",
        },
      },
    });

    // Check if the title is more than 5 characters
    const isTitleValid =
      articleTitle.title !== null && articleTitle.title.length > 5;

    // No explicit close here: the `finally` block below already closes the
    // session, and closing in both places closed it twice on success.
    return {
      title: articleTitle.title,
      _success: isTitleValid,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    logger.error({
      message: "error in costar function",
      level: 0,
      auxiliary: {
        error: {
          value: error.message,
          type: "string",
        },
        trace: {
          value: error.stack,
          type: "string",
        },
      },
    });

    return {
      title: null,
      _success: false,
      error: error,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/csr_in_oopif.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: checks that `act` can click a button that lives inside a closed-mode
 * shadow root (CSR) which is itself inside an out-of-process iframe (OOPIF).
 *
 * Passes when the extracted page text contains
 * "button successfully clicked". A thrown error is reported as a failed
 * result carrying the error message; the session is closed on every exit path.
 */
export const csr_in_oopif: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const [page] = v3.context.pages();
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/closed-shadow-root-in-oopif/",
    );
    await v3.act("click the button");

    // Fixed one-second pause before reading the page back (presumably to let
    // the click's effect reach the page -- confirm).
    await new Promise((done) => setTimeout(done, 1000));

    const extracted = await v3.extract("extract the entire page text");
    const pageText = extracted.extraction;
    const clicked = pageText.includes("button successfully clicked");

    return {
      _success: clicked,
      message: clicked
        ? `successfully clicked the button`
        : `unable to click on the button`,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      message: `error: ${error.message}`,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/csr_in_spif.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: checks that `act` can click a button that lives inside a closed-mode
 * shadow root (CSR) which is itself inside a same-process iframe (SPIF).
 *
 * Passes when the extracted page text contains
 * "button successfully clicked". A thrown error is reported as a failed
 * result carrying the error message; the session is closed on every exit path.
 */
export const csr_in_spif: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const [page] = v3.context.pages();
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/closed-shadow-dom-in-spif/",
    );
    await v3.act("click the button");

    const extracted = await v3.extract("extract the entire page text");
    const pageText = extracted.extraction;
    const clicked = pageText.includes("button successfully clicked");

    return {
      _success: clicked,
      message: clicked
        ? `successfully clicked the button`
        : `unable to click on the button`,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      message: `error: ${error.message}`,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/custom_dropdown.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: guards against wrongly applying the selectOptionFromDropdown method
 * (defined in actHandlerUtils.ts) to a 'dropdown' that is not a <select>
 * element. Such a dropdown has to be clicked open before it can be
 * interacted with.
 *
 * Passes when, after asking `act` to choose Canada, the page text returned by
 * an argument-less `extract()` contains 'Canada'. A thrown error is reported
 * as a failed result; the session is closed on every exit path.
 */
export const custom_dropdown: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const [page] = v3.context.pages();
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/expand-dropdown/",
    );

    await v3.act("choose Canada from the 'Select a Country' dropdown");

    // Verification: take the full page text and look for the chosen option.
    const snapshot = await v3.extract();
    const treeText = snapshot.pageText;

    if (!treeText.includes("Canada")) {
      return {
        _success: false,
        message: "unable to expand the dropdown",
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }

    return {
      _success: true,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      message: `error attempting to select an option from the dropdown: ${error.message}`,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/dropdown.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: expands a dropdown by clicking it directly, then asks `act` to type
 * into an input field that should be hidden behind the expanded dropdown.
 *
 * Passes when the input's value equals 'test fill'. Both the expected and the
 * actual value are included in the result. A thrown error is reported as a
 * failed result; the session is closed on every exit path.
 */
export const dropdown: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  const expectedValue = "test fill";

  try {
    const [page] = v3.context.pages();
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/dropdown/",
    );

    // Open the dropdown with a plain locator click, not through `act`.
    await page.locator("xpath=/html/body/div/div/button").click();

    // The input under test should now be covered by the expanded dropdown.
    await v3.act("type 'test fill' into the input field");

    // Read back what actually landed in the input box.
    const actualValue = await page
      .locator(`xpath=/html/body/div/input`)
      .inputValue();

    return {
      _success: actualValue === expectedValue,
      expectedValue,
      actualValue,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      error,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/extract_aigrant_companies.ts
================================================
import { z } from "zod";
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: extracts every AI Grant company with its batch number from the
 * aigrant test site and checks the result against known values.
 *
 * Passes when exactly 91 companies were extracted, the first one is
 * Goodfire (batch "4") and the last one is Forefront (batch "1"). Each
 * mismatch is logged with expected/actual values and reported as a failed
 * result. A thrown error is reported as a failed result; the session is
 * closed on every exit path.
 */
export const extract_aigrant_companies: EvalFunction = async ({
  logger,
  debugUrl,
  sessionUrl,
  v3,
}) => {
  const expectedLength = 91;
  const expectedFirstItem = { company: "Goodfire", batch: "4" };
  const expectedLastItem = { company: "Forefront", batch: "1" };

  // Logs one mismatch and builds the failed result that reports it.
  const reject = (
    reason: string,
    expected: string,
    actual: string,
    valueType: "integer" | "object",
  ) => {
    logger.error({
      message: reason,
      level: 0,
      auxiliary: {
        expected: { value: expected, type: valueType },
        actual: { value: actual, type: valueType },
      },
    });
    return {
      _success: false,
      error: reason,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  };

  try {
    const [page] = v3.context.pages();
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/aigrant/",
    );

    const { companies } = await v3.extract(
      "Extract all companies that received the AI grant and group them with their batch numbers as an array of objects. Each object should contain the company name and its corresponding batch number.",
      z.object({
        companies: z.array(
          z.object({
            company: z.string(),
            batch: z.string(),
          }),
        ),
      }),
    );

    if (companies.length !== expectedLength) {
      return reject(
        "Incorrect number of companies extracted",
        expectedLength.toString(),
        companies.length.toString(),
        "integer",
      );
    }

    // The count check above guarantees both ends of the list exist.
    const first = companies[0];
    if (
      first.company !== expectedFirstItem.company ||
      first.batch !== expectedFirstItem.batch
    ) {
      return reject(
        "First company extracted does not match expected",
        JSON.stringify(expectedFirstItem),
        JSON.stringify(first),
        "object",
      );
    }

    const last = companies[companies.length - 1];
    if (
      last.company !== expectedLastItem.company ||
      last.batch !== expectedLastItem.batch
    ) {
      return reject(
        "Last company extracted does not match expected",
        JSON.stringify(expectedLastItem),
        JSON.stringify(last),
        "object",
      );
    }

    return {
      _success: true,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } catch (error) {
    return {
      _success: false,
      error,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/extract_aigrant_targeted.ts
================================================
import { z } from "zod";
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: runs a targeted `extract` (scoped by an XPath selector) on the
 * aigrant test site and passes when the extracted company name is "Coframe".
 *
 * A mismatch is logged with expected/actual values and reported as a failed
 * result. A thrown error is reported as a failed result; the session is
 * closed on every exit path.
 */
export const extract_aigrant_targeted: EvalFunction = async ({
  logger,
  debugUrl,
  sessionUrl,
  v3,
}) => {
  const expectedCompany = "Coframe";

  try {
    const [page] = v3.context.pages();
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/aigrant/",
    );

    // The extraction is limited to the element this XPath points at.
    const targetXPath = "/html/body/div/ul[5]/li[28]";
    const extracted = await v3.extract(
      "Extract the company name.",
      z.object({
        company_name: z.string(),
      }),
      { selector: targetXPath },
    );
    const companyName = extracted.company_name;

    if (companyName == expectedCompany) {
      return {
        _success: true,
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
      };
    }

    logger.error({
      message: "extracted company name does not match expected",
      level: 0,
      auxiliary: {
        expected: { value: expectedCompany, type: "string" },
        actual: { value: companyName, type: "string" },
      },
    });
    return {
      _success: false,
      error: "Company name does not match expected",
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } catch (error) {
    return {
      _success: false,
      error,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/extract_aigrant_targeted_2.ts
================================================
import { z } from "zod";
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: negative check for targeted `extract` on the aigrant test site.
 *
 * The extraction is scoped by an XPath selector and asks for the company
 * that comes after 'Coframe'. That company (OpusClip) is NOT inside the
 * selected element, so a correctly scoped extraction gives the LLM no
 * visibility into it. The eval fails only when "OpusClip" is returned and
 * passes for any other extracted name.
 *
 * A thrown error is reported as a failed result; the session is closed on
 * every exit path.
 */
export const extract_aigrant_targeted_2: EvalFunction = async ({
  logger,
  debugUrl,
  sessionUrl,
  v3,
}) => {
  // The name that follows Coframe on the site; seeing it means the selector
  // scoping leaked content from outside the targeted element.
  const forbiddenCompany = "OpusClip";

  try {
    const [page] = v3.context.pages();
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/aigrant/",
    );

    const targetXPath = "/html/body/div/ul[5]/li[28]";
    const extracted = await v3.extract(
      "Extract the name of the company that comes after 'Coframe'.",
      z.object({
        company_name: z.string(),
      }),
      { selector: targetXPath },
    );
    const companyName = extracted.company_name;

    if (!(companyName == forbiddenCompany)) {
      return {
        _success: true,
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
      };
    }

    logger.error({
      message:
        "extracted company name matches the company name that we SHOULD NOT get",
      level: 0,
      auxiliary: {
        expected: { value: forbiddenCompany, type: "string" },
        actual: { value: companyName, type: "string" },
      },
    });
    return {
      _success: false,
      error:
        "extracted company name matches the company name that we SHOULD NOT get",
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } catch (error) {
    return {
      _success: false,
      error,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/extract_apartments.ts
================================================
import { z } from "zod";
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: extracts apartment listings (price and address) from the
 * apartments.com San Francisco 2-bedroom results page.
 *
 * Passes when at least 40 listings were extracted. A shortfall is logged
 * with expected/actual counts and reported as a failed result. A thrown error
 * is reported as a failed result; the session is closed on every exit path.
 */
export const extract_apartments: EvalFunction = async ({
  logger,
  debugUrl,
  sessionUrl,
  v3,
}) => {
  // Minimum acceptable count; extracting more than this still passes.
  const expectedLength = 40;

  try {
    const [page] = v3.context.pages();
    await page.goto("https://www.apartments.com/san-francisco-ca/2-bedrooms/", {
      waitUntil: "load",
    });

    const { listings } = await v3.extract(
      "Extract all the apartment listings with their prices and their addresses.",
      z.object({
        listings: z.array(
          z.object({
            price: z.string().describe("The price of the listing"),
            address: z.string().describe("The address of the listing"),
          }),
        ),
      }),
    );

    if (!(listings.length < expectedLength)) {
      return {
        _success: true,
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
      };
    }

    logger.error({
      message: "Incorrect number of listings extracted",
      level: 0,
      auxiliary: {
        expected: { value: expectedLength.toString(), type: "integer" },
        actual: { value: listings.length.toString(), type: "integer" },
      },
    });
    return {
      _success: false,
      error: "Incorrect number of listings extracted",
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } catch (error) {
    return {
      _success: false,
      error,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/extract_area_codes.ts
================================================
import { EvalFunction } from "../types/evals.js";
import { z } from "zod";

/**
 * Eval: extracts every Primary Center with its area code and zone name from
 * the ncc-area-codes test site and checks the result against known values.
 *
 * Passes when exactly 56 entries were extracted and the first and last
 * entries match the expected records field for field. Each mismatch is
 * logged with expected/actual values and reported as a failed result. A
 * thrown error is reported as a failed result; the session is closed on
 * every exit path.
 */
export const extract_area_codes: EvalFunction = async ({
  logger,
  debugUrl,
  sessionUrl,
  v3,
}) => {
  const expectedLength = 56;
  const expectedFirstItem = {
    zone_name: "Lagos Zone",
    primary_center_name: "Lagos",
    area_code: "01",
  };
  const expectedLastItem = {
    zone_name: "South-East",
    primary_center_name: "Yenagoa",
    area_code: "089",
  };

  // Exact, field-by-field comparison of an extracted entry with a reference.
  const sameCenter = (
    got: typeof expectedFirstItem,
    want: typeof expectedFirstItem,
  ) =>
    got.zone_name === want.zone_name &&
    got.primary_center_name === want.primary_center_name &&
    got.area_code === want.area_code;

  // Logs one mismatch and builds the failed result that reports it.
  const reject = (
    reason: string,
    expected: string,
    actual: string,
    valueType: "integer" | "object",
  ) => {
    logger.error({
      message: reason,
      level: 0,
      auxiliary: {
        expected: { value: expected, type: valueType },
        actual: { value: actual, type: valueType },
      },
    });
    return {
      _success: false,
      error: reason,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  };

  try {
    const [page] = v3.context.pages();
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/ncc-area-codes/",
      { waitUntil: "domcontentloaded" },
    );

    const extracted = await v3.extract(
      "Extract ALL the Primary Center names and their corresponding Area Code, and the name of their corresponding Zone.",
      z.object({
        primary_center_list: z.array(
          z.object({
            zone_name: z
              .string()
              .describe(
                "The name of the Zone that the Primary Center is in. For example, 'North Central Zone'.",
              ),
            primary_center_name: z
              .string()
              .describe(
                "The name of the Primary Center. I.e., this is the name of the city or town.",
              ),
            area_code: z
              .string()
              .describe(
                "The area code for the Primary Center. This will either be 2 or 3 digits.",
              ),
          }),
        ),
      }),
    );
    const centers = extracted.primary_center_list;

    if (centers.length !== expectedLength) {
      return reject(
        "Incorrect number of primary centers extracted",
        expectedLength.toString(),
        centers.length.toString(),
        "integer",
      );
    }

    // The count check above guarantees both ends of the list exist.
    const first = centers[0];
    if (!sameCenter(first, expectedFirstItem)) {
      return reject(
        "First primary center extracted does not match expected",
        JSON.stringify(expectedFirstItem),
        JSON.stringify(first),
        "object",
      );
    }

    const last = centers[centers.length - 1];
    if (!sameCenter(last, expectedLastItem)) {
      return reject(
        "Last primary center extracted does not match expected",
        JSON.stringify(expectedLastItem),
        JSON.stringify(last),
        "object",
      );
    }

    return {
      _success: true,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } catch (error) {
    return {
      _success: false,
      error,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/extract_baptist_health.ts
================================================
import { EvalFunction } from "../types/evals.js";
import { compareStrings } from "../utils.js";
import { z } from "zod";

/**
 * Eval: extracts the address, phone number and fax number of a healthcare
 * location from the baptist-health test site and compares each one with a
 * known value using `compareStrings` and a 0.85 similarity threshold.
 *
 * Passes when all three fields meet the threshold. Every field is compared
 * (no short-circuit); each one that falls short is logged and listed under
 * `failedFields` in the failed result. A thrown error is reported as a failed
 * result; the session is closed on every exit path.
 */
export const extract_baptist_health: EvalFunction = async ({
  logger,
  debugUrl,
  sessionUrl,
  v3,
}) => {
  const similarityThreshold = 0.85;
  const expected = {
    address: "2055 East South Blvd; Suite 908 Montgomery, AL 36116",
    phone: "334-747-2273",
    fax: "334-747-7501",
  };

  try {
    const [page] = v3.context.pages();
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/baptist-health/",
    );

    const { address, phone, fax } = await v3.extract(
      "Extract the address, phone number, and fax number of the healthcare location.",
      z.object({
        address: z.string(),
        phone: z.string(),
        fax: z.string(),
      }),
    );

    // [label used in logs, extracted value, reference value], checked in order.
    const comparisons: Array<[string, string, string]> = [
      ["Address", address, expected.address],
      ["Phone number", phone, expected.phone],
      ["Fax number", fax, expected.fax],
    ];

    const failedFields: Array<{
      field: string;
      similarity: number;
      expected: string;
      actual: string;
    }> = [];

    for (const [field, actual, wanted] of comparisons) {
      const { similarity, meetsThreshold } = compareStrings(
        actual,
        wanted,
        similarityThreshold,
      );
      if (meetsThreshold) continue;

      failedFields.push({ field, similarity, expected: wanted, actual });
      logger.error({
        message: `${field} extracted does not meet similarity threshold`,
        level: 0,
        auxiliary: {
          field: { value: field, type: "string" },
          similarity: { value: similarity.toFixed(2), type: "string" },
          expected: { value: wanted, type: "string" },
          actual: { value: actual, type: "string" },
        },
      });
    }

    // A field lands in failedFields exactly when it missed the threshold.
    if (failedFields.length > 0) {
      return {
        _success: false,
        error: "Some fields did not meet similarity threshold",
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
        failedFields,
      };
    }

    return {
      _success: true,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } catch (error) {
    return {
      _success: false,
      error,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/extract_capacitor_info.ts
================================================
import { EvalFunction } from "../types/evals.js";
import { normalizeString } from "../utils.js";
import { z } from "zod";

/**
 * Eval task: extract the ECCN code, RoHS status and impedance from the
 * capacitor eval site and compare each value, after `normalizeString`, with a
 * hard-coded expectation.
 *
 * The fields are checked in a fixed order. The first mismatch is logged and
 * ends the task with `_success: false`; any thrown error is returned in the
 * `error` field. `v3` is closed in every case.
 */
export const extract_capacitor_info: EvalFunction = async ({
  logger,
  debugUrl,
  sessionUrl,
  v3,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/capacitor/",
    );

    const extracted = await v3.extract(
      "Extract the ECCN Code, RoHS Status, and Impedance.",
      z.object({
        ECCN_code: z.string(),
        RoHS_Status: z.string(),
        Impedance: z.string(),
      }),
    );

    // One entry per field, in the order they are verified. `failure` is used
    // both as the log message and as the returned error string.
    const checks = [
      {
        actual: extracted.ECCN_code,
        expected: "EAR99",
        failure: "ECCN code extracted does not match expected",
      },
      {
        actual: extracted.RoHS_Status,
        expected: "RoHS Compliant",
        failure: "RoHS Status extracted does not match expected",
      },
      {
        actual: extracted.Impedance,
        expected: "12mOhm",
        failure: "Impedance extracted does not match expected",
      },
    ];

    for (const { actual, expected, failure } of checks) {
      if (normalizeString(actual) === normalizeString(expected)) {
        continue;
      }

      logger.error({
        message: failure,
        level: 0,
        auxiliary: {
          expected: {
            value: normalizeString(expected),
            type: "string",
          },
          actual: {
            value: normalizeString(actual),
            type: "string",
          },
        },
      });
      return {
        _success: false,
        error: failure,
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
      };
    }

    return {
      _success: true,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } catch (error) {
    return {
      _success: false,
      error: error,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/extract_collaborators.ts
================================================
import { EvalFunction } from "../types/evals.js";
import { z } from "zod";

/**
 * Eval task: open the facebook/react repository on GitHub, navigate to the
 * contributors section and extract the top five contributors.
 *
 * Succeeds only when exactly five contributors are returned, their usernames
 * match `EXPECTED_CONTRIBUTORS` position by position, and each has at least
 * 1000 commits. The extracted list is returned alongside the verdict.
 * `v3` is closed in every case.
 */
export const extract_collaborators: EvalFunction = async ({
  logger,
  debugUrl,
  sessionUrl,
  v3,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto("https://github.com/facebook/react");
    await v3.act("find and click the contributors section");

    await v3.act("scroll halfway down the page");

    const { contributors } = await v3.extract(
      "Extract top 5 contributors of this repository",
      z.object({
        contributors: z.array(
          z.object({
            github_username: z
              .string()
              .describe("the github username of the contributor"),
            commits: z.number().describe("number of commits contributed"),
          }),
        ),
      }),
    );

    const EXPECTED_CONTRIBUTORS = [
      "zpao",
      "gaearon",
      "sebmarkbage",
      "acdlite",
      "sophiebits",
    ];

    const sameCount = contributors.length === EXPECTED_CONTRIBUTORS.length;
    // Order matters: the i-th extracted contributor must be the i-th expected one.
    const allMatch =
      sameCount &&
      contributors.every(
        (contributor, index) =>
          EXPECTED_CONTRIBUTORS[index] === contributor.github_username &&
          contributor.commits >= 1000,
      );

    return {
      _success: allMatch,
      contributors,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    // A plain JSON round-trip turns an Error into `{}` because its name,
    // message and stack are not enumerable, so copy them explicitly to keep
    // the failure reason. Other thrown values are still cloned through JSON;
    // values JSON cannot represent (e.g. `undefined`) no longer make this
    // handler itself throw.
    const json = JSON.stringify(error);
    const cloned = json === undefined ? undefined : JSON.parse(json);
    return {
      _success: false,
      error:
        error instanceof Error
          ? {
              ...cloned,
              name: error.name,
              message: error.message,
              stack: error.stack,
            }
          : cloned,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/extract_csa.ts
================================================
import { EvalFunction } from "../types/evals.js";
import { z } from "zod";

/**
 * Eval task: extract every publication row (date, session type, publication
 * type, annotation) from the CSA eval site.
 *
 * Fails when fewer than 14 publications are returned, or when either of two
 * known rows (labelled 'first' and 'last') is missing from the result. The
 * known rows may appear at any index; all four fields must match exactly.
 * `v3` is closed in every case.
 */
export const extract_csa: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/csa/",
    );

    const { publications } = await v3.extract(
      "Extract all the publications on the page including the publication date, session type, publication type, and annotation",
      z.object({
        publications: z.array(
          z.object({
            publication_date: z.string(),
            session_type: z.string(),
            publication_type: z.string(),
            annotation: z.string(),
          }),
        ),
      }),
    );

    const minimumCount = 14;

    if (publications.length < minimumCount) {
      const countFailure = "Incorrect number of publications extracted";
      logger.error({
        message: countFailure,
        level: 0,
        auxiliary: {
          expected: {
            value: `>= ${minimumCount}`,
            type: "integer",
          },
          actual: {
            value: publications.length.toString(),
            type: "integer",
          },
        },
      });
      return {
        _success: false,
        error: countFailure,
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
      };
    }

    // Rows that must be present somewhere in the extraction, checked in order.
    const requiredItems = [
      {
        item: {
          publication_date: "11-30-2024",
          session_type: "Regular Session",
          publication_type: "Assembly Weekly History",
          annotation:
            "2024 -- This publication includes the complete histories of second-year bills. The complete electronic history of all bills is always available at leginfo.legislature.ca.gov",
        },
        failure: "Expected 'first' item not found in publications",
      },
      {
        item: {
          publication_date: "11-30-2016",
          session_type: "1st Extraordinary Session",
          publication_type: "Assembly Weekly History",
          annotation: "",
        },
        failure: "Expected 'last' item not found in publications",
      },
    ];

    for (const { item, failure } of requiredItems) {
      const isPresent = publications.some(
        (candidate) =>
          candidate.publication_date === item.publication_date &&
          candidate.session_type === item.session_type &&
          candidate.publication_type === item.publication_type &&
          candidate.annotation === item.annotation,
      );
      if (isPresent) {
        continue;
      }

      logger.error({
        message: failure,
        level: 0,
        auxiliary: {
          expected: {
            value: JSON.stringify(item),
            type: "object",
          },
          actual: {
            value: JSON.stringify(publications),
            type: "object",
          },
        },
      });
      return {
        _success: false,
        error: failure,
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
      };
    }

    return {
      _success: true,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } catch (error) {
    return {
      _success: false,
      error: error,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/extract_geniusee.ts
================================================
import { z } from "zod";
import { EvalFunction } from "../types/evals.js";

/**
 * Eval task: run an extraction scoped to the comparison table on the geniusee
 * eval site (via an XPath `selector`) and check the scalability comment
 * returned for "Gemini (Google)".
 *
 * Succeeds only when the extracted comment is exactly the expected string.
 * `v3` is closed in every case.
 */
export const extract_geniusee: EvalFunction = async ({
  logger,
  debugUrl,
  sessionUrl,
  v3,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/geniusee/",
    );

    // XPath of the whole table; passed to extract as its `selector` option.
    const tableXPath = "/html/body/main/div[2]/div[2]/div[2]/table";
    const extraction = await v3.extract(
      "Extract the scalability comment in the table for Gemini (Google)",
      z.object({
        scalability: z.string(),
      }),
      { selector: tableXPath },
    );

    const actualComment = extraction.scalability;
    const expectedComment = "Scalable architecture with API access";

    // Strict equality: both sides are strings, so no coercion is wanted.
    if (actualComment === expectedComment) {
      return {
        _success: true,
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
      };
    }

    logger.error({
      message: "extracted scalability comment does not match expected",
      level: 0,
      auxiliary: {
        expected: {
          value: expectedComment,
          type: "string",
        },
        actual: {
          value: actualComment,
          type: "string",
        },
      },
    });
    return {
      _success: false,
      error: "extracted scalability comment does not match expected",
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } catch (error) {
    return {
      _success: false,
      error: error,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/extract_geniusee_2.ts
================================================
import { z } from "zod";
import { EvalFunction } from "../types/evals.js";

/**
 * Eval task: negative check for selector-scoped extraction on the geniusee
 * eval site. The extraction is limited (via an XPath `selector`) to a single
 * table row, and the task fails if the returned comment equals a comment that
 * lives elsewhere in the table.
 *
 * `v3` is closed in every case.
 */
export const extract_geniusee_2: EvalFunction = async ({
  logger,
  debugUrl,
  sessionUrl,
  v3,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/geniusee/",
    );

    // XPath of one specific row; passed to extract as its `selector` option.
    const rowXPath = "/html/body/main/div[2]/div[2]/div[2]/table/tbody/tr[9]";
    const extraction = await v3.extract(
      "Extract the scalability comment in the table for Gemini (Google)",
      z.object({
        scalability: z.string(),
      }),
      { selector: rowXPath },
    );

    const actualComment = extraction.scalability;

    // This string is a scalability comment that appears in the table but NOT
    // inside the row selected above. If the targeted extract is scoped
    // correctly, the LLM never sees it, so getting it back means the selector
    // was not honoured.
    const forbiddenComment = "Scalable architecture with API access";

    // Strict equality: both sides are strings, so no coercion is wanted.
    if (actualComment === forbiddenComment) {
      logger.error({
        message:
          "extracted scalability comment matches the scalability comment that we SHOULD NOT get",
        level: 0,
        auxiliary: {
          expected: {
            value: forbiddenComment,
            type: "string",
          },
          actual: {
            value: actualComment,
            type: "string",
          },
        },
      });
      return {
        _success: false,
        error:
          "scalability comment matches the scalability comment that we SHOULD NOT get",
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
      };
    }

    return {
      _success: true,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } catch (error) {
    return {
      _success: false,
      error: error,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/extract_github_commits.ts
================================================
import { EvalFunction } from "../types/evals.js";
import { z } from "zod";

/**
 * Eval task: open the facebook/react repository on GitHub, navigate to the
 * commit history and extract the last 20 commits (message, URL, hash).
 *
 * Succeeds only when exactly 20 commits are returned. The extracted commits
 * are logged and also returned with the verdict. `v3` is closed in every case.
 */
export const extract_github_commits: EvalFunction = async ({
  logger,
  debugUrl,
  sessionUrl,
  v3,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto("https://github.com/facebook/react");

    await v3.act(
      "find commit history, generally described by the number of commits",
    );

    const commitSchema = z.object({
      commits: z.array(
        z.object({
          commit_message: z.string(),
          commit_url: z.string(),
          commit_hash: z.string(),
        }),
      ),
    });
    const { commits } = await v3.extract("Extract last 20 commits", commitSchema);

    logger.log({
      message: "Extracted commits",
      level: 1,
      auxiliary: {
        commits: {
          value: JSON.stringify(commits),
          type: "object",
        },
      },
    });

    const expectedCount = 20;
    return {
      _success: commits.length === expectedCount,
      commits,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    // A plain JSON round-trip turns an Error into `{}` because its name,
    // message and stack are not enumerable, so copy them explicitly to keep
    // the failure reason. Other thrown values are still cloned through JSON;
    // values JSON cannot represent (e.g. `undefined`) no longer make this
    // handler itself throw.
    const json = JSON.stringify(error);
    const cloned = json === undefined ? undefined : JSON.parse(json);
    return {
      _success: false,
      error:
        error instanceof Error
          ? {
              ...cloned,
              name: error.name,
              message: error.message,
              stack: error.stack,
            }
          : cloned,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/extract_github_stars.ts
================================================
import { EvalFunction } from "../types/evals.js";
import { z } from "zod";

/**
 * Eval task: extract the star count of facebook/react and compare it with the
 * value shown in the page's `#repo-stars-counter-star` element.
 *
 * The counter text may be abbreviated with a trailing "k" (thousands), so the
 * comparison allows a difference of up to 1000 stars. The extracted number is
 * returned with the verdict. `v3` is closed in every case.
 */
export const extract_github_stars: EvalFunction = async ({
  logger,
  debugUrl,
  sessionUrl,
  v3,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto("https://github.com/facebook/react");

    const { stars } = await v3.extract(
      "Extract the number of stars for the project",
      z.object({
        stars: z.number().describe("the number of stars for the project"),
      }),
    );

    const rawCounterText = await page
      .locator("#repo-stars-counter-star")
      .first()
      .innerHtml();
    // Trim first: surrounding whitespace in the markup would otherwise defeat
    // the suffix test and silently skip the thousands multiplier.
    const counterText = rawCounterText.trim();

    const isAbbreviated = counterText.toLowerCase().endsWith("k");
    const expectedStars = isAbbreviated
      ? parseFloat(counterText.slice(0, -1)) * 1000
      : parseFloat(counterText);

    // An unparsable counter yields NaN, which makes the comparison false and
    // therefore fails the eval rather than passing it.
    const tolerance = 1000;
    const isWithinTolerance = Math.abs(stars - expectedStars) <= tolerance;

    return {
      _success: isWithinTolerance,
      stars,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    // A plain JSON round-trip turns an Error into `{}` because its name,
    // message and stack are not enumerable, so copy them explicitly to keep
    // the failure reason. Other thrown values are still cloned through JSON;
    // values JSON cannot represent (e.g. `undefined`) no longer make this
    // handler itself throw.
    const json = JSON.stringify(error);
    const cloned = json === undefined ? undefined : JSON.parse(json);
    return {
      _success: false,
      error:
        error instanceof Error
          ? {
              ...cloned,
              name: error.name,
              message: error.message,
              stack: error.stack,
            }
          : cloned,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/extract_hamilton_weather.ts
================================================
import { EvalFunction } from "../types/evals.js";
import { z } from "zod";
import { compareStrings } from "../utils.js";

/**
 * Eval task: run an extraction scoped to one table (via an XPath `selector`)
 * on the hamilton-weather eval site and check the weather readings for
 * "Sun, Feb 23 at 11PM".
 *
 * Each of the six fields is compared with its expected value through
 * `compareStrings` using a 0.9 threshold; all must meet it. The extracted
 * data is returned with the verdict. `v3` is closed in every case.
 */
export const extract_hamilton_weather: EvalFunction = async ({
  logger,
  debugUrl,
  sessionUrl,
  v3,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/hamilton-weather/",
    );
    const tableXPath =
      "/html/body[1]/div[5]/main[1]/article[1]/div[6]/div[2]/div[1]/table[1]";

    const weatherData = await v3.extract(
      "extract the weather data for Sun, Feb 23 at 11PM",
      z.object({
        temperature: z.string(),
        weather_description: z.string(),
        wind: z.string(),
        humidity: z.string(),
        barometer: z.string(),
        visibility: z.string(),
      }),
      { selector: tableXPath },
    );

    const expectedWeatherData = {
      temperature: "27 °F",
      weather_description: "Light snow. Overcast.",
      wind: "6 mph",
      humidity: "93%",
      barometer: '30.07 "Hg',
      visibility: "10 mi",
    };

    const threshold = 0.9;
    const fieldsInOrder = [
      "temperature",
      "weather_description",
      "wind",
      "humidity",
      "barometer",
      "visibility",
    ] as const;

    // `every` stops at the first field that misses the threshold, just like
    // a chain of `&&` would.
    const isWeatherCorrect = fieldsInOrder.every(
      (field) =>
        compareStrings(
          weatherData[field],
          expectedWeatherData[field],
          threshold,
        ).meetsThreshold,
    );

    return {
      _success: isWeatherCorrect,
      weatherData,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    // A plain JSON round-trip turns an Error into `{}` because its name,
    // message and stack are not enumerable, so copy them explicitly to keep
    // the failure reason. Other thrown values are still cloned through JSON;
    // values JSON cannot represent (e.g. `undefined`) no longer make this
    // handler itself throw.
    const json = JSON.stringify(error);
    const cloned = json === undefined ? undefined : JSON.parse(json);
    return {
      _success: false,
      error:
        error instanceof Error
          ? {
              ...cloned,
              name: error.name,
              message: error.message,
              stack: error.stack,
            }
          : cloned,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/extract_jfk_links.ts
================================================
import { EvalFunction } from "../types/evals.js";
import { z } from "zod";

/**
 * Eval task: extract every record file name and its link from the JFK eval
 * site.
 *
 * Succeeds only when exactly 10 records are returned and each of the 10
 * expected (file name, link) pairs appears among them. On a content mismatch
 * the missing and extracted records are included in the result for
 * inspection. `v3` is closed in every case.
 */
export const extract_jfk_links: EvalFunction = async ({
  logger,
  debugUrl,
  sessionUrl,
  v3,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/jfk/",
    );

    const extraction = await v3.extract(
      "extract all the record file name and their corresponding links",
      z.object({
        records: z.array(
          z.object({
            file_name: z.string().describe("the file name of the record"),
            link: z.string().url(),
          }),
        ),
      }),
    );

    // The list of records we expect to see
    const expectedRecords = [
      {
        file_name: "104-10003-10041.pdf",
        link: "https://www.archives.gov/files/research/jfk/releases/2025/0318/104-10003-10041.pdf",
      },
      {
        file_name: "104-10004-10143 (C06932208).pdf",
        link: "https://www.archives.gov/files/research/jfk/releases/2025/0318/104-10004-10143%20(C06932208).pdf",
      },
      {
        file_name: "104-10004-10143.pdf",
        link: "https://www.archives.gov/files/research/jfk/releases/2025/0318/104-10004-10143.pdf",
      },
      {
        file_name: "104-10004-10156.pdf",
        link: "https://www.archives.gov/files/research/jfk/releases/2025/0318/104-10004-10156.pdf",
      },
      {
        file_name: "104-10004-10213.pdf",
        link: "https://www.archives.gov/files/research/jfk/releases/2025/0318/104-10004-10213.pdf",
      },
      {
        file_name: "104-10005-10321.pdf",
        link: "https://www.archives.gov/files/research/jfk/releases/2025/0318/104-10005-10321.pdf",
      },
      {
        file_name: "104-10006-10247.pdf",
        link: "https://www.archives.gov/files/research/jfk/releases/2025/0318/104-10006-10247.pdf",
      },
      {
        file_name: "104-10007-10345.pdf",
        link: "https://www.archives.gov/files/research/jfk/releases/2025/0318/104-10007-10345.pdf",
      },
      {
        file_name: "104-10009-10021.pdf",
        link: "https://www.archives.gov/files/research/jfk/releases/2025/0318/104-10009-10021.pdf",
      },
      {
        file_name: "104-10009-10222.pdf",
        link: "https://www.archives.gov/files/research/jfk/releases/2025/0318/104-10009-10222.pdf",
      },
    ];

    const extractedRecords = extraction.records;

    // The count is checked first: a wrong-sized extraction fails regardless
    // of which records it contains.
    if (extractedRecords.length !== 10) {
      return {
        _success: false,
        reason: `Extraction has ${extractedRecords.length} records (expected 10).`,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }

    // Expected records with no exact (file_name, link) match in the extraction.
    const missingRecords = expectedRecords.filter(
      (wanted) =>
        !extractedRecords.some(
          (got) =>
            got.file_name === wanted.file_name && got.link === wanted.link,
        ),
    );

    if (missingRecords.length > 0) {
      return {
        _success: false,
        reason: "Missing one or more expected records.",
        missingRecords,
        extractedRecords,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }

    // Correct count and every expected record present.
    return {
      _success: true,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    // A plain JSON round-trip turns an Error into `{}` because its name,
    // message and stack are not enumerable, so copy them explicitly to keep
    // the failure reason. Other thrown values are still cloned through JSON;
    // values JSON cannot represent (e.g. `undefined`) no longer make this
    // handler itself throw.
    const json = JSON.stringify(error);
    const cloned = json === undefined ? undefined : JSON.parse(json);
    return {
      _success: false,
      error:
        error instanceof Error
          ? {
              ...cloned,
              name: error.name,
              message: error.message,
              stack: error.stack,
            }
          : cloned,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/extract_jstor_news.ts
================================================
import { EvalFunction } from "../types/evals.js";
import { z } from "zod";

/**
 * Eval task: dismiss the cookie prompt on the JSTOR eval site, then extract
 * all news report titles with their publish dates.
 *
 * Succeeds only when exactly 10 reports are returned and both the first and
 * the last report match their expected title and date exactly. The first
 * failing check is logged and ends the task. `v3` is closed in every case.
 */
export const extract_jstor_news: EvalFunction = async ({
  logger,

  debugUrl,
  sessionUrl,
  v3,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/jstor/",
      {
        waitUntil: "load",
      },
    );
    await v3.act("close the cookie");

    const { reports } = await v3.extract(
      "Extract ALL the news report titles and their dates.",
      z.object({
        reports: z.array(
          z.object({
            report_name: z
              .string()
              .describe("The name or title of the news report."),
            publish_date: z
              .string()
              .describe("The date the news report was published."),
          }),
        ),
      }),
    );

    const requiredCount = 10;

    if (reports.length !== requiredCount) {
      const countFailure = "Incorrect number of reports extracted";
      logger.error({
        message: countFailure,
        level: 0,
        auxiliary: {
          expected: {
            value: requiredCount.toString(),
            type: "integer",
          },
          actual: {
            value: reports.length.toString(),
            type: "integer",
          },
        },
      });
      return {
        _success: false,
        error: countFailure,
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
      };
    }

    // Positional checks, run in order. The length check above guarantees that
    // both indexed reports exist.
    const positionalChecks = [
      {
        actual: reports[0],
        expected: {
          report_name: "JSTOR retires Publisher Sales Service",
          publish_date: "December 9, 2024",
        },
        failure: "First report extracted does not match expected",
      },
      {
        actual: reports[reports.length - 1],
        expected: {
          report_name: "Path to Open announces 2024 titles",
          publish_date: "May 10, 2024",
        },
        failure: "Last report extracted does not match expected",
      },
    ];

    for (const { actual, expected, failure } of positionalChecks) {
      const isMatch =
        actual.report_name === expected.report_name &&
        actual.publish_date === expected.publish_date;
      if (isMatch) {
        continue;
      }

      logger.error({
        message: failure,
        level: 0,
        auxiliary: {
          expected: {
            value: JSON.stringify(expected),
            type: "object",
          },
          actual: {
            value: JSON.stringify(actual),
            type: "object",
          },
        },
      });
      return {
        _success: false,
        error: failure,
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
      };
    }

    return {
      _success: true,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } catch (error) {
    return {
      _success: false,
      error: error,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/extract_memorial_healthcare.ts
================================================
import { EvalFunction } from "../types/evals.js";
import { z } from "zod";
import { compareStrings } from "../utils.js";

/**
 * Eval task: extract the first three healthcare centers (name, phone number,
 * address) from the mycmh eval site.
 *
 * Checks, in order:
 *  1. exactly three centers were returned;
 *  2. every center has a non-empty name, phone number and address;
 *  3. the first and last centers match their expected values, field by field,
 *     through `compareStrings` with a 0.85 threshold.
 *
 * Each failed check is logged. `v3` is closed in every case.
 */
export const extract_memorial_healthcare: EvalFunction = async ({
  logger,

  debugUrl,
  sessionUrl,
  v3,
}) => {
  type HealthCenter = { name: string; phone_number: string; address: string };

  try {
    const page = v3.context.pages()[0];
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/mycmh/",
    );

    const result = await v3.extract(
      "extract a list of the first three healthcare centers on this page, with their name, full address, and phone number",
      z.object({
        health_centers: z.array(
          z.object({
            name: z.string(),
            phone_number: z.string(),
            address: z.string(),
          }),
        ),
      }),
    );

    // Treated as possibly incomplete so empty fields are validated explicitly.
    const extractedCenters: Array<Partial<HealthCenter>> =
      result.health_centers;

    const expectedLength = 3;
    const similarityThreshold = 0.85;

    if (extractedCenters.length !== expectedLength) {
      logger.error({
        message: "Incorrect number of health centers extracted",
        level: 0,
        auxiliary: {
          expected: {
            value: expectedLength.toString(),
            type: "integer",
          },
          actual: {
            value: extractedCenters.length.toString(),
            type: "integer",
          },
        },
      });

      return {
        _success: false,
        error: "Incorrect number of health centers extracted",
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
      };
    }

    // A center is complete when all three fields are present and non-empty.
    const isComplete = (
      candidate: Partial<HealthCenter>,
    ): candidate is HealthCenter =>
      Boolean(candidate.name && candidate.phone_number && candidate.address);

    const completeCenters: HealthCenter[] = [];
    for (const candidate of extractedCenters) {
      if (isComplete(candidate)) {
        completeCenters.push(candidate);
        continue;
      }
      logger.error({
        message: "Invalid health center data",
        level: 0,
        auxiliary: {
          center: { value: JSON.stringify(candidate), type: "object" },
        },
      });
    }

    if (completeCenters.length < expectedLength) {
      return {
        _success: false,
        error: "One or more health centers have missing fields",
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
      };
    }

    // Compares one center with its expectation, field by field. Stops at and
    // logs the first field that misses the similarity threshold.
    const itemMatches = (
      actualCenter: HealthCenter,
      expectedCenter: HealthCenter,
      position: string,
    ): boolean => {
      for (const field of ["name", "phone_number", "address"] as const) {
        const actualValue = actualCenter[field];
        const expectedValue = expectedCenter[field];
        const { similarity, meetsThreshold } = compareStrings(
          actualValue,
          expectedValue,
          similarityThreshold,
        );
        if (meetsThreshold) {
          continue;
        }

        const fieldLabel = `${position} ${field}`;
        logger.error({
          message: `Field "${fieldLabel}" does not meet similarity threshold`,
          level: 0,
          auxiliary: {
            field: { value: fieldLabel, type: "string" },
            similarity: { value: similarity.toFixed(2), type: "float" },
            expected: { value: expectedValue, type: "string" },
            actual: { value: actualValue, type: "string" },
          },
        });
        return false;
      }
      return true;
    };

    // Both comparisons always run, so mismatches in either item get logged.
    const firstItemMatches = itemMatches(
      completeCenters[0],
      {
        name: "Community Memorial Breast Center",
        phone_number: "805-948-5093",
        address: "168 North Brent Street, Suite 401, Ventura, CA 93003",
      },
      "First",
    );
    const lastItemMatches = itemMatches(
      completeCenters[completeCenters.length - 1],
      {
        name: "Community Memorial Dermatology and Mohs Surgery",
        phone_number: "805-948-6920",
        address: "168 North Brent Street, Suite 403, Ventura, CA 93003",
      },
      "Last",
    );

    if (firstItemMatches && lastItemMatches) {
      return {
        _success: true,
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
      };
    }

    return {
      _success: false,
      error: "One or more fields do not match expected values",
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } catch (error) {
    return {
      _success: false,
      error: error,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/extract_nhl_stats.ts
================================================
import { EvalFunction } from "../types/evals.js";
import { normalizeString } from "../utils.js";
import { z } from "zod";

/**
 * Eval task: opens a hockeydb league-leaders page, extracts the goal-scoring
 * leader (name, goal count, team) and compares each field with the known
 * answer after passing both sides through `normalizeString`.
 *
 * Fields are verified in order (name, goals, team). The first mismatch is
 * logged and reported as the failure reason. Any thrown error is returned as a
 * failed result, and `v3` is closed in every case.
 */
export const extract_nhl_stats: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto(
      "https://www.hockeydb.com/ihdb/stats/top_league.php?lid=nhl1927&sid=1990",
      { waitUntil: "domcontentloaded" },
    );

    const leader = await v3.extract(
      "Extract the name of the goal scoring leader, their number of goals they scored, and the team they played for.",
      z.object({
        name: z.string(),
        num_goals: z.string(),
        team: z.string(),
      }),
    );

    // One row per verified field; `failure` doubles as log message and
    // returned error text.
    const checks = [
      {
        failure: "Player name extracted does not match expected",
        actual: leader.name,
        expected: "Brett Hull",
      },
      {
        failure: "Number of goals extracted does not match expected",
        actual: leader.num_goals,
        expected: "72",
      },
      {
        failure: "Player team extracted does not match expected",
        actual: leader.team,
        expected: "St. Louis",
      },
    ];

    for (const check of checks) {
      const actualNormalized = normalizeString(check.actual);
      const expectedNormalized = normalizeString(check.expected);
      if (actualNormalized === expectedNormalized) {
        continue;
      }

      logger.error({
        message: check.failure,
        level: 0,
        auxiliary: {
          expected: { value: expectedNormalized, type: "string" },
          actual: { value: actualNormalized, type: "string" },
        },
      });
      return {
        _success: false,
        error: check.failure,
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
      };
    }

    return {
      _success: true,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } catch (error) {
    return {
      _success: false,
      error,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/extract_partners.ts
================================================
import { EvalFunction } from "../types/evals.js";
import { z } from "zod";

/**
 * Eval task: navigates ramp.com to its partners page via three `act` steps,
 * extracts the partner categories and succeeds when every expected category
 * is present (case-insensitive comparison).
 *
 * On failure the thrown value is logged and returned in a JSON-safe form.
 * `v3` is closed in every case.
 */
export const extract_partners: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto("https://ramp.com");

    await v3.act("scroll to the bottom of the page");

    await v3.act("Close the popup.");

    await v3.act("click on the link that leads to the partners page.");

    const partners = await v3.extract(
      `Extract all of the partner categories on the page.`,
      z.object({
        partners: z.array(
          z.object({
            partner_category: z.string().describe("The partner category"),
          }),
        ),
        explanation: z
          .string()
          .optional()
          .describe("Any explanation about partner listing or absence thereof"),
      }),
    );

    const expectedPartners = [
      "Accounting Partners",
      "Private Equity & Venture Capital Partners",
      "Services Partners",
      "Affiliates",
    ];

    const foundPartners = partners.partners.map((partner) =>
      partner.partner_category.toLowerCase(),
    );

    const allExpectedPartnersFound = expectedPartners.every((partner) =>
      foundPartners.includes(partner.toLowerCase()),
    );

    return {
      _success: allExpectedPartnersFound,
      partners,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    // Anything can be thrown (including null/undefined), so narrow before
    // touching `.message` / `.stack`.
    logger.error({
      message: "error in extractPartners function",
      level: 0,
      auxiliary: {
        error: {
          value: error instanceof Error ? error.message : String(error),
          type: "string",
        },
        trace: {
          value: error instanceof Error ? error.stack : undefined,
          type: "string",
        },
      },
    });

    // Error's name/message/stack are non-enumerable, so a bare JSON round-trip
    // would collapse any thrown Error to `{}`; copy them explicitly.
    const serializableError =
      error instanceof Error
        ? {
            ...error,
            name: error.name,
            message: error.message,
            stack: error.stack,
          }
        : error;

    return {
      _success: false,
      debugUrl,
      sessionUrl,
      // JSON.stringify yields undefined for undefined/functions/symbols, which
      // JSON.parse would reject; fall back to JSON null.
      error: JSON.parse(JSON.stringify(serializableError) ?? "null"),
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/extract_press_releases.ts
================================================
import { EvalFunction } from "../types/evals.js";
import { z } from "zod";
import { compareStrings } from "../utils.js";

/**
 * Eval task: loads the press-releases eval site, waits five seconds, extracts
 * every press release (title + publish date) and succeeds when:
 *   - more than 28 items were extracted, and
 *   - both reference releases are found somewhere in the list, with title and
 *     date each meeting a 0.9 `compareStrings` threshold.
 *
 * Thrown errors are logged and reported as a generic extraction failure.
 * `v3` is closed in every case.
 */
export const extract_press_releases: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  const pressReleaseSchema = z.object({
    items: z.array(
      z.object({
        title: z.string().describe("The title of the press release"),
        publish_date: z
          .string()
          .describe("The date the press release was published"),
      }),
    ),
  });

  type PressRelease = z.infer<typeof pressReleaseSchema>["items"][number];

  try {
    const page = v3.context.pages()[0];
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/press-releases/",
    );
    // Fixed pause before extracting.
    await new Promise((resolve) => setTimeout(resolve, 5000));

    const extracted = await v3.extract(
      "extract the title and corresponding publish date of EACH AND EVERY press releases on this page. DO NOT MISS ANY PRESS RELEASES.",
      pressReleaseSchema,
    );

    // Re-validate the extraction result against the schema before using it.
    const { items } = pressReleaseSchema.parse(extracted);

    const expectedLength = 28;
    const referenceFirst: PressRelease = {
      title: "UAW Region 9A Endorses Brad Lander for Mayor",
      publish_date: "Dec 4, 2024",
    };
    const referenceLast: PressRelease = {
      title: "Fox Sued by New York City Pension Funds Over Election Falsehoods",
      publish_date: "Nov 12, 2023",
    };

    if (items.length <= expectedLength) {
      const tooFew = "Not enough items extracted";
      logger.error({
        message: tooFew,
        level: 0,
        auxiliary: {
          expected: {
            value: `> ${expectedLength}`,
            type: "string",
          },
          actual: {
            value: items.length.toString(),
            type: "integer",
          },
        },
      });
      return {
        _success: false,
        error: tooFew,
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
      };
    }

    // True when some extracted item matches `target` on both title and date.
    const containsRelease = (target: PressRelease): boolean =>
      items.some((candidate) => {
        const titleResult = compareStrings(candidate.title, target.title, 0.9);
        const dateResult = compareStrings(
          candidate.publish_date,
          target.publish_date,
          0.9,
        );
        return titleResult.meetsThreshold && dateResult.meetsThreshold;
      });

    const hasFirst = containsRelease(referenceFirst);
    const hasLast = containsRelease(referenceLast);

    return {
      _success: hasFirst && hasLast,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } catch (error) {
    const thrown = error as Error;
    logger.error({
      message: `Error in extract_press_releases function`,
      level: 0,
      auxiliary: {
        error: {
          value: thrown.message || JSON.stringify(error),
          type: "string",
        },
        trace: {
          value: thrown.stack,
          type: "string",
        },
      },
    });
    return {
      _success: false,
      error: "An error occurred during extraction",
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/extract_professional_info.ts
================================================
import { EvalFunction } from "../types/evals.js";
import { normalizeString } from "../utils.js";
import { z } from "zod";

/**
 * Eval task: loads the professional-info eval site, extracts the
 * professional's practices, phone and fax, and compares each with the known
 * answer after `normalizeString` normalization (practices are compared as an
 * ordered list).
 *
 * The first mismatch is logged and reported as the failure reason. Any thrown
 * error is returned as a failed result. `v3` is closed exactly once, in the
 * `finally` block.
 */
export const extract_professional_info: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/professional-info/",
    );

    const result = await v3.extract(
      "Extract the list of Practices, phone number, and fax number of the professional.",
      z.object({
        practices: z.array(z.string()),
        phone: z.string(),
        fax: z.string(),
      }),
    );

    // No explicit close here: the `finally` block below closes `v3` on every
    // path, so closing at this point would close it twice.

    const { practices, phone, fax } = result;

    const expected = {
      practices: [
        "Restructuring",
        "Finance",
        "Hybrid Capital & Special Situations",
        "Private Credit",
      ],
      phone: "+1-212-373-3262",
      fax: "+1-212-492-0262",
    };

    // Order-sensitive comparison of the normalized practice lists.
    if (
      JSON.stringify(practices.map(normalizeString)) !==
      JSON.stringify(expected.practices.map(normalizeString))
    ) {
      logger.error({
        message: "Practices extracted do not match expected",
        level: 0,
        auxiliary: {
          expected: {
            value: JSON.stringify(expected.practices),
            type: "object",
          },
          actual: {
            value: JSON.stringify(practices),
            type: "object",
          },
        },
      });
      return {
        _success: false,
        error: "Practices extracted do not match expected",
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
      };
    }

    if (normalizeString(phone) !== normalizeString(expected.phone)) {
      logger.error({
        message: "Phone number extracted does not match expected",
        level: 0,
        auxiliary: {
          expected: {
            value: normalizeString(expected.phone),
            type: "string",
          },
          actual: {
            value: normalizeString(phone),
            type: "string",
          },
        },
      });
      return {
        _success: false,
        error: "Phone number extracted does not match expected",
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
      };
    }

    if (normalizeString(fax) !== normalizeString(expected.fax)) {
      logger.error({
        message: "Fax number extracted does not match expected",
        level: 0,
        auxiliary: {
          expected: {
            value: normalizeString(expected.fax),
            type: "string",
          },
          actual: {
            value: normalizeString(fax),
            type: "string",
          },
        },
      });
      return {
        _success: false,
        error: "Fax number extracted does not match expected",
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
      };
    }

    return {
      _success: true,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } catch (error) {
    return {
      _success: false,
      error: error,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/extract_public_notices.ts
================================================
import { EvalFunction } from "../types/evals.js";
import { z } from "zod";
import { compareStrings } from "../utils.js";

/**
 * Eval task: loads the SARS eval site, extracts all public notices
 * (description, GG number, publication date) and succeeds when:
 *   - exactly 24 notices were extracted, and
 *   - the first and last notices match the reference entries, with every
 *     field meeting a 0.9 `compareStrings` threshold.
 *
 * The first failed check is logged and reported as the failure reason. Any
 * thrown error is returned as a failed result. `v3` is closed in every case.
 */
export const extract_public_notices: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/sars/",
      { waitUntil: "load" },
    );

    const result = await v3.extract(
      "Extract ALL the public notice descriptions with their corresponding, GG number and publication date. Extract ALL notices from 2024 through 2020. Do not include the Notice number.",
      z.object({
        public_notices: z.array(
          z.object({
            notice_description: z
              .string()
              .describe(
                "the description of the notice. Do not include the Notice number",
              ),
            gg_number: z
              .string()
              .describe("the GG number of the notice. For example, GG 12345"),
            publication_date: z
              .string()
              .describe(
                "the publication date of the notice. For example, 8 December 2021",
              ),
          }),
        ),
      }),
    );

    const publicNotices = result.public_notices;
    const expectedLength = 24;

    const expectedFirstItem = {
      notice_description:
        "Additional considerations in terms of section 80(2) in respect of which an application for a binding private ruling or a binding class ruling may be rejected",
      gg_number: "GG 51526",
      publication_date: "8 November 2024",
    };

    const expectedLastItem = {
      notice_description:
        "Notice in terms of section 25, read with section 66(1) of the Income Tax Act, 1962, for submission of 2020 income tax returns",
      gg_number: "GG 43495",
      publication_date: "3 July 2020",
    };

    if (publicNotices.length !== expectedLength) {
      logger.error({
        message: "Incorrect number of public notices extracted",
        level: 0,
        auxiliary: {
          expected: {
            value: expectedLength.toString(),
            type: "integer",
          },
          actual: {
            value: publicNotices.length.toString(),
            type: "integer",
          },
        },
      });
      return {
        _success: false,
        error: "Incorrect number of public notices extracted",
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
      };
    }

    type PublicNotice = typeof expectedFirstItem;
    const similarityThreshold = 0.9;

    // `compareStrings` returns a result object (other eval tasks read its
    // `meetsThreshold` flag). The object itself is always truthy, so the
    // verdict must be taken from `meetsThreshold`; otherwise these checks
    // can never fail.
    const noticeMatches = (
      actual: PublicNotice,
      expected: PublicNotice,
    ): boolean =>
      compareStrings(
        actual.notice_description,
        expected.notice_description,
        similarityThreshold,
      ).meetsThreshold &&
      compareStrings(actual.gg_number, expected.gg_number, similarityThreshold)
        .meetsThreshold &&
      compareStrings(
        actual.publication_date,
        expected.publication_date,
        similarityThreshold,
      ).meetsThreshold;

    // The length check above guarantees both the first and last entries exist.
    const firstNotice = publicNotices[0];
    if (!noticeMatches(firstNotice, expectedFirstItem)) {
      logger.error({
        message: "First public notice extracted does not match expected",
        level: 0,
        auxiliary: {
          expected: {
            value: JSON.stringify(expectedFirstItem),
            type: "object",
          },
          actual: {
            value: JSON.stringify(firstNotice),
            type: "object",
          },
        },
      });
      return {
        _success: false,
        error: "First public notice extracted does not match expected",
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
      };
    }

    const lastNotice = publicNotices[publicNotices.length - 1];
    if (!noticeMatches(lastNotice, expectedLastItem)) {
      logger.error({
        message: "Last public notice extracted does not match expected",
        level: 0,
        auxiliary: {
          expected: {
            value: JSON.stringify(expectedLastItem),
            type: "object",
          },
          actual: {
            value: JSON.stringify(lastNotice),
            type: "object",
          },
        },
      });
      return {
        _success: false,
        error: "Last public notice extracted does not match expected",
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
      };
    }

    return {
      _success: true,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } catch (error) {
    return {
      _success: false,
      error: error,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/extract_recipe.ts
================================================
import { EvalFunction } from "../types/evals.js";
import { z } from "zod";

/**
 * Eval task: loads the allrecipes eval site and, scoped to a fixed XPath
 * selector, extracts two quantities: tablespoons of olive oil for the steak
 * and teaspoons of lemon juice for the mushroom pan sauce. Succeeds when both
 * equal 2.
 *
 * Every mismatching quantity is collected and logged together. Any thrown
 * error is returned as a failed result. `v3` is closed in every case.
 */
export const extract_recipe: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/allrecipes-extract/",
      {
        waitUntil: "domcontentloaded",
      },
    );

    // Restricts extraction to this element of the page.
    const selector = "/html/body/main/article/div[3]/div[3]/div[4]";
    const recipeDetails = await v3.extract(
      "Extract the title of the number of tablespoons of olive oil needed for the steak, and the number of teaspoons of lemon juice needed for the mushroom pan sauce.",
      z.object({
        tablespoons_olive_oil: z
          .number()
          .describe(
            "the number of tablespoons of olive oil needed for the steak",
          ),
        teaspoons_lemon_juice: z
          .number()
          .describe(
            "the number of teaspoons of lemon juice needed for the mushroom pan sauce",
          ),
      }),
      { selector: selector },
    );

    const { tablespoons_olive_oil, teaspoons_lemon_juice } = recipeDetails;
    const expectedTablespoons = 2;
    const expectedTeaspoons = 2;

    if (
      tablespoons_olive_oil !== expectedTablespoons ||
      teaspoons_lemon_juice !== expectedTeaspoons
    ) {
      const errors: { message: string; expected: string; actual: string }[] =
        [];
      if (tablespoons_olive_oil !== expectedTablespoons) {
        errors.push({
          // Previously read "do not match the extracted ...", comparing the
          // value with itself; the comparison is against the expected value.
          message:
            "Extracted tablespoons of olive oil do not match the expected tablespoons of olive oil",
          expected: expectedTablespoons.toString(),
          actual: tablespoons_olive_oil.toString(),
        });
      }
      if (teaspoons_lemon_juice !== expectedTeaspoons) {
        errors.push({
          message:
            "Extracted teaspoons of lemon juice do not match the expected teaspoons of lemon juice",
          expected: expectedTeaspoons.toString(),
          actual: teaspoons_lemon_juice.toString(),
        });
      }

      logger.error({
        message: "Failed to extract correct recipe details",
        level: 0,
        auxiliary: {
          errors: {
            value: JSON.stringify(errors),
            type: "object",
          },
        },
      });

      return {
        _success: false,
        error: "Recipe details extraction validation failed",
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
      };
    }

    return {
      _success: true,
      // Both values equal their expected counterparts at this point.
      recipeDetails: {
        tablespoons_olive_oil: expectedTablespoons,
        teaspoons_lemon_juice: expectedTeaspoons,
      },
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } catch (error) {
    return {
      _success: false,
      error: error,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/extract_regulations_table.ts
================================================
import { EvalFunction } from "../types/evals.js";
import { z } from "zod";

/**
 * Eval task: loads the NCC numbering-plan eval site and, scoped to the table
 * at a fixed XPath, extracts every allottee row (name, area, area code,
 * access code). Succeeds when there are exactly 25 rows and the first and
 * last rows serialize identically to the reference rows.
 *
 * On failure the thrown value is returned in a JSON-safe form. `v3` is closed
 * in every case.
 */
export const extract_regulations_table: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/ncc-numbering-plan/",
    );

    const xpath =
      "/html/body/div[3]/main/div[2]/div[2]/div/div/div[2]/article/div[2]/div[1]/div/table";

    const allottees = await v3.extract(
      "Extract ALL of the Allottees and their corresponding name, area, and area code.",
      z.object({
        allottee_list: z.array(
          z.object({
            allottee_name: z.string(),
            area: z.string(),
            area_code: z.string(),
            access_code: z.string(),
          }),
        ),
      }),
      { selector: xpath },
    );

    // Reference values for the first and last table rows.
    const allottees_expected_first = {
      allottee_name: "101 Communications Limited",
      area: "Lagos",
      area_code: "0201",
      access_code: "249",
    };

    const allottees_expected_last = {
      allottee_name: "Airtel Networks Limited",
      area: "National",
      area_code: "0708",
      access_code: "708",
    };

    const expected_length = 25;

    const allotteeList = allottees.allottee_list;

    // Check that the first entry, last entry, and total number match
    // expectations. The JSON comparison is sensitive to key order, so the
    // reference objects list their keys in the same order as the schema.
    const isFirstCorrect =
      JSON.stringify(allotteeList[0]) ===
      JSON.stringify(allottees_expected_first);
    const isLastCorrect =
      JSON.stringify(allotteeList[allotteeList.length - 1]) ===
      JSON.stringify(allottees_expected_last);
    const isLengthCorrect = allotteeList.length === expected_length;

    const isRegulationsCorrect =
      isFirstCorrect && isLastCorrect && isLengthCorrect;

    return {
      _success: isRegulationsCorrect,
      regulationsData: allottees,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    // Error's name/message/stack are non-enumerable, so a bare JSON round-trip
    // would collapse any thrown Error to `{}`; copy them explicitly.
    const serializableError =
      error instanceof Error
        ? {
            ...error,
            name: error.name,
            message: error.message,
            stack: error.stack,
          }
        : error;

    return {
      _success: false,
      // JSON.stringify yields undefined for undefined/functions/symbols, which
      // JSON.parse would reject; fall back to JSON null.
      error: JSON.parse(JSON.stringify(serializableError) ?? "null"),
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/extract_repo_name.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval task: opens the facebook/react GitHub page, asks for the repository
 * title (without the owner) using a schema-less `extract`, and succeeds when
 * the returned `extraction` is exactly "react".
 *
 * On failure the thrown value is returned in a JSON-safe form. `v3` is closed
 * in every case.
 */
export const extract_repo_name: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto("https://github.com/facebook/react");

    const { extraction } = await v3.extract(
      "extract the title of the Github repository. Do not include the owner of the repository.",
    );

    logger.log({
      message: "Extracted repo title",
      level: 1,
      auxiliary: {
        repo_name: {
          value: extraction,
          type: "object",
        },
      },
    });

    return {
      _success: extraction === "react",
      extraction,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    // Error's name/message/stack are non-enumerable, so a bare JSON round-trip
    // would collapse any thrown Error to `{}`; copy them explicitly.
    const serializableError =
      error instanceof Error
        ? {
            ...error,
            name: error.name,
            message: error.message,
            stack: error.stack,
          }
        : error;

    return {
      _success: false,
      // JSON.stringify yields undefined for undefined/functions/symbols, which
      // JSON.parse would reject; fall back to JSON null.
      error: JSON.parse(JSON.stringify(serializableError) ?? "null"),
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/extract_resistor_info.ts
================================================
import { EvalFunction } from "../types/evals.js";
import { normalizeString } from "../utils.js";
import { z } from "zod";

/**
 * Eval task: loads the resistor eval site, extracts four specification fields
 * (manufacturer standard lead time, tolerance percentage, resistance,
 * operating temperature range) and compares each with the known answer after
 * passing both sides through `normalizeString`.
 *
 * Fields are verified in the order listed. The first mismatch is logged and
 * reported as the failure reason. Any thrown error is returned as a failed
 * result, and `v3` is closed in every case.
 */
export const extract_resistor_info: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/resistor/",
    );

    const specs = await v3.extract(
      "Extract the manufacturer standard lead time, tolerance percentage, resistance, and operating temperature range of the resistor.",
      z.object({
        manufacturer_standard_lead_time: z.string(),
        tolerance_percentage: z.string(),
        resistance: z.string(),
        operating_temperature_range: z.string(),
      }),
    );

    // One row per verified field; `failure` doubles as log message and
    // returned error text.
    const checks = [
      {
        failure:
          "manufacturer standard lead time extracted does not match expected",
        actual: specs.manufacturer_standard_lead_time,
        expected: "11 Weeks",
      },
      {
        failure: "Tolerance percentage extracted does not match expected",
        actual: specs.tolerance_percentage,
        expected: "±5",
      },
      {
        failure: "resistance extracted does not match expected",
        actual: specs.resistance,
        expected: "330 ohms",
      },
      {
        failure:
          "Operating temperature range extracted does not match expected",
        actual: specs.operating_temperature_range,
        expected: "-55°C ~ 155°C",
      },
    ];

    for (const check of checks) {
      const actualNormalized = normalizeString(check.actual);
      const expectedNormalized = normalizeString(check.expected);
      if (actualNormalized === expectedNormalized) {
        continue;
      }

      logger.error({
        message: check.failure,
        level: 0,
        auxiliary: {
          expected: { value: expectedNormalized, type: "string" },
          actual: { value: actualNormalized, type: "string" },
        },
      });
      return {
        _success: false,
        error: check.failure,
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
      };
    }

    return {
      _success: true,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } catch (error) {
    return {
      _success: false,
      error,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/extract_rockauto.ts
================================================
import { EvalFunction } from "../types/evals.js";
import { z } from "zod";

/**
 * Eval task: loads the rockauto eval site, waits five seconds, and extracts
 * the part numbers of the 'economy' coolant/antifreeze products. Succeeds
 * when exactly five products were extracted and every reference part number
 * appears among them.
 *
 * A wrong count or any missing part number is logged and reported as the
 * failure reason. Any thrown error is returned as a failed result, and `v3`
 * is closed in every case.
 */
export const extract_rockauto: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/rockauto/",
    );
    // Fixed pause before extracting.
    await new Promise((resolve) => setTimeout(resolve, 5000));

    const { coolant_products: coolantProducts } = await v3.extract(
      "Extract the part number of all the coolant and antifreeze products in the 'economy' category. " +
        "Do not include the manufacturer name. Do not include products from the premium category.",
      z.object({
        coolant_products: z.array(
          z.object({
            part_number: z.string(),
          }),
        ),
      }),
    );

    const expectedPartNumbers = [
      "GREEN5050GAL",
      "719009",
      "AF3300",
      "AF3100",
      "MV5050GAL",
    ];
    const expectedLength = expectedPartNumbers.length;

    if (coolantProducts.length !== expectedLength) {
      const wrongCount = "Incorrect number of coolant products extracted";
      logger.error({
        message: wrongCount,
        level: 0,
        auxiliary: {
          expected: {
            value: expectedLength.toString(),
            type: "integer",
          },
          actual: {
            value: coolantProducts.length.toString(),
            type: "integer",
          },
        },
      });
      return {
        _success: false,
        error: wrongCount,
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
      };
    }

    // A reference part is missing when no extracted product carries it.
    const missingParts = expectedPartNumbers.filter((wanted) =>
      coolantProducts.every((product) => product.part_number !== wanted),
    );

    if (missingParts.length > 0) {
      logger.error({
        message: "Missing expected part number(s)",
        level: 0,
        auxiliary: {
          missingParts: {
            value: JSON.stringify(missingParts),
            type: "object",
          },
          actualExtracted: {
            value: JSON.stringify(coolantProducts),
            type: "object",
          },
        },
      });
      return {
        _success: false,
        error: `One or more expected part numbers were not found: ${missingParts.join(", ")}`,
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
      };
    }

    return {
      _success: true,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } catch (error) {
    return {
      _success: false,
      error,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/extract_single_link.ts
================================================
import { EvalFunction } from "../types/evals.js";
import { z } from "zod";

/**
 * Eval task: loads the geniusee eval site, extracts the link to the
 * 'contact us' page and succeeds when it exactly equals the expected URL.
 *
 * A mismatch is reported via `reason`. A thrown value is returned in a
 * JSON-safe form via `error`. `v3` is closed in every case.
 */
export const extract_single_link: EvalFunction = async ({
  logger,
  debugUrl,
  sessionUrl,
  v3,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/geniusee/",
    );

    const extraction = await v3.extract(
      "extract the link to the 'contact us' page",
      z.object({
        link: z.string().url(),
      }),
    );
    const extractedLink = extraction.link;
    const expectedLink =
      "https://browserbase.github.io/stagehand-eval-sites/sites/geniusee/#contact";

    if (extractedLink === expectedLink) {
      return {
        _success: true,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }
    return {
      _success: false,
      reason: `Extracted link: ${extractedLink} does not match expected link: ${expectedLink}`,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    // Error's name/message/stack are non-enumerable, so a bare JSON round-trip
    // would collapse any thrown Error to `{}`; copy them explicitly.
    const serializableError =
      error instanceof Error
        ? {
            ...error,
            name: error.name,
            message: error.message,
            stack: error.stack,
          }
        : error;

    return {
      _success: false,
      // JSON.stringify yields undefined for undefined/functions/symbols, which
      // JSON.parse would reject; fall back to JSON null.
      error: JSON.parse(JSON.stringify(serializableError) ?? "null"),
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/extract_snowshoeing_destinations.ts
================================================
import { z } from "zod";
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: extract snowshoeing regions and their trails from a Cape Breton
 * Island blog post.
 *
 * After navigating and asking `v3.act` to accept the cookie banner, the page
 * is extracted into `{ snowshoeing_regions: [{ region_name, trails }] }`.
 * The eval passes when exactly 10 regions come back. Any exception is logged
 * (message and stack) and reported as a failure; `v3` is always closed.
 */
export const extract_snowshoeing_destinations: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const [page] = v3.context.pages();
    await page.goto(
      "https://www.cbisland.com/blog/10-snowshoeing-adventures-on-cape-breton-island/",
    );

    await v3.act("accept the cookies");

    // Build the schema bottom-up so each level is named.
    const trailSchema = z.object({
      trail_name: z.string().describe("The name of the trail"),
    });
    const regionSchema = z.object({
      region_name: z.string().describe("The name of the snowshoeing region"),
      trails: z
        .array(trailSchema)
        .describe("The list of trails available in this region."),
    });
    const resultSchema = z.object({
      snowshoeing_regions: z.array(regionSchema),
    });

    const extracted = await v3.extract(
      "Extract all the snowshoeing regions and the names of the trails within each region.",
      resultSchema,
    );

    logger.log({
      message: "Extracted destinations and trails",
      level: 1,
      auxiliary: {
        destinations: {
          value: JSON.stringify(extracted),
          type: "object",
        },
      },
    });

    const regionCount = extracted.snowshoeing_regions.length;

    return {
      _success: regionCount === 10,
      snowshoeing_regions: extracted,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    const errorDetails = {
      error: {
        value: error.message,
        type: "string",
      },
      trace: {
        value: error.stack,
        type: "string",
      },
    } as const;
    logger.error({
      message: "Error in extract_snowshoeing_destinations function",
      level: 0,
      auxiliary: errorDetails,
    });

    return {
      _success: false,
      error: JSON.parse(JSON.stringify(error, null, 2)),
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/extract_staff_members.ts
================================================
import { z } from "zod";
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: extract every staff member (name + job title) from the panamcs test
 * site.
 *
 * Passes only when exactly 50 members are extracted and both the expected
 * first and last entries are present somewhere in the list (position is not
 * checked). Each failed check is logged and returned with its own error
 * string. `v3` is closed on every path.
 */
export const extract_staff_members: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const [page] = v3.context.pages();
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/panamcs/",
    );

    const staffSchema = z.object({
      staff_members: z.array(
        z.object({
          name: z.string(),
          job_title: z.string(),
        }),
      ),
    });
    const { staff_members: extractedStaff } = await v3.extract(
      "extract a list of ALL the staff members on this page, with their name and their job title",
      staffSchema,
    );

    const expectedLength = 50;

    if (extractedStaff.length !== expectedLength) {
      logger.error({
        message: "Incorrect number of items extracted",
        level: 0,
        auxiliary: {
          expected: {
            value: expectedLength.toString(),
            type: "integer",
          },
          actual: {
            value: extractedStaff.length.toString(),
            type: "integer",
          },
        },
      });

      return {
        _success: false,
        error: "Incorrect number of staff members extracted",
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
      };
    }

    // Members that must appear in the extraction, checked in this order,
    // each paired with the message reported when it is missing.
    const requiredMembers = [
      {
        member: {
          name: "Louis Alvarez",
          job_title: "School Resource Officer",
        },
        failure: "Expected first staff member not found in extracted data",
      },
      {
        member: {
          name: "Jessica Zipin",
          job_title: "School Based Therapist",
        },
        failure: "Expected last staff member not found in extracted data",
      },
    ];

    for (const { member, failure } of requiredMembers) {
      const isPresent = extractedStaff.some(
        (candidate) =>
          candidate.name === member.name &&
          candidate.job_title === member.job_title,
      );
      if (isPresent) {
        continue;
      }

      logger.error({
        message: failure,
        level: 0,
        auxiliary: {
          expected: {
            value: JSON.stringify(member),
            type: "object",
          },
          actual: {
            value: JSON.stringify(extractedStaff),
            type: "object",
          },
        },
      });

      return {
        _success: false,
        error: failure,
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
      };
    }

    return {
      _success: true,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } catch (error) {
    return {
      _success: false,
      error: error,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/extract_zillow.ts
================================================
import { z } from "zod";
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: extract every home price and address from the zillow test site.
 *
 * Passes when at least 38 listings are extracted; the contents of the
 * individual listings are not inspected. A shortfall is logged and reported
 * as a failure, as is any thrown exception.
 *
 * The `v3` instance is closed exactly once, in `finally`.
 */
export const extract_zillow: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/zillow/",
    );

    const real_estate_listings = await v3.extract(
      "Extract EACH AND EVERY HOME PRICE AND ADDRESS ON THE PAGE. DO NOT MISS ANY OF THEM.",
      z.object({
        listings: z.array(
          z.object({
            price: z.string().describe("The price of the home"),
            // Named after what it holds; the key is not read below, only
            // the number of listings is checked.
            address: z.string().describe("The address of the home"),
          }),
        ),
      }),
    );

    // No explicit close here: `finally` below closes v3 on every path, so
    // closing in the try body as well would close the session twice.
    const listings = real_estate_listings.listings;
    const expectedLength = 38;

    if (listings.length < expectedLength) {
      logger.error({
        message: "Incorrect number of listings extracted",
        level: 0,
        auxiliary: {
          expected: {
            value: expectedLength.toString(),
            type: "integer",
          },
          actual: {
            value: listings.length.toString(),
            type: "integer",
          },
        },
      });
      return {
        _success: false,
        error: "Incorrect number of listings extracted",
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
      };
    }

    return {
      _success: true,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } catch (error) {
    return {
      _success: false,
      error: error,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/google_flights.ts
================================================
import { EvalFunction } from "../types/evals.js";
import { Action } from "@browserbasehq/stagehand";

/**
 * This eval attempts to click on an element that should not pass the playwright actionability check
 * which happens by default if you call locator.click (more information here:
 * https://playwright.dev/docs/actionability)
 *
 * If this eval passes, it means that we have correctly set {force: true} in performPlaywrightMethod,
 * and the click was successful even though the target element (found by the xpath) did not
 * pass the actionability check.
 *
 * Flow: navigate to the google-flights test site, run a pre-built click
 * `Action` against a fixed xpath through `v3.act`, then compare the page URL
 * with the expected return-flight URL. The URL is read before the function
 * returns, and `v3` is closed exactly once, in `finally`.
 */
export const google_flights: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/google-flights/",
    );

    const observeResult: Action = {
      selector:
        "xpath=/html/body/c-wiz[2]/div/div[2]/c-wiz/div[1]/c-wiz/div[2]/div[2]/div[2]/div/div[2]/div[1]/ul/li[1]/div/div[1]",
      description: "the first departing flight",
      method: "click",
      arguments: [],
    };
    await v3.act(observeResult);

    const expectedUrl =
      "https://browserbase.github.io/stagehand-eval-sites/sites/google-flights/return-flight.html";
    const currentUrl = page.url();

    // No explicit close here: `finally` below closes v3 on every path, so
    // closing in the try body as well would close the session twice.
    if (currentUrl === expectedUrl) {
      return {
        _success: true,
        currentUrl,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }
    return {
      _success: false,
      error: "The current URL does not match expected.",
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } catch (error) {
    return {
      _success: false,
      error: error,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/heal_custom_dropdown.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: a custom (non-`<select>`) dropdown must be expanded by a click.
 *
 * Per the original authors, this checks that the selectOptionFromDropdown
 * method (defined in actHandlerUtils.ts) is not wrongly attempted on a
 * 'dropdown' that is not a <select> element; such a dropdown has to be
 * clicked open before it can be interacted with.
 *
 * The action handed to `v3.act` carries the selector "/html/not-a-dropdown".
 * NOTE(review): that selector looks deliberately invalid, presumably so the
 * action has to be recovered from its description — confirm.
 *
 * Success criterion: after the act, the `pageText` returned by an
 * argument-less `v3.extract()` contains "Canada".
 */
export const heal_custom_dropdown: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const [page] = v3.context.pages();
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/expand-dropdown/",
    );

    const dropdownClick = {
      description: "The 'Select a country' dropdown",
      selector: "/html/not-a-dropdown",
      arguments: [],
      method: "click",
    };
    await v3.act(dropdownClick);

    // Once the dropdown is expanded its options should show up in the page
    // text, so look for one of them.
    const { pageText } = await v3.extract();
    const optionVisible = pageText.includes("Canada");

    if (!optionVisible) {
      return {
        _success: false,
        message: "unable to expand the dropdown",
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }

    return {
      _success: true,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    const failureMessage = `error attempting to select an option from the dropdown: ${error.message}`;
    return {
      _success: false,
      message: failureMessage,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/heal_scroll_50.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: a `scrollTo` action with argument "50%" should leave the viewport
 * centred roughly halfway down the aigrant test page.
 *
 * After the act, the eval waits five seconds, then measures the vertical
 * centre of the viewport (`scrollY + innerHeight / 2`) against half of the
 * document's scroll height. A difference of up to 200px counts as a pass.
 * `v3` is closed on every path.
 */
export const heal_scroll_50: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const [page] = v3.context.pages();
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/aigrant/",
    );

    const scrollAction = {
      description: "the element to scroll on",
      selector: "/html/body/div/div/button",
      arguments: ["50%"],
      method: "scrollTo",
    };
    await v3.act(scrollAction);

    // Fixed pause before measuring the scroll position.
    await new Promise((resolve) => setTimeout(resolve, 5000));

    // Measured inside the page: centre of the viewport and total height.
    const { viewportCentre, documentHeight } = await page.evaluate(() => ({
      viewportCentre: window.scrollY + window.innerHeight / 2,
      documentHeight: document.documentElement.scrollHeight,
    }));

    const pageMidpoint = documentHeight / 2;
    const withinTolerance = Math.abs(viewportCentre - pageMidpoint) <= 200;

    if (!withinTolerance) {
      return {
        _success: false,
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
        message: `Scroll position (${viewportCentre}px) is not halfway down the page (${pageMidpoint}px).`,
      };
    }

    return {
      _success: true,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } catch (error) {
    return {
      _success: false,
      error: error,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/heal_simple_google_search.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: fill the search bar on the google test site and submit.
 *
 * The fill action is given the selector "/html/not-the-search-bar".
 * NOTE(review): that selector looks deliberately wrong, presumably so the
 * action must be recovered from its description — confirm.
 *
 * Passes when, after "press enter", the page URL starts with the expected
 * openai.html results URL. `v3` is closed on every path.
 */
export const heal_simple_google_search: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  const expectedUrl =
    "https://browserbase.github.io/stagehand-eval-sites/sites/google/openai.html";

  try {
    const [page] = v3.context.pages();
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/google/",
    );

    const fillSearchBar = {
      description: "The search bar",
      selector: "/html/not-the-search-bar",
      arguments: ["OpenAI"],
      method: "fill",
    };
    await v3.act(fillSearchBar);
    await v3.act("press enter");

    const currentUrl = page.url();
    const landedOnResults = currentUrl.startsWith(expectedUrl);

    return {
      _success: landedOnResults,
      currentUrl,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      error: error,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/hidden_input_dropdown.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: a hidden-input 'dropdown' must be expanded by a click.
 *
 * Per the original authors, this checks that the selectOptionFromDropdown
 * method (defined in actHandlerUtils.ts) is not wrongly attempted on a
 * hidden input 'dropdown'; such a dropdown has to be clicked open before it
 * can be interacted with.
 *
 * Success criterion: after the act, the `pageText` returned by an
 * argument-less `v3.extract()` contains "Green".
 */
export const hidden_input_dropdown: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const [page] = v3.context.pages();
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/hidden-input-dropdown/",
    );

    await v3.act("click to expand the 'Favourite Colour' dropdown");

    // Once the dropdown is expanded its options should show up in the page
    // text, so look for one of them.
    const { pageText } = await v3.extract();
    const optionVisible = pageText.includes("Green");

    if (!optionVisible) {
      return {
        _success: false,
        message: "unable to expand the dropdown",
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }

    return {
      _success: true,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    const failureMessage = `error attempting click to expand the dropdown: ${error.message}`;
    return {
      _success: false,
      message: failureMessage,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/history.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: `v3.history` records one entry per operation, in call order.
 *
 * Performs a navigation, an act, an extract and an observe, then reads
 * `v3.history` and requires:
 *  - exactly four entries,
 *  - methods "navigate", "act", "extract", "observe" in that order,
 *  - a non-empty string `timestamp` on every entry,
 *  - a defined `result` on every entry.
 *
 * A history that is too short yields a plain `_success: false`; indexing is
 * guarded so it no longer surfaces as a TypeError in the `error` field.
 * `v3` is closed on every path.
 */
export const history: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto("https://docs.stagehand.dev");
    await v3.act("click on the 'Quickstart' tab");
    await v3.extract("Extract the title of the page");
    await v3.observe("Find all links on the page");

    // Named `entries` so the local does not shadow the exported `history`.
    const entries = await v3.history;

    const expectedMethods = ["navigate", "act", "extract", "observe"];

    // Length is checked first; `?.` keeps a short history from throwing.
    const hasExpectedSequence =
      entries.length === expectedMethods.length &&
      expectedMethods.every(
        (method, index) => entries[index]?.method === method,
      );

    const allEntriesHaveTimestamps = entries.every(
      (entry) =>
        typeof entry.timestamp === "string" && entry.timestamp.length > 0,
    );
    const allEntriesHaveResults = entries.every(
      (entry) => entry.result !== undefined,
    );

    const success =
      hasExpectedSequence && allEntriesHaveTimestamps && allEntriesHaveResults;

    return {
      _success: success,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      error: error,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/homedepot.ts
================================================
import { EvalFunction } from "../types/evals.js";
import { z } from "zod";

/**
 * Eval: search homedepot.com for gas grills, open the best seller's product
 * details and extract its primary burner BTU.
 *
 * Passes when the extracted `burnerBTU` is at least 10000. A missing
 * extraction is a failure; any exception is logged (message and stack) and
 * reported as a failure. `v3` is closed on every path.
 */
export const homedepot: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const [page] = v3.context.pages();
    await page.goto("https://www.homedepot.com/");

    // Steps run strictly one after another.
    const steps = [
      "enter 'gas grills' in the search bar",
      "press enter",
      "click on the best selling gas grill",
      "click on the Product Details",
    ];
    for (const step of steps) {
      await v3.act(step);
    }

    const specsSchema = z.object({
      productSpecs: z.object({
        burnerBTU: z.number().describe("Primary Burner BTU exact value"),
      }),
    });
    const productSpecs = await v3.extract(
      "Extract the Primary exact Burner BTU of the product",
      specsSchema,
    );

    logger.log({
      message: `gas grill primary burner BTU`,
      level: 1,
      auxiliary: {
        productSpecs: {
          value: JSON.stringify(productSpecs),
          type: "object",
        },
      },
    });

    if (!productSpecs?.productSpecs) {
      return {
        _success: false,
        productSpecs,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }

    const meetsMinimumBTU = productSpecs.productSpecs.burnerBTU >= 10000;

    return {
      _success: meetsMinimumBTU,
      productSpecs,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    const errorDetails = {
      error: {
        value: error.message,
        type: "string",
      },
      trace: {
        value: error.stack,
        type: "string",
      },
    } as const;
    logger.error({
      message: "error in homedepot function",
      level: 0,
      auxiliary: errorDetails,
    });

    return {
      _success: false,
      error: JSON.parse(JSON.stringify(error, null, 2)),
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/iframe_form_filling.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: fill a contact form that lives inside an iframe.
 *
 * Five `v3.act` calls fill first name, last name, email, preferred contact
 * method and message. The values are then read back through a frame locator
 * and compared case-insensitively with what was typed (names are also
 * trimmed); the contact input at the fixed xpath must be checked.
 * `v3` is closed on every path.
 */
export const iframe_form_filling: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const [page] = v3.context.pages();
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/iframe-form-filling/",
    );

    // Instructions run strictly one after another.
    const instructions = [
      "type 'nunya' into the 'first name' field",
      "type 'business' into the 'last name' field",
      "type 'test@email.com' into the 'email' field",
      "click 'phone' as the preferred contact method",
      "type 'yooooooooooooooo' into the message box",
    ];
    for (const instruction of instructions) {
      await v3.act(instruction);
    }

    const formFrame = page.frameLocator("iframe");
    const readValue = (selector: string): Promise<string> =>
      formFrame.locator(selector).inputValue();

    const firstName = await readValue('input[placeholder="Jane"]');
    const lastName = await readValue('input[placeholder="Doe"]');
    const email = await readValue('input[placeholder="jane@example.com"]');
    const phoneSelected: boolean = await formFrame
      .locator("xpath=/html/body/main/section[1]/form/fieldset/label[2]/input")
      .isChecked();
    const message = await readValue('textarea[placeholder="Say hello…"]');

    const passed: boolean =
      firstName.toLowerCase().trim() === "nunya" &&
      lastName.toLowerCase().trim() === "business" &&
      email.toLowerCase() === "test@email.com" &&
      message.toLowerCase() === "yooooooooooooooo" &&
      phoneSelected;

    return {
      _success: passed,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } catch (error) {
    return {
      _success: false,
      error: error,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/iframe_hn.ts
================================================
import { EvalFunction } from "../types/evals.js";
import { z } from "zod";

/**
 * Eval: extract the title of the first Hacker News story from the iframe-hn
 * test site.
 *
 * Passes when the lower-cased extracted title contains
 * "overengineered anchor links"; otherwise the mismatch is logged and
 * returned as the error. `v3` is closed on every path.
 */
export const iframe_hn: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  const expectedTitleSubstring = "overengineered anchor links";

  try {
    const [page] = v3.context.pages();
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/iframe-hn/",
    );

    const titleSchema = z.object({
      story_title: z.string(),
    });
    const { story_title } = await v3.extract(
      "extract the title of the first hackernews story",
      titleSchema,
    );
    const title = story_title.toLowerCase();

    if (title.includes(expectedTitleSubstring)) {
      return {
        _success: true,
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
      };
    }

    // The same text is both logged and returned as the error.
    const mismatch = `Extracted title: ${title} does not contain expected substring: ${expectedTitleSubstring}`;
    logger.error({
      message: mismatch,
      level: 0,
    });
    return {
      _success: false,
      error: mismatch,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } catch (error) {
    return {
      _success: false,
      error: error,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/iframe_same_proc.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: act on form controls inside an iframe on the iframe-same-proc test
 * site.
 *
 * Types a name and selects a colour via `v3.act`, then reads both values
 * back through a frame locator. Passes when, lower-cased and trimmed, they
 * equal "stagehand" and "green". `v3` is closed on every path.
 */
export const iframe_same_proc: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  const normalise = (value: string): string => value.toLowerCase().trim();

  try {
    const [page] = v3.context.pages();
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/iframe-same-proc/",
    );

    await v3.act("type 'stagehand' into the 'your name' field");

    // The very specific wording is intentional: the point of this eval is
    // iframe traversal, not prompt robustness.
    await v3.act(
      "select 'Green' from the favorite colour dropdown. Ensure the word 'Green' is capitalized. Choose the selectOption method.",
    );

    const formFrame = page.frameLocator("iframe");
    const enteredName: string = await formFrame
      .locator('input[placeholder="Alice"]')
      .inputValue();
    const selectedColour: string = await formFrame
      .locator("select")
      .inputValue();

    const passed: boolean =
      normalise(enteredName) === "stagehand" &&
      normalise(selectedColour) === "green";

    return {
      _success: passed,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } catch (error) {
    return {
      _success: false,
      error: error,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/iframe_scroll.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: "scroll down 50% inside the iframe" should leave the iframe's
 * viewport centred halfway down its document.
 *
 * The second entry of `page.frames()` is taken as the iframe. After a
 * five-second pause, the centre of that frame's viewport
 * (`scrollY + innerHeight / 2`) is compared with half of its scroll height;
 * a difference of at most 1px passes. `v3` is closed on every path.
 */
export const iframe_scroll: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const [page] = v3.context.pages();
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/iframe-same-proc-scroll/",
    );
    await v3.act("scroll down 50% inside the iframe");

    const targetFrame = page.frames()[1];

    // Fixed pause before measuring the scroll position.
    await new Promise((resolve) => setTimeout(resolve, 5000));

    // Measured inside the frame: centre of the viewport and total height.
    const { viewportCentre, documentHeight } = await targetFrame.evaluate(
      () => ({
        viewportCentre: window.scrollY + window.innerHeight / 2,
        documentHeight: document.documentElement.scrollHeight,
      }),
    );

    const frameMidpoint = documentHeight / 2;
    const withinTolerance = Math.abs(viewportCentre - frameMidpoint) <= 1;

    if (!withinTolerance) {
      return {
        _success: false,
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
        message: `Scroll position (${viewportCentre}px) is not halfway down the page (${frameMidpoint}px).`,
      };
    }

    return {
      _success: true,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } catch (error) {
    return {
      _success: false,
      error: error,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/iframes_nested.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: type into a field that sits three iframes deep on the nested-iframes
 * test site.
 *
 * After `v3.act` types 'stagehand' into the username field, the value is
 * read back through the lvl1 → lvl2 → lvl3 frame locators and must equal
 * "stagehand" once lower-cased and trimmed. `v3` is closed on every path.
 */
export const iframes_nested: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const [page] = v3.context.pages();
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/nested-iframes/",
    );

    await v3.act("type 'stagehand' into the 'username' field");

    // Walk down the three nested frames; the form is in the innermost one.
    const levelOne = page.frameLocator("iframe.lvl1");
    const levelTwo = levelOne.frameLocator("iframe.lvl2");
    const formFrame = levelTwo.frameLocator("iframe.lvl3");

    const typedUsername = await formFrame
      .locator('input[name="username"]')
      .inputValue();

    const passed: boolean = typedUsername.toLowerCase().trim() === "stagehand";

    return {
      _success: passed,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } catch (error) {
    return {
      _success: false,
      error: error,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/imdb_movie_details.ts
================================================
import { EvalFunction } from "../types/evals.js";
import { z } from "zod";

/**
 * Eval: open the ratings view of IMDb title tt0111161 and extract the
 * countries with the most ratings.
 *
 * Passes when exactly five countries are extracted and every one of the five
 * expected countries is among them (order is not checked). Each failed check
 * is logged and returned with its own error string. `v3` is closed on every
 * path.
 */
export const imdb_movie_details: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  const expectedCountries = [
    "United States",
    "United Kingdom",
    "Turkey",
    "India",
    "Germany",
  ];

  try {
    const [page] = v3.context.pages();
    await page.goto("https://www.imdb.com/title/tt0111161/", {
      waitUntil: "domcontentloaded",
    });
    await v3.act("click on the movie ratings");

    const countriesSchema = z.object({
      countries: z
        .array(z.string())
        .describe("List of countries with the most ratings"),
    });
    const movieDetails = await v3.extract(
      "Extract the list of countries with the most ratings.",
      countriesSchema,
    );

    // A missing list and a list of the wrong size are handled alike.
    if (movieDetails.countries?.length !== 5) {
      logger.error({
        message: "Failed to extract exactly five countries",
        level: 0,
        auxiliary: {
          expected: {
            value: JSON.stringify(expectedCountries),
            type: "object",
          },
          actual: {
            value: JSON.stringify(movieDetails.countries || []),
            type: "object",
          },
        },
      });

      return {
        _success: false,
        error: "Incorrect number of countries extracted",
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
      };
    }

    const extractedCountries = new Set(movieDetails.countries);
    const missingCountries = expectedCountries.filter(
      (country) => !extractedCountries.has(country),
    );

    if (missingCountries.length === 0) {
      return {
        _success: true,
        countries: movieDetails.countries,
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
      };
    }

    logger.error({
      message: "Extracted countries do not match expected countries",
      level: 0,
      auxiliary: {
        missing: {
          value: JSON.stringify(missingCountries),
          type: "object",
        },
        extracted: {
          value: JSON.stringify(movieDetails.countries),
          type: "object",
        },
      },
    });

    return {
      _success: false,
      error: "Extracted countries do not match expected countries",
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } catch (error) {
    return {
      _success: false,
      error: error,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/instructions.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: the opaque instruction "secret12345" should navigate the Browserbase
 * docs to the "what is browserbase" introduction page.
 *
 * NOTE(review): the meaning of "secret12345" is not defined in this task;
 * presumably it is supplied through instructions configured where the `v3`
 * instance is created — confirm against the eval setup.
 *
 * Passes when, after the act and a wait for `domcontentloaded`, the page URL
 * is exactly the expected introduction URL. `v3` is closed on every path.
 */
export const instructions: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const page = v3.context.pages()[0];

    await page.goto("https://docs.browserbase.com/");

    await v3.act("secret12345");

    await page.waitForLoadState("domcontentloaded");

    // `page.url()` returns the URL directly, so it is compared without an
    // `await`.
    const url = page.url();

    const isCorrectUrl =
      url === "https://docs.browserbase.com/introduction/what-is-browserbase";

    return {
      _success: isCorrectUrl,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      // Round-trip through JSON so the returned error is a plain JSON value.
      error: JSON.parse(JSON.stringify(error, null, 2)),
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/ionwave.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: click "Closed Bids" on the ionwave test site.
 *
 * Passes when the page URL afterwards starts with the expected
 * closed-bids.html URL. `v3` is closed on every path.
 */
export const ionwave: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  const expectedUrl =
    "https://browserbase.github.io/stagehand-eval-sites/sites/ionwave/closed-bids.html";

  try {
    const [page] = v3.context.pages();
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/ionwave/",
    );

    await v3.act('Click on "Closed Bids"');

    const currentUrl = page.url();
    const reachedClosedBids = currentUrl.startsWith(expectedUrl);

    return {
      _success: reachedClosedBids,
      currentUrl,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      error: error,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/ionwave_observe.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: runs `v3.observe()` with no instruction on the ionwave test site and
 * passes when any returned observation resolves to an element whose inner
 * text equals that of the expected link
 * (`#Form1 > div:nth-child(5) > div:nth-child(1) > a`).
 *
 * @returns Result object with `_success`, the `expected` text, the raw
 *   `observations`, debug/session URLs and logs; on a thrown error, `error`.
 */
export const ionwave_observe: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/ionwave/",
    );

    const observations = await v3.observe();

    // Nothing observed: fail without probing the page any further.
    if (observations.length === 0) {
      return {
        _success: false,
        observations,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }

    // Inner text of the first element matching a selector.
    const firstInnerText = (selector: string) =>
      page.locator(selector).first().innerText();

    const expectedLocator = `#Form1 > div:nth-child(5) > div:nth-child(1) > a`;
    const expectedResult = await firstInnerText(expectedLocator);

    let foundMatch = false;
    for (const observation of observations) {
      let observedText: string | undefined;
      try {
        observedText = await firstInnerText(observation.selector);
      } catch (error) {
        // A selector that cannot be read is skipped, not fatal.
        console.warn(
          `Failed to check observation with selector ${observation.selector}:`,
          error.message,
        );
        continue;
      }

      if (observedText === expectedResult) {
        foundMatch = true;
        break;
      }
    }

    return {
      _success: foundMatch,
      expected: expectedResult,
      observations,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      error,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/login.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: on the login test site, asks Stagehand to type the `%nunya%`
 * variable (bound to "business") into the username field, then passes when
 * the username input's value equals "business".
 *
 * @returns Result object with `_success`, `expectedValue`, `actualValue`,
 *   debug/session URLs and logs; on a thrown error, `error` instead.
 */
export const login: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  const expectedValue = "business";
  const usernameXpath = "xpath=/html/body/main/form/div[1]/input";

  try {
    const page = v3.context.pages()[0];
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/login/",
    );

    // The instruction carries a placeholder; the real value is passed
    // separately through `variables`.
    await v3.act("type %nunya% into the username field", {
      variables: { nunya: "business" },
    });

    const usernameInput = page.locator(usernameXpath);
    const actualValue = await usernameInput.inputValue();

    return {
      _success: actualValue === expectedValue,
      expectedValue,
      actualValue,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      error,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/multi_tab.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: on the five-tab test site, issues the "open the other page" click
 * four times and expects the active page to be `page5.html`; then acts on
 * the first page again and expects the active page to be `page2.html` whose
 * extracted text contains "You've made it to page 2".
 *
 * @returns Result object with `_success`, debug/session URLs and logs, plus
 *   a `message` on every failure path.
 */
export const multi_tab: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  const clickInstruction = "click the button to open the other page";

  // Failure payload shared by both active-page URL checks.
  const urlMismatch = () => ({
    _success: false,
    message: "expected URL does not match current URL",
    debugUrl,
    sessionUrl,
    logs: logger.getLogs(),
  });

  try {
    const page = v3.context.pages()[0];
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/five-tab/",
    );

    for (let click = 0; click < 4; click++) {
      await v3.act(clickInstruction);
    }

    const tabAfterClicks = await v3.context.awaitActivePage();
    const urlAfterClicks = await tabAfterClicks.url();
    if (
      urlAfterClicks !==
      "https://browserbase.github.io/stagehand-eval-sites/sites/five-tab/page5.html"
    ) {
      return urlMismatch();
    }

    // try acting on the first page again
    const firstTab = v3.context.pages()[0];
    await v3.act(clickInstruction, { page: firstTab });

    const tabAfterFirstPageClick = await v3.context.awaitActivePage();
    const urlAfterFirstPageClick = await tabAfterFirstPageClick.url();
    if (
      urlAfterFirstPageClick !==
      "https://browserbase.github.io/stagehand-eval-sites/sites/five-tab/page2.html"
    ) {
      return urlMismatch();
    }

    const page2text = await v3.extract({ page: tabAfterFirstPageClick });
    const expectedPage2text = "You've made it to page 2";

    if (!page2text.pageText.includes(expectedPage2text)) {
      return {
        _success: false,
        message: `extracted page text: ${page2text.pageText} does not match expected page text: ${expectedPage2text}`,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }

    return {
      _success: true,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      message: error.message,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/namespace_xpath.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: on the namespaced-xpath test site, asks Stagehand to fill 'nunya'
 * into the 'type here' form and passes when the `#ns-text` input holds
 * exactly "nunya".
 *
 * @returns Result object with `_success`, debug/session URLs and logs; on a
 *   thrown error, `error` as well.
 */
export const namespace_xpath: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const pages = v3.context.pages();
    const page = pages[0];
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/namespaced-xpath/",
    );

    await v3.act("fill 'nunya' into the 'type here' form");

    // Read the field back to confirm the form was actually filled.
    const filledValue = await page.locator("#ns-text").inputValue();

    return {
      _success: filledValue === "nunya",
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      error,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/nested_iframes_2.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: on the nested-iframes-2 test site, asks Stagehand to click the
 * button called 'click me (inner 2)', then reads `#msg` inside the
 * `iframe2.html` -> `inner2.html` frame chain and passes when its trimmed,
 * lower-cased text is "clicked the button in the second inner iframe".
 *
 * @returns Result object with `_success`, logs and debug/session URLs; on a
 *   thrown error, `error` as well.
 */
export const nested_iframes_2: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/nested-iframes-2/",
    );

    await v3.act("click the button called 'click me (inner 2)'");

    // Walk outer frame -> inner frame to reach the status message.
    const outerFrame = page.frameLocator('iframe[src="iframe2.html"]');
    const innerFrame = outerFrame.frameLocator('iframe[src="inner2.html"]');
    const messageText = await innerFrame.locator("#msg").textContent();

    const normalizedMessage = messageText.toLowerCase().trim();
    const passed =
      normalizedMessage === "clicked the button in the second inner iframe";

    return {
      _success: passed,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } catch (error) {
    return {
      _success: false,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
      error,
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/next_chunk.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: opens the apartments.com San Francisco listing, opens the "all
 * filters" modal, asks Stagehand to scroll the modal down one chunk, and
 * passes when the modal container's `scrollTop` grew by roughly its own
 * height (within 20px).
 *
 * If the container (`#advancedFilters > div`) cannot be found, or reports a
 * non-positive height, the eval fails immediately. Otherwise every
 * measurement would be 0 and the "scrolled ~0px, expected ~0px" comparison
 * would pass without any scrolling having happened.
 *
 * @returns Result object with `_success`, logs, debug/session URLs and a
 *   `message`; on a thrown error, `error` instead of `message`.
 */
export const next_chunk: EvalFunction = async ({
  logger,
  debugUrl,
  sessionUrl,
  v3,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto("https://www.apartments.com/san-francisco-ca/", {
      waitUntil: "domcontentloaded",
    });
    await v3.act("click on the all filters button");

    // Measure the container before scrolling; `null` means it was not found.
    const baseline = await page.evaluate(() => {
      const container = document.querySelector(
        "#advancedFilters > div",
      ) as HTMLElement;
      if (!container) {
        console.warn("Could not find #advancedFilters > div.");
        return null;
      }
      return {
        initialScrollTop: container.scrollTop,
        chunkHeight: container.getBoundingClientRect().height,
      };
    });

    if (!baseline || !(baseline.chunkHeight > 0)) {
      return {
        _success: false,
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
        message:
          "Could not measure the filters container (#advancedFilters > div); unable to verify scrolling.",
      };
    }

    const { initialScrollTop, chunkHeight } = baseline;

    await v3.act("scroll down one chunk on the filters modal");

    // Give the scroll time to settle before measuring again.
    await new Promise((resolve) => setTimeout(resolve, 2000));

    const newScrollTop = await page.evaluate(() => {
      const container = document.querySelector(
        "#advancedFilters > div",
      ) as HTMLElement;
      return container?.scrollTop ?? 0;
    });

    const actualDiff = newScrollTop - initialScrollTop;
    const threshold = 20; // allowable difference in px
    const scrolledOneChunk = Math.abs(actualDiff - chunkHeight) <= threshold;

    return {
      _success: scrolledOneChunk,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
      message: scrolledOneChunk
        ? `Successfully scrolled ~one chunk: expected ~${chunkHeight}, got ${actualDiff}`
        : `Scroll difference expected ~${chunkHeight} but only scrolled ${actualDiff}.`,
    };
  } catch (error) {
    return {
      _success: false,
      error: error,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/no_js_click.ts
================================================
import { EvalFunction } from "../types/evals.js";
import { Action } from "@browserbasehq/stagehand";

/**
 * Eval meant to check that the click path (`clickElement` in
 * actHandlerUtils.ts, per the original author's note) still works on a site
 * that blocks programmatic JS click events.
 *
 * It hands `v3.act` a prebuilt click action for `xpath=/html/body/button`
 * and passes when `#success-msg` then reads "click succeeded".
 *
 * @returns Result object with `_success`, debug/session URLs and logs, plus
 *   a `message` on both failure paths.
 */
export const no_js_click: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/no-js-click/",
    );

    // Prebuilt action, shaped like an observe() result.
    const clickAction: Action = {
      method: "click",
      selector: "xpath=/html/body/button",
      description: "the button to click",
      arguments: [],
    };
    await v3.act(clickAction);

    const successText = await page.locator("#success-msg").textContent();
    const clickRegistered = successText?.trim() === "click succeeded";

    if (!clickRegistered) {
      return {
        _success: false,
        message:
          "unable to click element on website that blocks JS click events",
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }

    return {
      _success: true,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      message: `error attempting to click the button: ${error.message}`,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/nonsense_action.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: on homedepot.com, sends a nonsensical instruction to `v3.act` and
 * passes when the returned act result reports `success: false`.
 *
 * @returns Result object with `_success`, debug/session URLs and logs. When
 *   `act` throws instead of returning, `_success` is false and a
 *   serializable `error` is attached.
 */
export const nonsense_action: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto("https://www.homedepot.com/");

    const result = await v3.act("what is the capital of the moon?");

    return {
      _success: !result.success, // We expect this to fail
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    // An Error's name/message/stack are non-enumerable, so a JSON round trip
    // collapses it to `{}` (and throws for `undefined` or circular values).
    // Copy the useful fields explicitly; keep any enumerable extras.
    const serializedError =
      error instanceof Error
        ? {
            ...error,
            name: error.name,
            message: error.message,
            stack: error.stack,
          }
        : error;

    return {
      _success: false,
      error: serializedError,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/observe_amazon_add_to_cart.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: on the Amazon test site, observes then acts on the 'Add to Cart'
 * button, observes then acts on the 'Proceed to checkout' button, and
 * passes when the page URL starts with the sign-in page URL.
 *
 * @returns Result object with `_success`, the observed `currentUrl`,
 *   debug/session URLs and logs; on a thrown error, `error` instead.
 */
export const observe_amazon_add_to_cart: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  // Observe with the given instruction and, if anything came back, act on
  // the first observation only.
  const actOnFirstObservation = async (instruction: string) => {
    const found = await v3.observe(instruction);
    if (found.length > 0) {
      await v3.act(found[0]);
    }
  };

  try {
    const page = v3.context.pages()[0];
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/amazon/",
    );

    await actOnFirstObservation("Find and click the 'Add to Cart' button");
    await actOnFirstObservation(
      "Find and click the 'Proceed to checkout' button",
    );

    const signInUrlPrefix =
      "https://browserbase.github.io/stagehand-eval-sites/sites/amazon/sign-in.html";
    const currentUrl = page.url();

    return {
      _success: currentUrl.startsWith(signInUrlPrefix),
      currentUrl,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      error,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/observe_github.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: on the GitHub test site, asks `v3.observe` for the scrollable
 * element holding the repo file tree and passes when any observation
 * resolves to the same backend node id as one of the accepted candidate
 * selectors.
 *
 * @returns Result object with `_success`, the `matchedLocator` (or null),
 *   the raw `observations`, debug/session URLs and logs; on a thrown error,
 *   `error` instead.
 */
export const observe_github: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/github/",
    );

    const observations = await v3.observe(
      "find the scrollable element that holds the repos file tree.",
    );

    if (observations.length === 0) {
      return {
        _success: false,
        observations,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }

    // Any of these elements counts as a correct answer.
    const possibleLocators = [
      `#repo-content-pjax-container > react-app > div > div > div.prc-PageLayout-PageLayoutRoot-1zlEO > div > div > div.Box-sc-g0xbh4-0.gISSDQ`,
      `#repo-content-pjax-container > react-app > div > div > div.prc-PageLayout-PageLayoutRoot-1zlEO > div > div > div.Box-sc-g0xbh4-0.gISSDQ > div`,
      `#repo-content-pjax-container > react-app > div > div > div.prc-PageLayout-PageLayoutRoot-1zlEO > div > div > div.Box-sc-g0xbh4-0.gISSDQ > div > div.prc-PageLayout-Pane-Vl5LI`,
      `#repo-content-pjax-container > react-app > div > div > div.prc-PageLayout-PageLayoutRoot-1zlEO > div > div > div.Box-sc-g0xbh4-0.gISSDQ > div > div.prc-PageLayout-Pane-Vl5LI > div`,
      `#repos-file-tree > div.Box-sc-g0xbh4-0.ReposFileTreePane-module__Box_5--tQNH_`,
      `#repos-file-tree > div.Box-sc-g0xbh4-0.ReposFileTreePane-module__Box_5--tQNH_ > div`,
      `#repos-file-tree > div.Box-sc-g0xbh4-0.ReposFileTreePane-module__Box_5--tQNH_ > div > div`,
      `#repos-file-tree > div.Box-sc-g0xbh4-0.ReposFileTreePane-module__Box_5--tQNH_ > div > div > div > nav`,
      `#repos-file-tree > div.Box-sc-g0xbh4-0.ReposFileTreePane-module__Box_5--tQNH_ > div > div > div > nav > ul`,
    ];

    // Resolve each candidate selector to its backendNodeId up front.
    const candidateIds = new Map<string, number>();
    for (const candidate of possibleLocators) {
      try {
        candidateIds.set(
          candidate,
          await page.locator(candidate).backendNodeId(),
        );
      } catch {
        // ignore candidates that fail to resolve
      }
    }

    let matchedLocator: string | null = null;

    for (const observation of observations) {
      try {
        const observedId = await page
          .locator(observation.selector)
          .backendNodeId();
        const hit = [...candidateIds].find(([, id]) => id === observedId);
        if (hit) {
          matchedLocator = hit[0];
          break;
        }
      } catch (error) {
        console.warn(
          `Failed to check observation with selector ${observation.selector}:`,
          error?.message ?? String(error),
        );
        continue;
      }
    }

    return {
      _success: matchedLocator !== null,
      matchedLocator,
      observations,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      error,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/observe_iframes1.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: on the iframe-hn test site, asks `v3.observe` for the main header
 * of the page and passes when any observation resolves to the same backend
 * node id as one of the accepted candidates (the wrapper iframe or the
 * `body > header > h1` element).
 *
 * @returns Result object with `_success`, the `matchedLocator` (or null),
 *   the raw `observations`, debug/session URLs and logs; on a thrown error,
 *   `error` instead.
 */
export const observe_iframes1: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/iframe-hn/",
    );

    const observations = await v3.observe("find the main header of the page");

    if (observations.length === 0) {
      return {
        _success: false,
        observations,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }

    const possibleLocators = [
      `body > main > section.iframe-wrapper > iframe`,
      `body > header > h1`,
    ];

    // Resolve each candidate selector to its backendNodeId up front.
    const candidateIds = new Map<string, number>();
    for (const candidate of possibleLocators) {
      try {
        candidateIds.set(
          candidate,
          await page.locator(candidate).backendNodeId(),
        );
      } catch {
        // ignore candidates that fail to resolve
      }
    }

    let matchedLocator: string | null = null;

    for (const observation of observations) {
      try {
        const observedId = await page
          .locator(observation.selector)
          .backendNodeId();
        const hit = [...candidateIds].find(([, id]) => id === observedId);
        if (hit) {
          matchedLocator = hit[0];
          break;
        }
      } catch (error) {
        console.warn(
          `Failed to check observation with selector ${observation.selector}:`,
          error?.message ?? String(error),
        );
        continue;
      }
    }

    return {
      _success: matchedLocator !== null,
      matchedLocator,
      observations,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      error,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/observe_iframes2.ts
================================================
import { EvalFunction } from "../types/evals.js";
import { Action } from "@browserbasehq/stagehand";

/**
 * Eval: loads shopify.com through iframetester.com, waits five seconds,
 * asks `v3.observe` for the main header of the page, and passes when any
 * observation resolves to the same backend node id as one of the accepted
 * candidates (`#iframe-window` or `body > header > h1`).
 *
 * @returns Result object with `_success`, the `matchedLocator` (or null),
 *   the raw `observations`, debug/session URLs and logs. A throwing
 *   `observe` yields a `message`; any other thrown error yields `error`.
 */
export const observe_iframes2: EvalFunction = async ({
  logger,
  debugUrl,
  sessionUrl,
  v3,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto("https://iframetester.com/?url=https://shopify.com");
    // Fixed pause before observing.
    await new Promise((resolve) => setTimeout(resolve, 5000));

    let observations: Action[];
    try {
      observations = await v3.observe("find the main header of the page");
    } catch (err) {
      // An observe failure is reported by message rather than as `error`.
      return {
        _success: false,
        message: err.message,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }

    if (observations.length === 0) {
      return {
        _success: false,
        observations,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }

    const possibleLocators = [`#iframe-window`, `body > header > h1`];

    // Resolve each candidate selector to its backendNodeId up front.
    const candidateIds = new Map<string, number>();
    for (const candidate of possibleLocators) {
      try {
        candidateIds.set(
          candidate,
          await page.locator(candidate).backendNodeId(),
        );
      } catch {
        // ignore candidates that fail to resolve
      }
    }

    let matchedLocator: string | null = null;

    for (const observation of observations) {
      try {
        const observedId = await page
          .locator(observation.selector)
          .backendNodeId();
        const hit = [...candidateIds].find(([, id]) => id === observedId);
        if (hit) {
          matchedLocator = hit[0];
          break;
        }
      } catch (error) {
        console.warn(
          `Failed to check observation with selector ${observation.selector}:`,
          error?.message ?? String(error),
        );
        continue;
      }
    }

    return {
      _success: matchedLocator !== null,
      matchedLocator,
      observations,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      error,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/observe_simple_google_search.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: on the Google test site, observes then acts on "type 'OpenAI' into
 * the search bar", observes then acts on "Press enter", waits three
 * seconds, and passes when the page URL starts with the OpenAI results
 * page URL.
 *
 * @returns Result object with `_success`, the observed `currentUrl`,
 *   debug/session URLs and logs; on a thrown error, `error` instead.
 */
export const observe_simple_google_search: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  // Observe with the given instruction and, if anything came back, act on
  // the first observation only.
  const actOnFirstObservation = async (instruction: string) => {
    const found = await v3.observe(instruction);
    if (found.length > 0) {
      await v3.act(found[0]);
    }
  };

  try {
    const page = v3.context.pages()[0];
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/google/",
    );

    await actOnFirstObservation("Find the search bar and type 'OpenAI'");
    await actOnFirstObservation("Press enter");

    // Fixed pause before reading the URL.
    await new Promise((resolve) => setTimeout(resolve, 3000));

    const resultsUrl =
      "https://browserbase.github.io/stagehand-eval-sites/sites/google/openai.html";
    const currentUrl = page.url();

    return {
      _success: currentUrl.startsWith(resultsUrl),
      currentUrl,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      error,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/observe_taxes.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: on the 1040.com estimator, asks `v3.observe` for all form inputs
 * under the 'Income' section. It fails outright when fewer than 13
 * observations come back; otherwise it passes when any observation's inner
 * text equals that of the `#tpWages` element.
 *
 * @returns Result object with `_success`, the `expected` text, the raw
 *   `observations`, debug/session URLs and logs; on a thrown error, `error`.
 */
export const observe_taxes: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto("https://file.1040.com/estimate/");

    const observations = await v3.observe(
      "Find all the form input elements under the 'Income' section",
    );

    // Zero results and "too few" results produce the same failure payload.
    if (observations.length < 13) {
      return {
        _success: false,
        observations,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }

    // Inner text of the first element matching a selector.
    const firstInnerText = (selector: string) =>
      page.locator(selector).first().innerText();

    const expectedLocator = `#tpWages`;
    const expectedResult = await firstInnerText(expectedLocator);

    let foundMatch = false;
    for (const observation of observations) {
      let observedText: string | undefined;
      try {
        observedText = await firstInnerText(observation.selector);
      } catch (error) {
        // A selector that cannot be read is skipped, not fatal.
        console.warn(
          `Failed to check observation with selector ${observation.selector}:`,
          error.message,
        );
        continue;
      }

      if (observedText === expectedResult) {
        foundMatch = true;
        break;
      }
    }

    return {
      _success: foundMatch,
      expected: expectedResult,
      observations,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      error,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/observe_vantechjournal.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: on the vantechjournal.com archive, asks `v3.observe` for the 'load
 * more' link and passes when the FIRST observation resolves to the same
 * backend node id as either accepted xpath (the link or its inner span).
 *
 * @returns Result object with `_success`, the `expected` locators, the raw
 *   `observations`, debug/session URLs and logs; on a thrown error, `error`
 *   holds the error message (or the stringified thrown value).
 */
export const observe_vantechjournal: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto("https://vantechjournal.com/archive");

    const observations = await v3.observe("Find the 'load more' link");

    if (observations.length === 0) {
      return {
        _success: false,
        observations,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }

    const expectedLocators = [
      "xpath=/html/body/div[2]/div/section/div/div/div[3]/a",
      "xpath=/html/body/div[2]/div/section/div/div/div[3]/a/span",
    ];

    // Resolve the accepted locators one at a time; unlike the candidate
    // lookups in sibling evals, a failure here is not swallowed.
    const expectedIds: number[] = [];
    for (const expectedLocator of expectedLocators) {
      const resolvedId = await page.locator(expectedLocator).backendNodeId();
      if (resolvedId !== undefined && resolvedId !== null) {
        expectedIds.push(resolvedId);
      }
    }

    // Only the top-ranked observation is checked.
    const topObservation = observations[0];
    const observedId = await page
      .locator(topObservation.selector)
      .backendNodeId();

    return {
      _success: expectedIds.includes(observedId),
      expected: expectedLocators,
      observations,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error: unknown) {
    const errorText = error instanceof Error ? error.message : String(error);
    return {
      _success: false,
      error: errorText,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/observe_yc_startup.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: on the YC companies page (loaded with `waitUntil: "networkidle"`),
 * asks `v3.observe` for the container holding the startup links and passes
 * when any observation resolves to the same backend node id as one of the
 * accepted candidate selectors.
 *
 * @returns Result object with `_success`, the `matchedLocator` (or null),
 *   the raw `observations`, debug/session URLs and logs; on a thrown error,
 *   `error` instead.
 */
export const observe_yc_startup: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto("https://www.ycombinator.com/companies", {
      waitUntil: "networkidle",
    });

    const observations = await v3.observe(
      "Click the container element that holds links to each of the startup companies. The companies each have a name, a description, and a link to their website.",
    );

    if (observations.length === 0) {
      return {
        _success: false,
        observations,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }

    const possibleLocators = [
      `div._rightCol_zhfs4_592`,
      `div._section_zhfs4_163._results_zhfs4_343`,
    ];

    // Resolve each candidate selector to its backendNodeId up front.
    const candidateIds = new Map<string, number>();
    for (const candidate of possibleLocators) {
      try {
        candidateIds.set(
          candidate,
          await page.locator(candidate).backendNodeId(),
        );
      } catch {
        // ignore candidates that fail to resolve
      }
    }

    let matchedLocator: string | null = null;

    for (const observation of observations) {
      try {
        const observedId = await page
          .locator(observation.selector)
          .backendNodeId();
        const hit = [...candidateIds].find(([, id]) => id === observedId);
        if (hit) {
          matchedLocator = hit[0];
          break;
        }
      } catch (error) {
        console.warn(
          `Failed to check observation with selector ${observation.selector}:`,
          error?.message ?? String(error),
        );
        continue;
      }
    }

    return {
      _success: matchedLocator !== null,
      matchedLocator,
      observations,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      error,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/oopif_in_csr.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: checks that Stagehand can fill a form inside an OOPIF (out-of-process
 * iframe) hosted inside a CSR (closed-mode shadow root).
 *
 * It asks Stagehand to fill 'nunya' into the first name field and passes
 * when the extracted page text then contains "nunya".
 *
 * @returns Result object with `_success`, a `message`, debug/session URLs
 *   and logs.
 */
export const oopif_in_csr: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const page = v3.context.pages()[0];
    // This must be the CLOSED shadow DOM site. It previously pointed at the
    // open shadow DOM site, which made this eval a byte-for-byte duplicate
    // of `oopif_in_osr`, so the closed-root case was never exercised.
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/oopif-in-closed-shadow-dom/",
    );
    await v3.act("fill 'nunya' into the first name field");

    const extraction = await v3.extract("extract the entire page text");

    const pageText = extraction.extraction;

    if (pageText.includes("nunya")) {
      return {
        _success: true,
        message: `successfully filled the form`,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }
    return {
      _success: false,
      message: `unable to fill the form`,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      message: `error: ${error.message}`,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/oopif_in_osr.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: checks that Stagehand can fill a form inside an OOPIF (out-of-process
 * iframe) hosted inside an OSR (open-mode shadow root).
 *
 * It asks Stagehand to fill 'nunya' into the first name field and passes
 * when the extracted page text then contains "nunya".
 *
 * @returns Result object with `_success`, a `message`, debug/session URLs
 *   and logs.
 */
export const oopif_in_osr: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const pages = v3.context.pages();
    await pages[0].goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/oopif-in-open-shadow-dom/",
    );
    await v3.act("fill 'nunya' into the first name field");

    const { extraction: pageText } = await v3.extract(
      "extract the entire page text",
    );

    const formFilled = pageText.includes("nunya");

    if (!formFilled) {
      return {
        _success: false,
        message: `unable to fill the form`,
        debugUrl,
        sessionUrl,
        logs: logger.getLogs(),
      };
    }

    return {
      _success: true,
      message: `successfully filled the form`,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      message: `error: ${error.message}`,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/os_dropdown.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: check that an entry can be selected from an OS level dropdown.
 *
 * Passes when, after the `act` call, the checked option under `#licenseType`
 * has the exact text "Smog Check Technician".
 */
export const os_dropdown: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  // Appends the session fields to a verdict; logs are captured at call time.
  const withSession = <T extends { _success: boolean }>(verdict: T) => ({
    ...verdict,
    debugUrl,
    sessionUrl,
    logs: logger.getLogs(),
  });

  try {
    const dropdownPage = v3.context.pages()[0];
    await dropdownPage.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/nested-dropdown/",
    );

    await v3.act(
      "choose 'Smog Check Technician' from the 'License Type' dropdown",
    );

    const checkedOption = dropdownPage.locator(
      "#licenseType >> option:checked",
    );
    const selectedOption = await checkedOption.textContent();

    if (selectedOption !== "Smog Check Technician") {
      return withSession({
        _success: false,
        message: "incorrect option selected from the dropdown",
      });
    }
    return withSession({ _success: true });
  } catch (error) {
    return withSession({
      _success: false,
      message: `error attempting to select an option from the dropdown: ${error.message}`,
    });
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/osr_in_oopif.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: click a button inside an OSR (open mode shadow) root that sits inside
 * an OOPIF (out of process iframe).
 *
 * Passes when the text extracted afterwards contains
 * "button successfully clicked".
 */
export const osr_in_oopif: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  // Builds the result object; logs are collected at the moment of the call.
  const outcome = (_success: boolean, message: string) => ({
    _success,
    message,
    debugUrl,
    sessionUrl,
    logs: logger.getLogs(),
  });

  try {
    const targetPage = v3.context.pages()[0];
    await targetPage.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/open-shadow-root-in-oopif/",
    );
    await v3.act("click the button");

    const extracted = await v3.extract("extract the entire page text");
    const text = extracted.extraction;

    if (!text.includes("button successfully clicked")) {
      return outcome(false, `unable to click on the button`);
    }
    return outcome(true, `successfully clicked the button`);
  } catch (error) {
    return outcome(false, `error: ${error.message}`);
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/osr_in_spif.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: click a button inside an OSR (open mode shadow) root that sits inside
 * a SPIF (same process iframe).
 *
 * Passes when the text extracted afterwards contains
 * "button successfully clicked".
 */
export const osr_in_spif: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const framePage = v3.context.pages()[0];
    await framePage.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/open-shadow-root-in-spif/",
    );
    await v3.act("click the button");

    const extracted = await v3.extract("extract the entire page text");
    const clicked = extracted.extraction.includes(
      "button successfully clicked",
    );

    // One return for both verdicts; only the flag and the message differ.
    return {
      _success: clicked,
      message: clicked
        ? `successfully clicked the button`
        : `unable to click on the button`,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    const message = `error: ${error.message}`;
    return {
      _success: false,
      message,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/panamcs.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: `observe` should surface the 'about us' link on the panamcs page.
 *
 * Fails immediately when nothing is observed. Otherwise passes when any
 * observed selector resolves to the same inner text as the reference link
 * `#menu > li:nth-child(1) > a`.
 */
export const panamcs: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  // Appends the session fields to a verdict; logs are captured at call time.
  const withSession = <T extends { _success: boolean }>(verdict: T) => ({
    ...verdict,
    debugUrl,
    sessionUrl,
    logs: logger.getLogs(),
  });

  try {
    const page = v3.context.pages()[0];
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/panamcs/",
    );

    const observations = await v3.observe("click the 'about us' link");
    if (observations.length === 0) {
      return withSession({ _success: false, observations });
    }

    // Inner text of the first element matched by a selector.
    const innerTextOf = (selector: string) =>
      page.locator(selector).first().innerText();

    const expectedLocator = `#menu > li:nth-child(1) > a`;
    const expectedResult = await innerTextOf(expectedLocator);

    // Probe candidates one at a time and stop at the first match. A selector
    // that cannot be read is reported and skipped instead of failing the eval.
    let matched = false;
    for (let idx = 0; idx < observations.length && !matched; idx += 1) {
      const candidate = observations[idx];
      try {
        const candidateText = await innerTextOf(candidate.selector);
        matched = candidateText === expectedResult;
      } catch (error) {
        console.warn(
          `Failed to check observation with selector ${candidate.selector}:`,
          error.message,
        );
      }
    }

    return withSession({
      _success: matched,
      expected: expectedResult,
      observations,
    });
  } catch (error) {
    return withSession({ _success: false, error });
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/peeler_complex.ts
================================================
import { EvalFunction } from "../types/evals.js";
import { z } from "zod";

/**
 * Eval: on chefstoys.com, dismiss the popup, search for "peeler", open the
 * first "OXO" brand peeler and extract its price.
 *
 * Passes when the extracted price is exactly 11.99.
 *
 * On failure the thrown value is logged and returned in `error`. For `Error`
 * instances the `name`, `message` and `stack` are copied explicitly: they are
 * not enumerable, so `JSON.stringify(error)` alone would serialize to "{}" and
 * drop the diagnostic. The Stagehand instance is closed on every exit path.
 */
export const peeler_complex: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto(`https://chefstoys.com/`, { timeoutMs: 60000 });
    await page.waitForLoadState("networkidle");

    await v3.act("find the button to close the popup");
    await v3.act("search for %search_query%", {
      variables: {
        search_query: "peeler",
      },
    });

    await v3.act('click on the first "OXO" brand peeler');

    const { price } = await v3.extract(
      "get the price of the peeler",
      z.object({ price: z.number().nullable() }),
    );

    return {
      _success: price === 11.99,
      price,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    // Plain-data view of the failure. Enumerable extras on the Error (e.g. a
    // custom `code`) are kept via the spread; non-Error throws pass through.
    const details: unknown =
      error instanceof Error
        ? {
            ...error,
            name: error.name,
            message: error.message,
            stack: error.stack,
          }
        : error;

    // JSON.stringify returns undefined for `undefined` and throws on circular
    // structures; fall back to String() so the catch block itself never throws.
    let detailsJson: string;
    try {
      detailsJson = JSON.stringify(details, null, 2) ?? String(details);
    } catch {
      detailsJson = String(details);
    }

    const trace = error instanceof Error ? (error.stack ?? "") : "";

    logger.error({
      message: "error in peeler_complex function",
      level: 0,
      auxiliary: {
        error: {
          value: detailsJson,
          type: "object",
        },
        trace: {
          value: trace,
          type: "string",
        },
      },
    });

    return {
      _success: false,
      error: details,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/prev_chunk.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: "scroll up one chunk" should move the page up by about one viewport.
 *
 * The page is first scrolled to half of `document.body.scrollHeight`. After
 * the `act` call the eval passes when the distance scrolled upwards is within
 * 20px of `window.innerHeight`.
 */
export const prev_chunk: EvalFunction = async ({
  logger,
  debugUrl,
  sessionUrl,
  v3,
}) => {
  // Fixed delay between the steps below.
  const pause = (ms: number) =>
    new Promise((resolve) => setTimeout(resolve, ms));

  try {
    const page = v3.context.pages()[0];
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/aigrant/",
    );
    await pause(2000);

    // Jump to the middle of the document, then report where the page landed
    // and how tall one chunk (the viewport) is.
    const { initialScrollTop, chunkHeight } = await page.evaluate(() => {
      window.scrollTo({
        top: document.body.scrollHeight / 2,
        left: 0,
        behavior: "instant",
      });

      return {
        initialScrollTop: window.scrollY,
        chunkHeight: window.innerHeight,
      };
    });

    await pause(2000);
    await v3.act("scroll up one chunk");
    await pause(5000);

    const finalScrollTop = await page.evaluate(() => window.scrollY);

    const threshold = 20; // px tolerance
    const actualDiff = initialScrollTop - finalScrollTop;
    const scrolledOneChunk = Math.abs(actualDiff - chunkHeight) <= threshold;

    return {
      _success: scrolledOneChunk,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
      message: scrolledOneChunk
        ? `Successfully scrolled ~one chunk UP: expected ~${chunkHeight}, got ${actualDiff}.`
        : `Scroll difference expected ~${chunkHeight} but only scrolled ${actualDiff}.`,
    };
  } catch (error) {
    return {
      _success: false,
      error,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/radio_btn.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: click the 'medium' radio option on the paneer-pizza page.
 *
 * Passes when the `Pizza` radio input with value `Medium` reports itself as
 * checked after the `act` call.
 */
export const radio_btn: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  // Appends the session fields to a verdict; logs are captured at call time.
  const conclude = <T extends { _success: boolean }>(verdict: T) => ({
    ...verdict,
    debugUrl,
    sessionUrl,
    logs: logger.getLogs(),
  });

  try {
    const pizzaPage = v3.context.pages()[0];
    await pizzaPage.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/paneer-pizza/",
    );

    await v3.act("click the 'medium' option");

    // The verdict is simply whether the Medium radio ended up checked.
    const mediumRadio = pizzaPage.locator(
      'input[type="radio"][name="Pizza"][value="Medium"]',
    );
    const radioBtnClicked = await mediumRadio.isChecked();

    return conclude({ _success: radioBtnClicked });
  } catch (error) {
    return conclude({ _success: false, error });
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/rakuten_jp.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: search rakuten.co.jp for '香菜' through two `act` calls (type, then
 * press enter).
 *
 * Passes when the page URL afterwards equals the expected percent-encoded
 * search URL exactly.
 */
export const rakuten_jp: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  // Appends the session fields to a verdict; logs are captured at call time.
  const conclude = <T extends { _success: boolean }>(verdict: T) => ({
    ...verdict,
    debugUrl,
    sessionUrl,
    logs: logger.getLogs(),
  });

  const successUrl =
    "https://search.rakuten.co.jp/search/mall/%E9%A6%99%E8%8F%9C/";

  try {
    const shopPage = v3.context.pages()[0];
    await shopPage.goto("https://www.rakuten.co.jp/");

    await v3.act("type '香菜' into the search bar");
    await v3.act("press enter");

    const landedOn = shopPage.url();
    return conclude({ _success: landedOn === successUrl });
  } catch (error) {
    return conclude({ _success: false, error });
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/sciquest.ts
================================================
import { EvalFunction } from "../types/evals.js";
import { z } from "zod";

/**
 * Eval: open the "Closed" tab on the State of Utah sciquest listing and
 * extract the total number of search results.
 *
 * The extracted string is reduced to its digits and parsed as an integer. The
 * eval passes when that number is within 1000 of 12637.
 */
export const sciquest: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  // Appends the session fields to a verdict; logs are captured at call time.
  const conclude = <T extends { _success: boolean }>(verdict: T) => ({
    ...verdict,
    debugUrl,
    sessionUrl,
    logs: logger.getLogs(),
  });

  try {
    const listingPage = v3.context.pages()[0];
    await listingPage.goto(
      "https://bids.sciquest.com/apps/Router/PublicEvent?tab=PHX_NAV_SourcingAllOpps&CustomerOrg=StateOfUtah",
    );

    await v3.act('Click on the "Closed" tab');

    const { total_results } = await v3.extract(
      "Extract the total number of results that the search produced. Not the number of results displayed on the page.",
      z.object({
        total_results: z.string(),
      }),
    );

    const expectedNumber = 12637;
    // Drop everything except digits (thousands separators, labels, ...).
    const digitsOnly = total_results.replace(/[^\d]/g, "");
    const extractedNumber = Number.parseInt(digitsOnly, 10);

    // NaN (no digits found) compares false here and so counts as out of range.
    const isWithinRange = Math.abs(extractedNumber - expectedNumber) <= 1000;

    if (isWithinRange) {
      return conclude({ _success: true, extractedNumber });
    }

    logger.error({
      message: "Total number of results is not within the expected range",
      level: 0,
      auxiliary: {
        expected: {
          value: `${expectedNumber} ± 1000`,
          type: "string",
        },
        actual: {
          value: extractedNumber.toString(),
          type: "integer",
        },
      },
    });
    return conclude({
      _success: false,
      error: "Total number of results is not within the expected range",
      extractedNumber,
    });
  } catch (error) {
    return conclude({ _success: false, error });
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/scroll_50.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: "Scroll 50% down the page" on the aigrant test site.
 *
 * Five seconds after the `act` call, the vertical centre of the viewport
 * (`scrollY + innerHeight / 2`) must be within 200px of half the document's
 * scroll height.
 */
export const scroll_50: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/aigrant/",
    );
    await v3.act("Scroll 50% down the page");

    // Wait before measuring the scroll position.
    await new Promise((resolve) => setTimeout(resolve, 5000));

    // Measure inside the page: viewport midpoint and total scroll height.
    const scrollInfo = await page.evaluate(() => ({
      scrollTop: window.scrollY + window.innerHeight / 2,
      scrollHeight: document.documentElement.scrollHeight,
    }));

    const halfwayScroll = scrollInfo.scrollHeight / 2;
    const halfwayReached =
      Math.abs(scrollInfo.scrollTop - halfwayScroll) <= 200;

    if (!halfwayReached) {
      return {
        _success: false,
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
        message: `Scroll position (${scrollInfo.scrollTop}px) is not halfway down the page (${halfwayScroll}px).`,
      };
    }

    return {
      _success: true,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } catch (error) {
    return {
      _success: false,
      error,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/scroll_75.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: "Scroll 75% down the page" on the aigrant test site.
 *
 * Five seconds after the `act` call, the point three quarters down the
 * viewport (`scrollY + innerHeight * 0.75`) must be within 200px of 75% of the
 * document's scroll height.
 */
export const scroll_75: EvalFunction = async ({
  logger,
  debugUrl,
  sessionUrl,
  v3,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/aigrant/",
    );
    await v3.act("Scroll 75% down the page");

    // Wait before measuring the scroll position.
    await new Promise((resolve) => setTimeout(resolve, 5000));

    // Measure inside the page: 75% viewport point and total scroll height.
    const scrollInfo = await page.evaluate(() => ({
      scrollTop: window.scrollY + window.innerHeight * 0.75,
      scrollHeight: document.documentElement.scrollHeight,
    }));

    const threeQuartersScroll = scrollInfo.scrollHeight * 0.75;
    const threeQuartersReached =
      Math.abs(scrollInfo.scrollTop - threeQuartersScroll) <= 200;

    if (!threeQuartersReached) {
      return {
        _success: false,
        logs: logger.getLogs(),
        debugUrl,
        sessionUrl,
        message: `Scroll position (${scrollInfo.scrollTop}px) is not three quarters down the page (${threeQuartersScroll}px).`,
      };
    }

    return {
      _success: true,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } catch (error) {
    return {
      _success: false,
      error,
      logs: logger.getLogs(),
      debugUrl,
      sessionUrl,
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/shadow_dom.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: click the button on the shadow-dom test page.
 *
 * Passes when the text extracted afterwards contains
 * "button successfully clicked". Only the exception path carries a `message`.
 */
export const shadow_dom: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  // Appends the session fields to a verdict; logs are captured at call time.
  const conclude = <T extends { _success: boolean }>(verdict: T) => ({
    ...verdict,
    debugUrl,
    sessionUrl,
    logs: logger.getLogs(),
  });

  try {
    const shadowPage = v3.context.pages()[0];
    await shadowPage.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/shadow-dom/",
    );
    await v3.act("click the button");

    const extracted = await v3.extract("extract the page text");
    const clicked = extracted.extraction.includes(
      "button successfully clicked",
    );

    return clicked
      ? conclude({ _success: true })
      : conclude({ _success: false });
  } catch (error) {
    return conclude({ _success: false, message: `error: ${error.message}` });
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/simple_google_search.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: type "OpenAI" into the search bar of the google test page and press
 * enter, as two separate `act` calls.
 *
 * Passes when the resulting URL starts with the expected `openai.html` URL.
 */
export const simple_google_search: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  // Appends the session fields to a verdict; logs are captured at call time.
  const conclude = <T extends { _success: boolean }>(verdict: T) => ({
    ...verdict,
    debugUrl,
    sessionUrl,
    logs: logger.getLogs(),
  });

  const expectedUrl =
    "https://browserbase.github.io/stagehand-eval-sites/sites/google/openai.html";

  try {
    const searchPage = v3.context.pages()[0];
    await searchPage.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/google/",
    );

    await v3.act('type "OpenAI" into the search bar');
    await v3.act("press enter");

    const currentUrl = searchPage.url();
    const landed = currentUrl.startsWith(expectedUrl);

    return conclude({ _success: landed, currentUrl });
  } catch (error) {
    return conclude({ _success: false, error });
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/spif_in_csr.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: click a button inside a SPIF (same process iframe) that is nested in a
 * CSR (closed mode shadow) root.
 *
 * Passes when the text extracted afterwards contains
 * "button successfully clicked".
 */
export const spif_in_csr: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  // Builds the result object; logs are collected at the moment of the call.
  const verdict = (_success: boolean, message: string) => ({
    _success,
    message,
    debugUrl,
    sessionUrl,
    logs: logger.getLogs(),
  });

  try {
    const hostPage = v3.context.pages()[0];
    await hostPage.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/spif-in-closed-shadow-dom/",
    );
    await v3.act("click the button");

    const extracted = await v3.extract("extract the entire page text");
    const wasClicked = extracted.extraction.includes(
      "button successfully clicked",
    );

    return wasClicked
      ? verdict(true, `successfully clicked the button`)
      : verdict(false, `unable to click on the button`);
  } catch (error) {
    return verdict(false, `error: ${error.message}`);
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/spif_in_osr.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: click a button inside a SPIF (same process iframe) that is nested in
 * an OSR (open mode shadow) root.
 *
 * Passes when the text extracted afterwards contains
 * "button successfully clicked".
 */
export const spif_in_osr: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const hostPage = v3.context.pages()[0];
    await hostPage.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/spif-in-open-shadow-dom/",
    );
    await v3.act("click the button");

    const extracted = await v3.extract("extract the entire page text");
    const wasClicked = extracted.extraction.includes(
      "button successfully clicked",
    );

    // One return for both verdicts; only the flag and the message differ.
    return {
      _success: wasClicked,
      message: wasClicked
        ? `successfully clicked the button`
        : `unable to click on the button`,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    const message = `error: ${error.message}`;
    return {
      _success: false,
      message,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/stock_x.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: from a StockX product page, click the "Jordan 3 Retro Crimson" entry
 * in the related products.
 *
 * Passes when the page URL afterwards starts with
 * `https://stockx.com/jordan-3-retro-crimson`.
 *
 * The Stagehand instance is closed exactly once, in `finally`, on every exit
 * path.
 */
export const stock_x: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  try {
    const page = v3.context.pages()[0];
    await page.goto("https://stockx.com/air-jordan-3-retro-black-cement-2024");

    await v3.act("click on Jordan 3 Retro Crimson in the related products");

    const currentUrl = page.url();
    const expectedUrlPrefix = "https://stockx.com/jordan-3-retro-crimson";

    // No explicit close here: `finally` already closes v3, and closing in the
    // try body as well made the success path call v3.close() twice.
    return {
      _success: currentUrl.startsWith(expectedUrlPrefix),
      currentUrl,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } catch (error) {
    return {
      _success: false,
      error: error,
      debugUrl,
      sessionUrl,
      logs: logger.getLogs(),
    };
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/tab_handling.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: click a button that opens another page, then extract text from both
 * pages by passing each page explicitly to `extract`.
 *
 * Passes when the first page's text contains "Welcome!" and the second page's
 * text contains "You’re on the other page".
 */
export const tab_handling: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  // Appends the session fields to a verdict; logs are captured at call time.
  const conclude = <T extends { _success: boolean }>(verdict: T) => ({
    ...verdict,
    debugUrl,
    sessionUrl,
    logs: logger.getLogs(),
  });

  try {
    const startPage = v3.context.pages()[0];
    await startPage.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/new-tab/",
    );

    await v3.act("click the button to open the other page");

    // Re-read the page list after the click so the new page is included.
    const openPages = v3.context.pages();

    // Pull the text of the first page, then of the second page.
    const firstExtraction = await v3.extract({ page: openPages[0] });
    const secondExtraction = await v3.extract({ page: openPages[1] });

    const firstMatches = firstExtraction.pageText.includes("Welcome!");
    const secondMatches = secondExtraction.pageText.includes(
      "You’re on the other page",
    );

    return conclude({ _success: firstMatches && secondMatches });
  } catch (error) {
    return conclude({ _success: false, message: error.message });
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/ted_talk.ts
================================================
import { EvalFunction } from "../types/evals.js";
import { normalizeString } from "../utils.js";
import { z } from "zod";

/**
 * Eval: from a TED talk page, navigate to the 'Culture' topic and extract the
 * video playlists (title and number of talks).
 *
 * Passes when every expected playlist appears among the extracted ones with a
 * matching normalized title and the same `num_talks`. Extra extracted
 * playlists are ignored.
 */
export const ted_talk: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  // Appends logs and the session fields to a verdict, read at call time.
  const finish = <T extends { _success: boolean }>(verdict: T) => ({
    ...verdict,
    logs: logger.getLogs(),
    debugUrl,
    sessionUrl,
  });

  // Playlists the extraction must contain for the eval to pass.
  const expectedPlaylists = [
    {
      title: "Talks that celebrate the boundless creativity of an open mind",
      num_talks: 6,
    },
    {
      title: "Little-known big history",
      num_talks: 15,
    },
    {
      title: "Extraordinary, larger-than-life art",
      num_talks: 10,
    },
    {
      title: "How perfectionism fails us",
      num_talks: 4,
    },
  ];

  try {
    const talkPage = v3.context.pages()[0];
    await talkPage.goto(
      "https://www.ted.com/talks/sir_ken_robinson_do_schools_kill_creativity",
      {
        waitUntil: "domcontentloaded",
      },
    );

    await v3.act("scroll 10% down the page");

    await new Promise((resolve) => setTimeout(resolve, 5000));

    await v3.act(
      "Click the link that takes you to the page about the 'Culture' topic",
    );

    const playlistSchema = z.object({
      playlists: z
        .array(
          z.object({
            title: z.string().describe("Title of the playlist"),
            num_talks: z.number().describe("Number of talks in the playlist"),
          }),
        )
        .describe("List of culture video playlists"),
    });
    const playlists = await v3.extract(
      "Extract the video playlist titles and the number of talks in each playlist. This info is in the Video Playlists about Culture section of the webpage.",
      playlistSchema,
    );

    if (!playlists.playlists || playlists.playlists.length === 0) {
      logger.error({
        message: "Failed to extract playlists on culture",
        level: 0,
      });

      return finish({ _success: false });
    }

    // An expected playlist is missing when no extracted entry agrees with it
    // on both the normalized title and the talk count.
    const missingPlaylists = expectedPlaylists.filter(
      (expected) =>
        !playlists.playlists.some(
          (extracted) =>
            normalizeString(extracted.title) ===
              normalizeString(expected.title) &&
            extracted.num_talks === expected.num_talks,
        ),
    );

    if (missingPlaylists.length > 0) {
      logger.error({
        message: "Extracted playlists do not match expected playlists",
        level: 0,
        auxiliary: {
          missing: {
            value: JSON.stringify(missingPlaylists),
            type: "object",
          },
          extracted: {
            value: JSON.stringify(playlists.playlists),
            type: "object",
          },
        },
      });

      return finish({
        _success: false,
        error: "Extracted playlists do not match expected playlists",
      });
    }

    return finish({ _success: true, playlists: playlists.playlists });
  } catch (error) {
    return finish({ _success: false, error });
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/vanta_h.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: `observe` should return nothing for an element that is not expected
 * to exist (a "buy now" button on vanta.com).
 *
 * Passes when the observation list is empty.
 */
export const vanta_h: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  // Appends the session fields to a verdict; logs are captured at call time.
  const conclude = <T extends { _success: boolean }>(verdict: T) => ({
    ...verdict,
    debugUrl,
    sessionUrl,
    logs: logger.getLogs(),
  });

  try {
    const homePage = v3.context.pages()[0];
    await homePage.goto("https://www.vanta.com/");

    const observations = await v3.observe(
      "click the buy now button if it is available",
    );

    // The button should not exist, so any observation at all is a failure.
    const nothingObserved = observations.length === 0;
    return conclude({ _success: nothingObserved, observations });
  } catch (error) {
    return conclude({ _success: false, error });
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/vantechjournal.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: on vantechjournal.com, click through to the 'recommendations' page.
 *
 * Passes when the page URL afterwards equals
 * `https://vantechjournal.com/recommendations` exactly.
 */
export const vantechjournal: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  // Appends the session fields to a verdict; logs are captured at call time.
  const conclude = <T extends { _success: boolean }>(verdict: T) => ({
    ...verdict,
    debugUrl,
    sessionUrl,
    logs: logger.getLogs(),
  });

  const expectedUrl = "https://vantechjournal.com/recommendations";

  try {
    const journalPage = v3.context.pages()[0];
    await journalPage.goto("https://vantechjournal.com");

    await v3.act("click on page 'recommendations'");

    const currentUrl = journalPage.url();
    const arrived = currentUrl === expectedUrl;

    return conclude({ _success: arrived, currentUrl, expectedUrl });
  } catch (error) {
    return conclude({ _success: false, error });
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/wichita.ts
================================================
import { EvalFunction } from "../types/evals.js";
import { z } from "zod";

/**
 * Eval: on the wichita test page, show closed/awarded/cancelled bids and
 * extract the total number of bids.
 *
 * Passes when the extracted number is exactly 430. A mismatch is logged with
 * the expected and actual values before the failure is returned.
 */
export const wichita: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  // Appends the session fields to a verdict; logs are captured at call time.
  const conclude = <T extends { _success: boolean }>(verdict: T) => ({
    ...verdict,
    debugUrl,
    sessionUrl,
    logs: logger.getLogs(),
  });

  const expectedNumber = 430;

  try {
    const bidsPage = v3.context.pages()[0];
    await bidsPage.goto(
      "https://browserbase.github.io/stagehand-eval-sites/sites/wichita/",
    );

    await v3.act('Click on "Show Closed/Awarded/Cancelled bids"');

    const { total_results } = await v3.extract(
      "Extract the total number of bids that the search produced.",
      z.object({
        total_results: z.number(),
      }),
    );

    if (total_results === expectedNumber) {
      return conclude({ _success: true, total_results });
    }

    logger.error({
      message: "Total number of results does not match expected",
      level: 0,
      auxiliary: {
        expected: {
          value: expectedNumber.toString(),
          type: "integer",
        },
        actual: {
          value: total_results.toString(),
          type: "integer",
        },
      },
    });
    return conclude({
      _success: false,
      error: "Total number of results does not match expected",
      total_results,
    });
  } catch (error) {
    return conclude({ _success: false, error });
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tasks/wikipedia.ts
================================================
import { EvalFunction } from "../types/evals.js";

/**
 * Eval: from the Wikipedia "Baseball" article, click the "hit and run" link.
 *
 * The `act` call is given a 360_000 timeout. Passes when the page URL
 * afterwards equals the "Hit_and_run_(baseball)" article URL exactly.
 */
export const wikipedia: EvalFunction = async ({
  debugUrl,
  sessionUrl,
  v3,
  logger,
}) => {
  // Appends the session fields to a verdict; logs are captured at call time.
  const conclude = <T extends { _success: boolean }>(verdict: T) => ({
    ...verdict,
    debugUrl,
    sessionUrl,
    logs: logger.getLogs(),
  });

  const url = "https://en.wikipedia.org/wiki/Hit_and_run_(baseball)";

  try {
    const articlePage = v3.context.pages()[0];
    await articlePage.goto(`https://en.wikipedia.org/wiki/Baseball`);
    await v3.act('click the "hit and run" link in this article', {
      timeout: 360_000,
    });

    const currentUrl = articlePage.url();

    return conclude({
      _success: currentUrl === url,
      expected: url,
      actual: currentUrl,
    });
  } catch (error) {
    return conclude({ _success: false, error });
  } finally {
    await v3.close();
  }
};


================================================
FILE: packages/evals/tsconfig.json
================================================
{
  "extends": "../../tsconfig.base.json",
  "compilerOptions": {
    "baseUrl": ".",
    "rootDir": ".",
    "outDir": "dist/esm",
    "noEmit": false,
    "paths": {
      "@browserbasehq/stagehand": ["../core/dist/esm/index.d.ts"]
    }
  },
  "include": ["**/*.ts"],
  "exclude": ["node_modules", "dist"]
}


================================================
FILE: packages/evals/types/evals.ts
================================================
import { z } from "zod";
import type { AvailableModel } from "@browserbasehq/stagehand";
import type { LogLine } from "@browserbasehq/stagehand";
import type { AgentInstance } from "@browserbasehq/stagehand";
import type { EvalCase } from "braintrust";
import type { V3 } from "@browserbasehq/stagehand";
import { EvalLogger } from "../logger.js";

/**
 * Per-run objects made available to an eval task. `EvalFunction` receives this
 * shape intersected with `{ input: EvalInput }`.
 */
export type StagehandInitResult = {
  // Optional Stagehand V3 instance; tasks that drive the browser use it directly.
  v3?: V3;
  // Optional agent instance — presumably bound to `v3`; verify against the initializer.
  v3Agent?: AgentInstance;
  // Logger whose collected lines tasks return via `logger.getLogs()`.
  logger: EvalLogger;
  // URLs that tasks pass through unchanged into their result objects.
  debugUrl: string;
  sessionUrl: string;
  // Model the run is configured with.
  modelName: AvailableModel;
  // Required agent instance. NOTE(review): relationship to `v3Agent` is not visible here.
  agent: AgentInstance;
};

/**
 * Signature every eval task implements: it takes the init bundle plus the
 * task's `input`, and resolves to a result object.
 *
 * The result always carries `_success`, the collected `logs`, and the
 * `debugUrl` / `sessionUrl` of the run; `error` is optional and typed as
 * `unknown`, so consumers must narrow it before use.
 */
export type EvalFunction = (
  taskInput: StagehandInitResult & { input: EvalInput },
) => Promise<{
  _success: boolean;
  logs: LogLine[];
  debugUrl: string;
  sessionUrl: string;
  error?: unknown;
}>;

/**
 * Zod enum listing every accepted eval category name. Use it to validate
 * category strings at runtime; `EvalCategory` is the matching static type.
 */
export const EvalCategorySchema = z.enum([
  "observe",
  "act",
  "combination",
  "extract",
  "experimental",
  "targeted_extract",
  "regression",
  "regression_llm_providers",
  "llm_clients",
  "agent",
  "external_agent_benchmarks",
]);

/** Union of the category string literals, inferred from `EvalCategorySchema`. */
export type EvalCategory = z.infer<typeof EvalCategorySchema>;
/** Input describing a single eval run: which task, with which model. */
export interface EvalInput {
  // Name of the eval — presumably the task identifier; verify against the runner.
  name: string;
  modelName: AvailableModel;
  // Optional flag; NOTE(review): looks like "computer-use agent" — confirm with the runner.
  isCUA?: boolean;
  // Optional per-test parameters, used by data-driven tasks
  params?: Record<string, unknown>;
}

/**
 * A single test case, expressed as a braintrust `EvalCase` whose input is an
 * `EvalInput`, whose expected value is `unknown`, and whose metadata describes
 * the model, test name and optional dataset attributes.
 *
 * The `metadata` property below re-declares the same fields as the metadata
 * type argument and additionally allows `task_category`.
 */
export interface Testcase
  extends EvalCase<
    EvalInput,
    unknown,
    {
      model: AvailableModel;
      test: string;
      categories?: string[];
      category?: string;
      dataset?: string;
      task_id?: string;
      website?: string;
      difficulty?: string;
    }
  > {
  input: EvalInput;
  name: string;
  tags: string[];
  metadata: {
    model: AvailableModel;
    test: string;
    categories?: string[];
    category?: string;
    dataset?: string;
    task_id?: string;
    website?: string;
    difficulty?: string;
    // Present only here, not in the EvalCase metadata type argument above.
    task_category?: string;
  };
  expected: unknown;
}

/**
 * One row of an eval summary: the input that was run, the success flag taken
 * from the task output, the eval name and its numeric score.
 */
export interface SummaryResult {
  input: EvalInput;
  output: { _success: boolean };
  name: string;
  score: number;
}

/**
 * Generic argument bundle pairing an eval's input, the output it produced and
 * the expected value, plus optional model/test metadata.
 * Presumably the shape handed to scoring functions — verify against callers.
 */
export interface EvalArgs<TInput, TOutput, TExpected> {
  input: TInput;
  output: TOutput;
  expected: TExpected;
  metadata?: { model: AvailableModel; test: string };
}

/** A named numeric score. */
export interface EvalResult {
  name: string;
  score: number;
}

/**
 * A `LogLine` extended with an optional `parsedAuxiliary` field holding either
 * a string or an object.
 * Presumably a decoded form of `LogLine.auxiliary` — verify against the logger.
 */
export type LogLineEval = LogLine & {
  parsedAuxiliary?: string | object;
};

/** Pairs a model name with a boolean `cua` flag for agent evals. */
export type AgentModelEntry = {
  modelName: string;
  // NOTE(review): presumably "computer-use agent" mode — confirm with the agent runner.
  cua: boolean;
};


================================================
FILE: packages/evals/types/screenshotCollector.ts
================================================
/** Construction options for the screenshot collector. */
export interface ScreenshotCollectorOptions {
  /**
   * Interval in ms for polling-based screenshot capture.
   * If provided, start() will begin polling at this interval.
   * If omitted, use addScreenshot() via the V3 event bus for event-driven collection.
   */
  interval?: number;
  /**
   * Maximum number of screenshots the collector retains.
   * Optional; the fallback used when omitted is chosen by the collector.
   */
  maxScreenshots?: number;
}

// Minimal page-like interface: supports screenshot() and optional event hooks.
// Note that every rest parameter is typed as the empty tuple `[]`, so
// screenshot() and the listeners are declared as taking no arguments.
export type ScreenshotCapablePage = {
  // Resolves to the image as a Buffer or a string.
  screenshot: (...args: []) => Promise<Buffer | string>;
  // Optional subscribe / unsubscribe hooks keyed by event name.
  on?: (event: string, listener: (...args: []) => void) => void;
  off?: (event: string, listener: (...args: []) => void) => void;
};


================================================
FILE: packages/evals/utils/ScreenshotCollector.ts
================================================
import { V3 } from "@browserbasehq/stagehand";
import sharp from "sharp";
import { ScreenshotCollectorOptions } from "../types/screenshotCollector.js";

/**
 * Collects a bounded, de-duplicated history of page screenshots.
 *
 * Two collection modes are supported:
 * - polling: pass `interval` in the options and call start(); a screenshot of
 *   the active page is taken on every tick;
 * - event-driven: omit `interval` and push buffers in with addScreenshot().
 *
 * A new frame is kept only when it differs enough from the most recently kept
 * frame (cheap MSE check first, then a simplified SSIM check). At most
 * `maxScreenshots` frames are retained; the oldest is evicted first.
 */
export class ScreenshotCollector {
  private screenshots: Buffer[] = [];
  private v3: V3;
  private interval?: number;
  private maxScreenshots: number;
  private intervalId?: NodeJS.Timeout;
  // Guards against overlapping capture/compare work.
  private isCapturing: boolean = false;
  // Most recently kept frame; the reference for the similarity checks.
  private lastScreenshot?: Buffer;
  // A frame is kept only if its SSIM against the last kept frame is below this.
  private ssimThreshold: number = 0.75;
  // A frame whose MSE against the last kept frame is below this is skipped.
  private mseThreshold: number = 30;
  private stopped: boolean = false;

  /**
   * @param v3 Stagehand instance whose active page is screenshotted.
   * @param options Optional polling interval and retention limit
   *   (`maxScreenshots` falls back to 10 when omitted or 0).
   */
  constructor(v3: V3, options: ScreenshotCollectorOptions = {}) {
    this.v3 = v3;
    this.interval = options.interval; // undefined means event-driven mode
    this.maxScreenshots = options.maxScreenshots || 10;
  }

  /**
   * Start interval-based screenshot capture.
   * Only activates if interval option was provided in constructor.
   * For event-driven collection, use addScreenshot() directly via the V3 event bus.
   * Calling start() while polling is already active is a no-op.
   */
  start(): void {
    // Only start interval if interval was provided
    if (!this.interval) {
      return;
    }

    if (this.intervalId) {
      return;
    }

    // Set up time-based screenshot capture
    this.intervalId = setInterval(() => {
      this.captureScreenshot("interval").catch((error) => {
        console.error("Interval screenshot failed:", error);
      });
    }, this.interval);

    // Capture initial screenshot without blocking
    this.captureScreenshot("initial").catch((error) => {
      console.error("Failed to capture initial screenshot:", error);
    });
  }

  /**
   * Stop collecting, attempt one last ("final") capture, and hand back the
   * collected frames.
   *
   * @returns A copy of the retained screenshots, oldest first. Internal state
   *   is cleared afterwards so the buffers can be garbage-collected.
   */
  async stop(): Promise<Buffer[]> {
    // Mark as stopped first to prevent any new operations
    this.stopped = true;

    // Clear interval if running
    if (this.intervalId) {
      clearInterval(this.intervalId);
      this.intervalId = undefined;
    }

    // Reset capturing flag to unblock any pending state
    this.isCapturing = false;

    // Try to capture final screenshot, but don't fail if CDP is disconnected
    try {
      await this.captureScreenshot("final");
    } catch {
      // Ignore errors - CDP may be disconnected
    }

    // Return a copy and clear internal state to free memory
    const result = [...this.screenshots];
    this.screenshots = [];
    this.lastScreenshot = undefined;

    return result;
  }

  /**
   * Take a screenshot of the active page and record it if it is worth keeping.
   *
   * @param trigger Why the capture happens. "initial" and "final" frames are
   *   always kept; any other trigger is subject to the similarity filter.
   *   Only "final" is allowed to run after stop().
   */
  private async captureScreenshot(trigger: string): Promise<void> {
    const isFinal = trigger === "final";

    // Don't capture if stopped (unless it's the final capture) or already capturing
    if ((this.stopped && !isFinal) || this.isCapturing) {
      return;
    }
    this.isCapturing = true;

    try {
      const page = await this.v3.context.awaitActivePage();
      const screenshot = await page.screenshot({ fullPage: false });

      // If stopped while awaiting screenshot (and not final), don't process further
      if (this.stopped && !isFinal) {
        return;
      }

      const alwaysKeep = trigger === "initial" || isFinal;
      const keep = alwaysKeep || (await this.differsFromLast(screenshot));

      // stop() may have run while the comparison was in flight; a late
      // non-final frame must not leak into the buffer stop() just cleared.
      if (keep && (isFinal || !this.stopped)) {
        this.record(screenshot);
      }
    } catch (error) {
      console.error(`Failed to capture screenshot (${trigger}):`, error);
    } finally {
      this.isCapturing = false;
    }
  }

  /** @returns A shallow copy of the retained screenshots, oldest first. */
  getScreenshots(): Buffer[] {
    return [...this.screenshots];
  }

  /** @returns How many screenshots are currently retained. */
  getScreenshotCount(): number {
    return this.screenshots.length;
  }

  /**
   * Drop every retained screenshot, including the comparison reference, so the
   * next frame is not filtered against a frame that is no longer held.
   */
  clear(): void {
    this.screenshots = [];
    this.lastScreenshot = undefined;
  }

  /**
   * Manually add a screenshot buffer to the collection.
   * The buffer goes through the same similarity filter as polled frames.
   * The call is ignored after stop() or while another capture/comparison is
   * still running.
   * @param screenshot The screenshot buffer to add
   */
  async addScreenshot(screenshot: Buffer): Promise<void> {
    // Don't add if stopped or already capturing
    if (this.stopped || this.isCapturing) {
      return;
    }
    this.isCapturing = true;

    try {
      const keep = await this.differsFromLast(screenshot);
      // Discard the frame if stop() ran while the comparison was in flight.
      if (keep && !this.stopped) {
        this.record(screenshot);
      }
    } finally {
      this.isCapturing = false;
    }
  }

  /**
   * Decide whether `screenshot` differs enough from the last kept frame.
   * Returns true when there is no previous frame, or when comparison fails.
   */
  private async differsFromLast(screenshot: Buffer): Promise<boolean> {
    const previous = this.lastScreenshot;
    if (!previous) {
      return true;
    }

    try {
      // First do a quick MSE check
      const mse = await this.calculateMSE(previous, screenshot);
      if (mse < this.mseThreshold) {
        // Very similar, skip
        return false;
      }

      // Significant difference detected, verify with SSIM
      const ssim = await this.calculateSSIM(previous, screenshot);
      return ssim < this.ssimThreshold;
    } catch (error) {
      // If comparison fails, keep the screenshot
      console.error("Image comparison failed:", error);
      return true;
    }
  }

  /** Append a frame, make it the comparison reference, and evict the oldest frame if over the limit. */
  private record(screenshot: Buffer): void {
    this.screenshots.push(screenshot);
    this.lastScreenshot = screenshot;

    if (this.screenshots.length > this.maxScreenshots) {
      this.screenshots.shift();
    }
  }

  /**
   * Mean squared error between two images after both are resized to 400x300.
   * @returns The MSE over the raw bytes, or Number.MAX_SAFE_INTEGER when the
   *   decoded buffers differ in length or decoding fails (treated as "different").
   */
  private async calculateMSE(img1: Buffer, img2: Buffer): Promise<number> {
    try {
      // Resize images for faster comparison
      const size = { width: 400, height: 300 };
      const data1 = await sharp(img1).resize(size).raw().toBuffer();
      const data2 = await sharp(img2).resize(size).raw().toBuffer();

      if (data1.length !== data2.length) return Number.MAX_SAFE_INTEGER;

      let sum = 0;
      for (let i = 0; i < data1.length; i++) {
        const diff = data1[i] - data2[i];
        sum += diff * diff;
      }

      return sum / data1.length;
    } catch {
      // If sharp is not available, assume images are different
      return Number.MAX_SAFE_INTEGER;
    }
  }

  /**
   * Simplified structural similarity between two images: both are resized to
   * 400x300 and converted to grayscale, then one SSIM value is computed from
   * statistics over the whole image (no sliding window).
   * @returns The similarity score, or 0 when the decoded buffers differ in
   *   length or decoding fails (treated as "different").
   */
  private async calculateSSIM(img1: Buffer, img2: Buffer): Promise<number> {
    try {
      // Resize and convert to grayscale for SSIM calculation
      const size = { width: 400, height: 300 };
      const gray1 = await sharp(img1).resize(size).grayscale().raw().toBuffer();
      const gray2 = await sharp(img2).resize(size).grayscale().raw().toBuffer();

      if (gray1.length !== gray2.length) return 0;

      // Simplified SSIM calculation
      // NOTE(review): these stabilizers are not scaled by the pixel range —
      // confirm this is intended for byte-valued samples.
      const c1 = 0.01 * 0.01;
      const c2 = 0.03 * 0.03;

      let sum1 = 0,
        sum2 = 0,
        sum1_sq = 0,
        sum2_sq = 0,
        sum12 = 0;
      const N = gray1.length;

      for (let i = 0; i < N; i++) {
        sum1 += gray1[i];
        sum2 += gray2[i];
        sum1_sq += gray1[i] * gray1[i];
        sum2_sq += gray2[i] * gray2[i];
        sum12 += gray1[i] * gray2[i];
      }

      const mean1 = sum1 / N;
      const mean2 = sum2 / N;
      const var1 = sum1_sq / N - mean1 * mean1;
      const var2 = sum2_sq / N - mean2 * mean2;
      const cov12 = sum12 / N - mean1 * mean2;

      const numerator = (2 * mean1 * mean2 + c1) * (2 * cov12 + c2);
      const denominator =
        (mean1 * mean1 + mean2 * mean2 + c1) * (var1 + var2 + c2);

      return numerator / denominator;
    } catch {
      // If sharp is not available, assume images are different
      return 0;
    }
  }
}


================================================
FILE: packages/evals/utils/imageResize.ts
================================================
import sharp from "sharp";

/**
 * Scale an image by `scaleFactor` and re-encode it as a palette PNG.
 *
 * @param img Encoded source image.
 * @param scaleFactor Multiplier applied to the source width and height.
 * @returns The resized PNG, or the original buffer untouched when the source
 *   width or height is missing from the metadata (or zero).
 */
export async function imageResize(
  img: Buffer,
  scaleFactor: number,
): Promise<Buffer> {
  const { width: sourceWidth, height: sourceHeight } =
    await sharp(img).metadata();

  // Without both dimensions there is nothing to scale against.
  if (!sourceWidth || !sourceHeight) {
    return img;
  }

  const targetWidth = Math.round(sourceWidth * scaleFactor);
  const targetHeight = Math.round(sourceHeight * scaleFactor);

  const resized = sharp(img).resize(targetWidth, targetHeight, {
    fit: "inside",
    kernel: sharp.kernel.lanczos3,
  });
  const encoded = resized.png({
    compressionLevel: 9,
    adaptiveFiltering: true,
    palette: true,
  });

  return await encoded.toBuffer();
}


================================================
FILE: packages/evals/utils.ts
================================================
/**
 * This file provides utility functions and classes to assist with evaluation tasks.
 *
 * Key functionalities:
 * - String normalization and fuzzy comparison utility functions to compare output strings
 *   against expected results in a flexible and robust way.
 * - Generation of unique experiment names based on the current timestamp, environment,
 *   and eval name or category.
 */
import fs from "fs";
import { LogLine } from "@browserbasehq/stagehand";
import stringComparison from "string-comparison";
const { jaroWinkler } = stringComparison;

/**
 * normalizeString:
 * Prepares a string for comparison by:
 * - Converting to lowercase
 * - Removing the punctuation characters ; / # ! $ % ^ & * : { } = - _ ` ~ ( )
 *   (periods, commas, quotes and other symbols are left in place)
 * - Collapsing every run of whitespace to a single space
 * - Normalizing spacing around commas to ", "
 * - Trimming leading and trailing whitespace
 *
 * Punctuation is stripped before whitespace is collapsed, so removing a
 * character that sat between two spaces (e.g. "a - b") cannot leave a double
 * space behind.
 *
 * This helps create a stable string representation to compare against expected outputs,
 * even if the actual output contains minor formatting differences.
 */
export function normalizeString(str: string): string {
  return str
    .toLowerCase()
    .replace(/[;/#!$%^&*:{}=\-_`~()]/g, "")
    .replace(/\s+/g, " ")
    .replace(/\s*,\s*/g, ", ")
    .trim();
}

/**
 * compareStrings:
 * Fuzzy comparison of an actual string against an expected one.
 *
 * Both inputs are passed through normalizeString() and then scored with the
 * Jaro-Winkler similarity metric, so small formatting or spelling differences
 * do not fail the comparison outright.
 *
 * @param actual The output string being checked.
 * @param expected The string it should match.
 * @param similarityThreshold Minimum similarity counted as a match. Default is 0.85.
 * @returns `similarity` — the computed score — and `meetsThreshold`, which is
 *   true when the score is greater than or equal to the threshold.
 */
export function compareStrings(
  actual: string,
  expected: string,
  similarityThreshold: number = 0.85,
): { similarity: number; meetsThreshold: boolean } {
  const normalizedActual = normalizeString(actual);
  const normalizedExpected = normalizeString(expected);

  const similarity = jaroWinkler.similarity(
    normalizedActual,
    normalizedExpected,
  );
  const meetsThreshold = similarity >= similarityThreshold;

  return { similarity, meetsThreshold };
}

/**
 * generateTimestamp:
 * Builds a compact "YYYYMMDDHHMMSS" timestamp from the current time.
 * The value is derived from Date#toISOString(), so it is expressed in UTC.
 * Used to make experiment names unique per run.
 */
export function generateTimestamp(): string {
  // e.g. "2024-01-02T03:04:05.678Z"
  const isoNow = new Date().toISOString();
  // Strip the separators, leaving "20240102030405.678"
  const compact = isoNow.replace(/[-:TZ]/g, "");
  // Keep the 14 date/time digits and drop the fractional seconds.
  return compact.slice(0, 14);
}

/**
 * generateExperimentName:
 * Builds an experiment name of the form "<label>_<environment>_<timestamp>".
 *
 * The label is `evalName` when it is non-empty, otherwise `category` when it
 * is non-empty, otherwise the literal "all". The environment is lower-cased
 * and the timestamp comes from generateTimestamp().
 * This is used to label the output files and directories.
 */
export function generateExperimentName({
  evalName,
  category,
  environment,
}: {
  evalName?: string;
  category?: string;
  environment: string;
}): string {
  const stamp = generateTimestamp();
  const label = evalName || category || "all";
  return `${label}_${environment.toLowerCase()}_${stamp}`;
}

/**
 * Render a log line as a single string for console or file output.
 *
 * Format: "<timestamp>::[stagehand:<category>] <message>" followed by either
 * - the error value (and the trace value, if any), each on its own indented
 *   line, when `auxiliary.error` is set; or
 * - a space and the JSON-encoded `auxiliary` object (empty when absent).
 *
 * A missing timestamp is replaced with the current time in ISO format.
 *
 * @returns The formatted line, or "error logging line" if formatting throws.
 */
export function logLineToString(logLine: LogLine): string {
  try {
    const { auxiliary, category, message } = logLine;
    const stamp = logLine.timestamp || new Date().toISOString();
    const header = `${stamp}::[stagehand:${category}] ${message}`;

    if (!auxiliary?.error) {
      const auxiliaryJson = auxiliary ? JSON.stringify(auxiliary) : "";
      return `${header} ${auxiliaryJson}`;
    }

    const errorText = auxiliary.error.value ?? "";
    const traceText = auxiliary.trace?.value ?? "";
    const traceBlock = traceText ? `\n ${traceText}` : "";
    return `${header}\n ${errorText}${traceBlock}`;
  } catch (error) {
    console.error(`Error logging line:`, error);
    return "error logging line";
  }
}

/**
 * Template tag that strips the indentation from a multi-line template literal.
 *
 * - Spaces and tabs following each newline are removed.
 * - A single newline at the very start of the template is dropped, so the
 *   text may begin on the line after the opening backtick.
 * - Trailing whitespace is trimmed from the result.
 *
 * The raw template strings are used, so escape sequences such as `\n` written
 * in the template are kept as literal characters rather than interpreted.
 *
 * @param strings Template string parts supplied by the tagged-template call.
 * @param values Substitution values, concatenated in as-is.
 * @returns The de-indented text.
 */
export function dedent(
  strings: TemplateStringsArray,
  ...values: unknown[]
): string {
  // Interleave raw strings with substitution values
  const raw = strings.raw;
  let result = "";

  for (let i = 0; i < raw.length; i++) {
    // replace newline + any mix of spaces/tabs with "\n"
    let chunk = raw[i].replace(/\n[ \t]+/g, "\n");
    // Only the template's opening newline is dropped. A chunk that follows a
    // substitution keeps its leading newline; otherwise the line after a
    // value that ends a line would be glued onto it.
    if (i === 0) chunk = chunk.replace(/^\n/, "");
    result += chunk;
    if (i < values.length) result += values[i];
  }

  // trim trailing whitespace (including trailing blank lines)
  return result.trimEnd();
}

// Dataset helpers shared by suites

/**
 * Draw up to `k` distinct elements from `arr` uniformly at random, without
 * replacement. The input array is never mutated.
 *
 * @param arr Source items.
 * @param k Number of items wanted. A fractional value is truncated.
 * @returns A new array:
 *   - a copy of `arr` in original order when `k >= arr.length`;
 *   - an empty array when `k` is zero, negative or NaN;
 *   - otherwise `k` randomly chosen items in random order.
 */
export function sampleUniform<T>(arr: T[], k: number): T[] {
  const n = arr.length;
  if (k >= n) return arr.slice();
  // Covers 0, negatives and NaN; a negative k must not reach slice(0, k),
  // which would return all but the last |k| items.
  if (!(k > 0)) return [];

  const count = Math.floor(k);
  const pool = arr.slice();

  // Partial Fisher-Yates shuffle: only the first `count` positions need to be
  // settled, each by swapping in a uniformly chosen not-yet-settled element.
  for (let i = 0; i < count; i++) {
    const j = i + Math.floor(Math.random() * (n - i));
    [pool[i], pool[j]] = [pool[j], pool[i]];
  }

  return pool.slice(0, count);
}

/**
 * Read a JSONL file and return its non-blank lines, unparsed.
 *
 * The file is read synchronously as UTF-8 and split on LF or CRLF; lines that
 * are empty or whitespace-only are dropped.
 *
 * @param filePath Path of the file to read.
 * @returns The remaining lines in file order, or an empty array (after
 *   logging a warning) when the file cannot be read.
 */
export function readJsonlFile(filePath: string): string[] {
  try {
    const text = fs.readFileSync(filePath, "utf-8");
    const isNotBlank = (line: string): boolean => line.trim().length > 0;
    return text.split(/\r?\n/).filter(isNotBlank);
  } catch (e) {
    const reason = e instanceof Error ? e.message : String(e);
    console.warn(`Could not read file at ${filePath}. Error: ${reason}`);
    return [];
  }
}

/**
 * Parse JSONL lines and keep only the rows accepted by `validator`.
 *
 * @param lines Raw lines, one JSON document each.
 * @param validator Type guard deciding whether a parsed value is a valid row.
 * @returns The accepted rows in input order. Lines that fail to parse, are
 *   rejected by the validator, or make the validator throw are skipped.
 */
export function parseJsonlRows<T>(
  lines: string[],
  validator: (parsed: unknown) => parsed is T,
): T[] {
  return lines.reduce<T[]>((accepted, rawLine) => {
    try {
      const value: unknown = JSON.parse(rawLine);
      if (validator(value)) {
        accepted.push(value);
      }
    } catch {
      // skip invalid lines
    }
    return accepted;
  }, []);
}

/**
 * Reduces a candidate list either by random sampling or by taking a prefix.
 *
 * - When `sampleCount` is a positive number, the result comes from
 *   `sampleUniform(candidates, sampleCount)`.
 * - Otherwise the leading candidates are copied in order until the result
 *   holds at least `maxCases` items. The limit is checked after each item is
 *   added, so a non-empty input always yields at least one item, even when
 *   `maxCases` is 0 or negative.
 *
 * @param candidates - Items to choose from; not mutated by the prefix path.
 * @param sampleCount - Optional number of items to sample at random.
 * @param maxCases - Prefix length used when no sampling is requested.
 * @returns A new array with the selected items.
 */
export function applySampling<T>(
  candidates: T[],
  sampleCount?: number,
  maxCases: number = 25,
): T[] {
  if (sampleCount !== undefined && sampleCount > 0) {
    return sampleUniform(candidates, sampleCount);
  }

  const head: T[] = [];
  for (const item of candidates) {
    // push() returns the new length, so this stops right after the limit is hit
    if (head.push(item) >= maxCases) break;
  }
  return head;
}


================================================
FILE: packages/server-v3/CHANGELOG.md
================================================
# @browserbasehq/stagehand-server-v3

## 3.6.1

### Patch Changes

- [#1759](https://github.com/browserbase/stagehand/pull/1759) [`505e8c6`](https://github.com/browserbase/stagehand/commit/505e8c6736f3706328dbc8df670c49a018058388) Thanks [@shrey150](https://github.com/shrey150)! - Add bedrock to the provider enum in model configuration schemas and regenerate OpenAPI spec.

- Updated dependencies [[`505e8c6`](https://github.com/browserbase/stagehand/commit/505e8c6736f3706328dbc8df670c49a018058388), [`2f43ffa`](https://github.com/browserbase/stagehand/commit/2f43ffac11778152d17e4c44405770cc32c3ec8c), [`63ee247`](https://github.com/browserbase/stagehand/commit/63ee247ac6bf2992046d4f6b2759f46b15643e36), [`7dc35f5`](https://github.com/browserbase/stagehand/commit/7dc35f5e25689e6518d68b25ef71536d2781c8aa), [`335cf47`](https://github.com/browserbase/stagehand/commit/335cf4730e73bce33e92331d04bda4b0fd42685d), [`6ba0a1d`](https://github.com/browserbase/stagehand/commit/6ba0a1db7fc2d5d5a2f8927b1417d8f1d15eda10), [`4ff3bb8`](https://github.com/browserbase/stagehand/commit/4ff3bb831a6ef6e2d57148e7afb68ea8d23e395d), [`c27054b`](https://github.com/browserbase/stagehand/commit/c27054bbd0508431ade91d655f89efc87bbf5867), [`2abf5b9`](https://github.com/browserbase/stagehand/commit/2abf5b90f1e2bb1442509ef3a686b6128c9cdcf6), [`7817fcc`](https://github.com/browserbase/stagehand/commit/7817fcc315eee4455ce04567cf56c9ec801caf0b), [`7390508`](https://github.com/browserbase/stagehand/commit/73905088c5ed5923d276da9cce2efd0a0a3a46eb), [`611f43a`](https://github.com/browserbase/stagehand/commit/611f43ac8d4c580216d55d2b217c14a9a9c11013), [`521a10e`](https://github.com/browserbase/stagehand/commit/521a10e3698fc5631e219947bc90dad0f8bddaa8), [`2402a3c`](https://github.com/browserbase/stagehand/commit/2402a3c4d50270391b3e6440f4385cdcf5e1eb64)]:
  - @browserbasehq/stagehand@3.2.0

## 3.6.0

### Minor Changes

- [#1611](https://github.com/browserbase/stagehand/pull/1611) [`8a3c066`](https://github.com/browserbase/stagehand/commit/8a3c06600a9ba98485db7e9ed5c3cc43ea180334) Thanks [@monadoid](https://github.com/monadoid)! - Using `mode` enum instead of old `cua` boolean in openapi spec

### Patch Changes

- [#1604](https://github.com/browserbase/stagehand/pull/1604) [`4753078`](https://github.com/browserbase/stagehand/commit/4753078cc9d37cbdb8d1a63dfdb53ccc4b4c2bd2) Thanks [@miguelg719](https://github.com/miguelg719)! - Enable bedrock

- [#1636](https://github.com/browserbase/stagehand/pull/1636) [`ea33052`](https://github.com/browserbase/stagehand/commit/ea330520a325583b71b87d85beb740df4bdb9b2d) Thanks [@miguelg719](https://github.com/miguelg719)! - Include executionModel on the AgentConfigSchema

- [#1602](https://github.com/browserbase/stagehand/pull/1602) [`22a0502`](https://github.com/browserbase/stagehand/commit/22a0502e8b042bef0cfafa32901984a8be9529d8) Thanks [@miguelg719](https://github.com/miguelg719)! - Include vertex as a supported provider

- Updated dependencies [[`7584f3e`](https://github.com/browserbase/stagehand/commit/7584f3e92e60a557d2b3e0e0d2a2af04c3527523), [`1e1c9c1`](https://github.com/browserbase/stagehand/commit/1e1c9c15773e49d5c3cd36021dbc1d23495c1bce), [`6bef890`](https://github.com/browserbase/stagehand/commit/6bef89090ebd231e77d8092b2c32a0f06303d5a9), [`ffd4b33`](https://github.com/browserbase/stagehand/commit/ffd4b335a873d0f4dcd76ea22d44f47919bf8e49), [`677bff5`](https://github.com/browserbase/stagehand/commit/677bff5834c879a2d95f7dbff918b8e1510516b3), [`65ff464`](https://github.com/browserbase/stagehand/commit/65ff464bc13388eb109eba0a2cf533c1cc202854), [`101bcf2`](https://github.com/browserbase/stagehand/commit/101bcf2da8b527fd6ace6aa291ada5d0f2d90344), [`0a94301`](https://github.com/browserbase/stagehand/commit/0a94301caa991d1aa4cdade6e28a065b1aefb3e2), [`b27c04d`](https://github.com/browserbase/stagehand/commit/b27c04d278c290364347acd0c354a878ea9b7c2d), [`afbd08b`](https://github.com/browserbase/stagehand/commit/afbd08bb6367a9c9f65f67e453667987e4659918), [`e3db9aa`](https://github.com/browserbase/stagehand/commit/e3db9aa863f44270792215801fe6e3a02a1321aa), [`0e8d569`](https://github.com/browserbase/stagehand/commit/0e8d5695f662040f7384e64f46301152802e3c62), [`ff0f979`](https://github.com/browserbase/stagehand/commit/ff0f9795f3b2c1cf4f2610a80ebcb3341a24f987), [`2d89d2b`](https://github.com/browserbase/stagehand/commit/2d89d2b35ce812431956b28e0c8b52d32ddc7a27), [`aac9a19`](https://github.com/browserbase/stagehand/commit/aac9a19bdfbe62e4508631337ab0bfbcf8ae62b2), [`06de50f`](https://github.com/browserbase/stagehand/commit/06de50ff377fd31f1b0fcf79adb996d04562d2c0), [`aa4d981`](https://github.com/browserbase/stagehand/commit/aa4d981e440bdd0e3d3f42ccc310d5958aa25cc6), [`18b1e3b`](https://github.com/browserbase/stagehand/commit/18b1e3bd2b16b721845d52fcf1a45c6158e2403f), [`957d82b`](https://github.com/browserbase/stagehand/commit/957d82b9845b4413b123539e81a2e4a490e74a8a), 
[`b65756e`](https://github.com/browserbase/stagehand/commit/b65756e9e85643055446aa4a51956f7d6627c89f), [`22e371a`](https://github.com/browserbase/stagehand/commit/22e371ae4c25deb6350328fe02832bf2b2197b94), [`d29b91f`](https://github.com/browserbase/stagehand/commit/d29b91fa506636ca36f724fcf106320de54ec3f3), [`7b4f817`](https://github.com/browserbase/stagehand/commit/7b4f817cafb9829ac81c4b5890c318c7f9521fe4), [`176d420`](https://github.com/browserbase/stagehand/commit/176d42002cc0a2c7d13b4c0ffbbd56b70fdc49e8), [`3f9ca4d`](https://github.com/browserbase/stagehand/commit/3f9ca4d9acc109101357378d29cf969168991608), [`8a3c066`](https://github.com/browserbase/stagehand/commit/8a3c06600a9ba98485db7e9ed5c3cc43ea180334), [`49ead1e`](https://github.com/browserbase/stagehand/commit/49ead1e1e8678a8da0f87ad2042491dacc6b01d7), [`3673369`](https://github.com/browserbase/stagehand/commit/36733691f90c15386cf2a7b47d04ef429b7195ae), [`c465e87`](https://github.com/browserbase/stagehand/commit/c465e87ab41942435132c76338518fb3fa8e7896), [`ae533e4`](https://github.com/browserbase/stagehand/commit/ae533e40195181b53833f8055b1259fb360a927b), [`ea33052`](https://github.com/browserbase/stagehand/commit/ea330520a325583b71b87d85beb740df4bdb9b2d), [`5764ede`](https://github.com/browserbase/stagehand/commit/5764edee7aab00ef1aafafb68fc56eb26c0a70b2), [`f09b184`](https://github.com/browserbase/stagehand/commit/f09b184cc5e774736280ae8c94ba3f4f13adda80), [`a7d29de`](https://github.com/browserbase/stagehand/commit/a7d29decee0f7d12e2437267b9eef1795d3b4e3a), [`d334399`](https://github.com/browserbase/stagehand/commit/d3343990041bf9cd5613569840afb0c17131e33c), [`44416da`](https://github.com/browserbase/stagehand/commit/44416da7ff33301bb32d3811e6c3be8782a7d168), [`bdd8b4e`](https://github.com/browserbase/stagehand/commit/bdd8b4ee3c697a02728375510ab7fae764990576)]:
  - @browserbasehq/stagehand@3.1.0

## 3.5.0

### Minor Changes

- [#1578](https://github.com/browserbase/stagehand/pull/1578) [`a5074bd`](https://github.com/browserbase/stagehand/commit/a5074bdda0811140ba7847065c26ac72175cef98) Thanks [@monadoid](https://github.com/monadoid)! - /end endpoint no longer takes an empty object - instead, no request body is required.

### Patch Changes

- Updated dependencies [[`40ce5cc`](https://github.com/browserbase/stagehand/commit/40ce5cc83ec758f4e8c37132a7f4ac8eeea7ca34), [`5506f41`](https://github.com/browserbase/stagehand/commit/5506f416d2609d112b553263984e21d7a30e32b1), [`84c05ca`](https://github.com/browserbase/stagehand/commit/84c05ca8de4587181faf128e5c7464fd960caacc), [`692ffa0`](https://github.com/browserbase/stagehand/commit/692ffa0346ad3d121686aba503c0a22844293efa), [`1ef8901`](https://github.com/browserbase/stagehand/commit/1ef8901e1314e90f43b36be20192e652d3b5598f), [`72ac775`](https://github.com/browserbase/stagehand/commit/72ac775a831d6f0f376ceda4426525f93cc21452), [`3d5af07`](https://github.com/browserbase/stagehand/commit/3d5af07f66d6d26d1f5ac4bd9be7183c3381dd92), [`40e1d80`](https://github.com/browserbase/stagehand/commit/40e1d80776b9216422a25a81070ccb3105e56ec2), [`56c0d24`](https://github.com/browserbase/stagehand/commit/56c0d244f9b2431218bfa832ddfc0587930ae038), [`16d72fb`](https://github.com/browserbase/stagehand/commit/16d72fb4c4081dd33bf45605d75c27644ea4c00e), [`088c4cc`](https://github.com/browserbase/stagehand/commit/088c4cc31dc924bb232a9d5a09ab42cd961c2d36), [`4276f4a`](https://github.com/browserbase/stagehand/commit/4276f4abc8bbde215faac6c0321bf243484c376b), [`6005786`](https://github.com/browserbase/stagehand/commit/600578637e65f6fd18b0cdb322b9e0b857708b2f), [`6fbf5fc`](https://github.com/browserbase/stagehand/commit/6fbf5fc811e5e5d9d22f10c5309fbd336892263a), [`704cf18`](https://github.com/browserbase/stagehand/commit/704cf18cb2bdd187ba06c35f05ccb47317a7668c), [`091296e`](https://github.com/browserbase/stagehand/commit/091296e438bb2374c8bb10ef6c08283978145ebf), [`e56c6eb`](https://github.com/browserbase/stagehand/commit/e56c6eb139bf3aad37e98b16626fff13a6c671d0), [`2cb78d0`](https://github.com/browserbase/stagehand/commit/2cb78d0f5ddef9f7337a9a2fe3137f1421df700a), [`5dad639`](https://github.com/browserbase/stagehand/commit/5dad63938f08d968d434bb1ee2804f1e54fb836a), 
[`b7c2571`](https://github.com/browserbase/stagehand/commit/b7c2571ad4ac563f3ca0518e1f29a40da93e33bc), [`4c69117`](https://github.com/browserbase/stagehand/commit/4c6911748953199dc9aad3eabe98bcf325f871e4)]:
  - @browserbasehq/stagehand@3.0.8

## 3.2.0

### Minor Changes

- [#1459](https://github.com/browserbase/stagehand/pull/1459) [`abb3469`](https://github.com/browserbase/stagehand/commit/abb3469f51627b318a856fafe6047ff24e681666) Thanks [@monadoid](https://github.com/monadoid)! - Added building of binaries

- [#1457](https://github.com/browserbase/stagehand/pull/1457) [`5fc1281`](https://github.com/browserbase/stagehand/commit/5fc12817a6529d4c59f2e32db92c916095a9a81e) Thanks [@monadoid](https://github.com/monadoid)! - First changeset for stagehand-server

- [#1469](https://github.com/browserbase/stagehand/pull/1469) [`d634d45`](https://github.com/browserbase/stagehand/commit/d634d45a0dbc3a4c876413d94cf4aedace1f56d7) Thanks [@monadoid](https://github.com/monadoid)! - Bump to test binary builds

### Patch Changes

- Updated dependencies [[`0f3991e`](https://github.com/browserbase/stagehand/commit/0f3991eedc0aaff72ef718dda3ddb0839cf4a464), [`e0e22e0`](https://github.com/browserbase/stagehand/commit/e0e22e06bc752a8ffde30f3dbfa58d91e24e6c09), [`f261051`](https://github.com/browserbase/stagehand/commit/f2610517d74774374de9ee93191e663439ef55e5), [`e021674`](https://github.com/browserbase/stagehand/commit/e021674f9641c1c5f9d0c1817c3fdf599eea124d), [`6a5496f`](https://github.com/browserbase/stagehand/commit/6a5496f17dbb716be1ee1aaa4e5ba9d8c723b30b), [`fea1700`](https://github.com/browserbase/stagehand/commit/fea1700552af3319052f463685752501c8e71de3), [`5b288d9`](https://github.com/browserbase/stagehand/commit/5b288d9ac37406ff22460ac8050bea26b87a378e), [`e822f5a`](https://github.com/browserbase/stagehand/commit/e822f5a8898df9eb48ca32c321025f0c74b638f0), [`638efc7`](https://github.com/browserbase/stagehand/commit/638efc7fea401bc43dd05dceedf4c13a3495a728), [`a890f16`](https://github.com/browserbase/stagehand/commit/a890f16fa3a752f308f858e5ab9c9a0faf6b3b34), [`934f492`](https://github.com/browserbase/stagehand/commit/934f492ec587bef81f0ce75b45a35b44ab545712), [`bd2db92`](https://github.com/browserbase/stagehand/commit/bd2db925f66a826d61d58be1611d55646cbdb560), [`51e0170`](https://github.com/browserbase/stagehand/commit/51e01709ce1c947c1947b4e2cb0b1f4f97b77182), [`05f5580`](https://github.com/browserbase/stagehand/commit/05f5580937c3c157550e3c25ae6671f44f562211), [`f56a9c2`](https://github.com/browserbase/stagehand/commit/f56a9c296d4ddce25a405358c66837f8ce4d679f), [`b40ae11`](https://github.com/browserbase/stagehand/commit/b40ae11391af49c3581fce27faa1b7483fc4a169), [`0d2b398`](https://github.com/browserbase/stagehand/commit/0d2b398cd40b32a9ecaf28ede70853036b7c91bd), [`cd01f29`](https://github.com/browserbase/stagehand/commit/cd01f290578eac703521f801ba3712f5332918f3), [`a734fca`](https://github.com/browserbase/stagehand/commit/a734fca0b4573753767d3ebc48ec414baf4f23e1), 
[`b342acf`](https://github.com/browserbase/stagehand/commit/b342acfaae058127fb57664644c5fd965db02bf2), [`2987cd1`](https://github.com/browserbase/stagehand/commit/2987cd1e5ffabefa9411936609635d4a638faed5), [`dfab1d5`](https://github.com/browserbase/stagehand/commit/dfab1d566299c8c5a63f20565a6da07dc8f61ccd), [`4d71162`](https://github.com/browserbase/stagehand/commit/4d71162beb119635b69b17637564a2bbd0e373e7)]:
  - @browserbasehq/stagehand@3.0.7

## 3.0.6

### Patch Changes

- Updated dependencies [[`605ed6b`](https://github.com/browserbase/stagehand/commit/605ed6b81a3ff8f25d4022f1e5fce6b42aecfc19), [`34e7e5b`](https://github.com/browserbase/stagehand/commit/34e7e5b292f5e6af6efc0da60118663310c5f718), [`943d2d7`](https://github.com/browserbase/stagehand/commit/943d2d79d0f289ac41c9164578f2f1dd876058f2), [`0e95cd2`](https://github.com/browserbase/stagehand/commit/0e95cd2f67672f64f0017024fd47d8b3aef59a95), [`d4237e4`](https://github.com/browserbase/stagehand/commit/d4237e40951ecd10abfdbe766672d498f8806484), [`86975e7`](https://github.com/browserbase/stagehand/commit/86975e795db7505804949a267b20509bd16b5256), [`d5e119b`](https://github.com/browserbase/stagehand/commit/d5e119be5eec84915a79f8d611b6ba0546f48c99), [`4e051b2`](https://github.com/browserbase/stagehand/commit/4e051b23add7ae276b0dbead38b4587838cfc1c1), [`6b5a3c9`](https://github.com/browserbase/stagehand/commit/6b5a3c9035654caaed2da375085b465edda97de4), [`bb85ad9`](https://github.com/browserbase/stagehand/commit/bb85ad912738623a7a866f0cb6e8d5807c6c2738), [`88d28cc`](https://github.com/browserbase/stagehand/commit/88d28cc6f31058d1cf6ec6dc948a4ae77a926b3c), [`45bcef0`](https://github.com/browserbase/stagehand/commit/45bcef0e5788b083f9e38dfd7c3bc63afcd4b6dd), [`6aa9d45`](https://github.com/browserbase/stagehand/commit/6aa9d455aa5836ec2ee8ab2e8b9df3fb218e5381), [`d382084`](https://github.com/browserbase/stagehand/commit/d382084745fff98c3e71413371466394a2625429), [`1df08cc`](https://github.com/browserbase/stagehand/commit/1df08ccb0a2cf73b5c37a91c129721114ff6371c), [`2b56600`](https://github.com/browserbase/stagehand/commit/2b566009606fcbba987260f21b075b318690ce99)]:
  - @browserbasehq/stagehand@3.0.6


================================================
FILE: packages/server-v3/README.md
================================================
# Stagehand API

The Stagehand API is a powerful service that provides a RESTful interface for browser automation and session management using the Browserbase platform. It enables recording, playback, and manipulation of browser sessions with a focus on reliability and performance.

## 📋 Prerequisites

To run the Stagehand API locally, ensure you have the following installed:

- Node.js
- pnpm

## 🛠 Installation

1. Clone the repository:

```bash
git clone https://github.com/browserbase/stagehand/
cd stagehand/packages/server-v3
```

2. Install dependencies:

```bash
pnpm install
```

3. Set up environment variables:

```bash
cp .env.example .env
```

4. Configure your `.env` file with the environment variables required by `src/lib/env.ts` (BB environment, API base URLs, etc.).

5. Start the development server:

```bash
pnpm dev
```


================================================
FILE: packages/server-v3/SDK_RELEASE_WORKFLOW.md
================================================


================================================
FILE: packages/server-v3/openapi.v3.yaml
================================================
openapi: "3.1.0"
info:
  title: Stagehand API
  version: "3.1.0"
  description: >-
    Stagehand SDK for AI browser automation [ALPHA]. This API allows clients to

    execute browser automation tasks remotely on the Browserbase cloud.

    All endpoints except /sessions/start require an active session ID.

    Responses are streamed using Server-Sent Events (SSE) when the

    `x-stream-response: true` header is provided.


    This SDK is currently ALPHA software and is not production ready!

    Please try it and give us your feedback, stay tuned for upcoming release
    announcements!
  contact:
    name: Browserbase
    url: https://browserbase.com
components:
  securitySchemes:
    BrowserbaseApiKey:
      type: apiKey
      in: header
      name: x-bb-api-key
      description: Browserbase API key for authentication
    BrowserbaseProjectId:
      type: apiKey
      in: header
      name: x-bb-project-id
      description: Browserbase project ID
    ModelApiKey:
      type: apiKey
      in: header
      name: x-model-api-key
      description: API key for the AI model provider (OpenAI, Anthropic, etc.)
  links:
    SessionAct:
      operationId: SessionAct
      parameters:
        id: $response.body#/data/sessionId
      description: Perform an action on the session
    SessionExtract:
      operationId: SessionExtract
      parameters:
        id: $response.body#/data/sessionId
      description: Extract data from the session
    SessionObserve:
      operationId: SessionObserve
      parameters:
        id: $response.body#/data/sessionId
      description: Observe available actions on the session
    SessionNavigate:
      operationId: SessionNavigate
      parameters:
        id: $response.body#/data/sessionId
      description: Navigate to a URL in the session
    SessionAgentExecute:
      operationId: SessionAgentExecute
      parameters:
        id: $response.body#/data/sessionId
      description: Execute an agent on the session
    SessionReplay:
      operationId: SessionReplay
      parameters:
        id: $response.body#/data/sessionId
      description: Replay session metrics
    SessionEnd:
      operationId: SessionEnd
      parameters:
        id: $response.body#/data/sessionId
      description: End the session and release resources
  schemas:
    AgentCacheEntry:
      type: object
      properties:
        cacheKey:
          description: Opaque cache identifier computed from instruction, URL, options,
            and config
          type: string
        entry:
          description: Serialized cache entry that can be written to disk
      required:
        - cacheKey
        - entry
    BrowserbaseRegion:
      type: string
      enum:
        - us-west-2
        - us-east-1
        - eu-central-1
        - ap-southeast-1
    LocalBrowserLaunchOptions:
      type: object
      properties:
        args:
          type: array
          items:
            type: string
        executablePath:
          type: string
        port:
          type: number
        userDataDir:
          type: string
        preserveUserDataDir:
          type: boolean
        headless:
          type: boolean
        devtools:
          type: boolean
        chromiumSandbox:
          type: boolean
        ignoreDefaultArgs:
          anyOf:
            - type: boolean
            - type: array
              items:
                type: string
        proxy:
          type: object
          properties:
            server:
              type: string
            bypass:
              type: string
            username:
              type: string
            password:
              type: string
          required:
            - server
        locale:
          type: string
        viewport:
          type: object
          properties:
            width:
              type: number
            height:
              type: number
          required:
            - width
            - height
        deviceScaleFactor:
          type: number
        hasTouch:
          type: boolean
        ignoreHTTPSErrors:
          type: boolean
        cdpUrl:
          type: string
        cdpHeaders:
          type: object
          propertyNames:
            type: string
          additionalProperties:
            type: string
        connectTimeoutMs:
          type: number
        downloadsPath:
          type: string
        acceptDownloads:
          type: boolean
      additionalProperties: false
    ModelConfigObject:
      type: object
      properties:
        provider:
          description: AI provider for the model (or provide a baseURL endpoint instead)
          example: openai
          type: string
          enum:
            - openai
            - anthropic
            - google
            - microsoft
            - bedrock
        modelName:
          description: Model name string with provider prefix (e.g., 'openai/gpt-5-nano')
          example: openai/gpt-5-nano
          type: string
        apiKey:
          description: API key for the model provider
          example: sk-some-openai-api-key
          type: string
        baseURL:
          description: Base URL for the model provider
          example: https://api.openai.com/v1
          type: string
          format: uri
      required:
        - modelName
    ModelConfig:
      $ref: "#/components/schemas/ModelConfigObject"
    Action:
      description: Action object returned by observe and used by act
      type: object
      properties:
        selector:
          description: CSS selector or XPath for the element
          example: "[data-testid='submit-button']"
          type: string
        description:
          description: Human-readable description of the action
          example: Click the submit button
          type: string
        backendNodeId:
          description: Backend node ID for the element
          type: number
        method:
          description: The method to execute (click, fill, etc.)
          example: click
          type: string
        arguments:
          description: Arguments to pass to the method
          example:
            - Hello World
          type: array
          items:
            type: string
      required:
        - selector
        - description
    BrowserConfig:
      type: object
      properties:
        type:
          description: Browser type to use
          example: local
          type: string
          enum:
            - local
            - browserbase
        cdpUrl:
          description: Chrome DevTools Protocol URL for connecting to existing browser
          example: ws://localhost:9222
          type: string
        launchOptions:
          $ref: "#/components/schemas/LocalBrowserLaunchOptions"
    BrowserbaseViewport:
      type: object
      properties:
        width:
          type: number
        height:
          type: number
    BrowserbaseFingerprintScreen:
      type: object
      properties:
        maxHeight:
          type: number
        maxWidth:
          type: number
        minHeight:
          type: number
        minWidth:
          type: number
    BrowserbaseFingerprint:
      type: object
      properties:
        browsers:
          type: array
          items:
            type: string
            enum:
              - chrome
              - edge
              - firefox
              - safari
        devices:
          type: array
          items:
            type: string
            enum:
              - desktop
              - mobile
        httpVersion:
          type: string
          enum:
            - "1"
            - "2"
        locales:
          type: array
          items:
            type: string
        operatingSystems:
          type: array
          items:
            type: string
            enum:
              - android
              - ios
              - linux
              - macos
              - windows
        screen:
          $ref: "#/components/schemas/BrowserbaseFingerprintScreen"
    BrowserbaseContext:
      type: object
      properties:
        id:
          type: string
        persist:
          type: boolean
      required:
        - id
    BrowserbaseBrowserSettings:
      type: object
      properties:
        advancedStealth:
          type: boolean
        blockAds:
          type: boolean
        context:
          $ref: "#/components/schemas/BrowserbaseContext"
        extensionId:
          type: string
        fingerprint:
          $ref: "#/components/schemas/BrowserbaseFingerprint"
        logSession:
          type: boolean
        recordSession:
          type: boolean
        solveCaptchas:
          type: boolean
        viewport:
          $ref: "#/components/schemas/BrowserbaseViewport"
    BrowserbaseProxyGeolocation:
      type: object
      properties:
        country:
          type: string
        city:
          type: string
        state:
          type: string
      required:
        - country
    BrowserbaseProxyConfig:
      type: object
      properties:
        type:
          type: string
          const: browserbase
        domainPattern:
          type: string
        geolocation:
          $ref: "#/components/schemas/BrowserbaseProxyGeolocation"
      required:
        - type
    ExternalProxyConfig:
      type: object
      properties:
        type:
          type: string
          const: external
        server:
          type: string
        domainPattern:
          type: string
        username:
          type: string
        password:
          type: string
      required:
        - type
        - server
    ProxyConfig:
      oneOf:
        - $ref: "#/components/schemas/BrowserbaseProxyConfig"
        - $ref: "#/components/schemas/ExternalProxyConfig"
      type: object
      discriminator:
        propertyName: type
        mapping:
          browserbase: "#/components/schemas/BrowserbaseProxyConfig"
          external: "#/components/schemas/ExternalProxyConfig"
    BrowserbaseSessionCreateParams:
      type: object
      properties:
        projectId:
          type: string
        browserSettings:
          $ref: "#/components/schemas/BrowserbaseBrowserSettings"
        extensionId:
          type: string
        keepAlive:
          type: boolean
        proxies:
          anyOf:
            - type: boolean
            - type: array
              items:
                $ref: "#/components/schemas/ProxyConfig"
        region:
          $ref: "#/components/schemas/BrowserbaseRegion"
        timeout:
          type: number
        userMetadata:
          type: object
          propertyNames:
            type: string
          additionalProperties: {}
    SessionStartRequest:
      type: object
      properties:
        modelName:
          description: Model name to use for AI operations
          example: openai/gpt-4o
          type: string
        domSettleTimeoutMs:
          description: Timeout in ms to wait for DOM to settle
          example: 5000
          type: number
        verbose:
          description: Logging verbosity level (0=quiet, 1=normal, 2=debug)
          example: 1
          type: number
          enum:
            - 0
            - 1
            - 2
        systemPrompt:
          description: Custom system prompt for AI operations
          type: string
        browserbaseSessionCreateParams:
          $ref: "#/components/schemas/BrowserbaseSessionCreateParams"
        browser:
          $ref: "#/components/schemas/BrowserConfig"
        selfHeal:
          description: Enable self-healing for failed actions
          example: true
          type: boolean
        browserbaseSessionID:
          description: Existing Browserbase session ID to resume
          type: string
        experimental:
          type: boolean
        waitForCaptchaSolves:
          description: Wait for captcha solves (deprecated, v2 only)
          type: boolean
        actTimeoutMs:
          description: Timeout in ms for act operations (deprecated, v2 only)
          type: number
      required:
        - modelName
    SessionStartResult:
      type: object
      properties:
        sessionId:
          description: Unique Browserbase session identifier
          example: c4dbf3a9-9a58-4b22-8a1c-9f20f9f9e123
          type: string
        cdpUrl:
          description: CDP WebSocket URL for connecting to the Browserbase cloud browser
            (present when available)
          example: wss://connect.browserbase.com/?signingKey=abc123
          anyOf:
            - type: string
            - type: "null"
        available:
          type: boolean
      required:
        - sessionId
        - available
    ActOptions:
      type: object
      properties:
        model:
          description: Model configuration object or model name string (e.g.,
            'openai/gpt-5-nano')
          anyOf:
            - $ref: "#/components/schemas/ModelConfig"
            - type: string
        variables:
          description: Variables to substitute in the action instruction
          example:
            username: john_doe
          type: object
          propertyNames:
            type: string
          additionalProperties:
            type: string
        timeout:
          description: Timeout in ms for the action
          example: 30000
          type: number
    ActRequest:
      type: object
      properties:
        input:
          description: Natural language instruction or Action object
          example: Click the login button
          anyOf:
            - type: string
            - $ref: "#/components/schemas/Action"
        options:
          $ref: "#/components/schemas/ActOptions"
        frameId:
          description: Target frame ID for the action
          anyOf:
            - type: string
            - type: "null"
        streamResponse:
          description: Whether to stream the response via SSE
          example: true
          type: boolean
      required:
        - input
    ActResultData:
      type: object
      properties:
        success:
          description: Whether the action completed successfully
          example: true
          type: boolean
        message:
          description: Human-readable result message
          example: Successfully clicked the login button
          type: string
        actionDescription:
          description: Description of the action that was performed
          example: Clicked button with text 'Login'
          type: string
        actions:
          description: List of actions that were executed
          type: array
          items:
            $ref: "#/components/schemas/Action"
      required:
        - success
        - message
        - actionDescription
        - actions
    ActResult:
      type: object
      properties:
        result:
          $ref: "#/components/schemas/ActResultData"
        actionId:
          description: Action ID for tracking
          type: string
      required:
        - result
    ExtractOptions:
      type: object
      properties:
        model:
          description: Model configuration object or model name string (e.g.,
            'openai/gpt-5-nano')
          anyOf:
            - $ref: "#/components/schemas/ModelConfig"
            - type: string
        timeout:
          description: Timeout in ms for the extraction
          example: 30000
          type: number
        selector:
          description: CSS selector to scope extraction to a specific element
          example: "#main-content"
          type: string
    # Request body for an extraction. Every field is optional: the
    # instruction, a free-form JSON Schema describing the desired output,
    # ExtractOptions, a nullable target frame ID, and the SSE streaming flag.
    ExtractRequest:
      type: object
      properties:
        instruction:
          type: string
          description: Natural language instruction for what to extract
          example: Extract all product names and prices from the page
        schema:
          type: object
          description: JSON Schema defining the structure of data to extract
          propertyNames: { type: string }
          additionalProperties: {}
        options:
          $ref: '#/components/schemas/ExtractOptions'
        frameId:
          description: Target frame ID for the extraction
          anyOf:
            - { type: string }
            - { type: 'null' }
        streamResponse:
          type: boolean
          description: Whether to stream the response via SSE
          example: true
    # Extraction outcome. `result` is required and deliberately untyped
    # (flagged x-stainless-any); `actionId` is an optional tracking ID.
    ExtractResult:
      type: object
      required: [result]
      properties:
        result:
          x-stainless-any: true
          description: Extracted data matching the requested schema
        actionId:
          type: string
          description: Action ID for tracking
    # Optional tuning knobs for an observation: model selection, timeout in
    # milliseconds, and a CSS selector that scopes the observation.
    # No field is required.
    ObserveOptions:
      type: object
      properties:
        model:
          description: >-
            Model configuration object or model name string
            (e.g., 'openai/gpt-5-nano')
          anyOf:
            - $ref: '#/components/schemas/ModelConfig'
            - type: string
        timeout:
          type: number
          description: Timeout in ms for the observation
          example: 30000
        selector:
          type: string
          description: CSS selector to scope observation to a specific element
          example: nav
    # Request body for an observation. Every field is optional: the
    # instruction, ObserveOptions, a nullable target frame ID, and the SSE
    # streaming flag.
    ObserveRequest:
      type: object
      properties:
        instruction:
          type: string
          description: Natural language instruction for what actions to find
          example: Find all clickable navigation links
        options:
          $ref: '#/components/schemas/ObserveOptions'
        frameId:
          description: Target frame ID for the observation
          anyOf:
            - { type: string }
            - { type: 'null' }
        streamResponse:
          type: boolean
          description: Whether to stream the response via SSE
          example: true
    # Observation outcome: a required array of Action objects (`result`)
    # plus an optional tracking ID.
    ObserveResult:
      type: object
      required: [result]
      properties:
        result:
          type: array
          items:
            $ref: '#/components/schemas/Action'
        actionId:
          type: string
          description: Action ID for tracking
    # Agent configuration. Every field is optional.
    #   provider        - legacy provider selector; its description points to `model`.
    #   model           - ModelConfig object or a model name string.
    #   systemPrompt    - custom system prompt.
    #   cua             - deprecated boolean switch, superseded by `mode`; flagged
    #                     `deprecated: true` so tooling surfaces what the
    #                     description already states.
    #   mode            - tool mode (dom | hybrid | cua); overrides `cua` when set.
    #   executionModel  - model used for tool execution; per its description it
    #                     falls back to the main model configuration when omitted.
    AgentConfig:
      type: object
      properties:
        provider:
          type: string
          description: >-
            AI provider for the agent (legacy, use model: openai/gpt-5-nano
            instead)
          example: openai
          enum: [openai, anthropic, google, microsoft, bedrock]
        model:
          description: >-
            Model configuration object or model name string
            (e.g., 'openai/gpt-5-nano')
          anyOf:
            - $ref: '#/components/schemas/ModelConfig'
            - type: string
        systemPrompt:
          type: string
          description: Custom system prompt for the agent
        cua:
          type: boolean
          deprecated: true
          description: >-
            Deprecated. Use mode: 'cua' instead. If both are provided, mode
            takes precedence.
          example: true
        mode:
          type: string
          description: Tool mode for the agent (dom, hybrid, cua). If set, overrides cua.
          example: cua
          enum: [dom, hybrid, cua]
        executionModel:
          description: >-
            Model configuration object or model name string (e.g.,
            'openai/gpt-5-nano') for tool execution (observe/act calls within
            agent tools). If not specified, inherits from the main model
            configuration.
          anyOf:
            - $ref: '#/components/schemas/ModelConfig'
            - type: string
    # A single step recorded by the agent. Only `type` is required; the
    # schema is open (additionalProperties: {}), so further keys of any
    # shape are accepted.
    AgentAction:
      type: object
      required: [type]
      additionalProperties: {}
      properties:
        type:
          type: string
          description: Type of action taken
          example: click
        reasoning:
          type: string
          description: Agent's reasoning for taking this action
        taskCompleted: { type: boolean }
        action: { type: string }
        timeMs:
          type: number
          description: Time taken for this action in ms
        pageText: { type: string }
        pageUrl: { type: string }
        instruction: { type: string }
    # Numeric usage counters for an agent run. input_tokens, output_tokens
    # and inference_time_ms are required; the reasoning and cached-input
    # counters are optional.
    AgentUsage:
      type: object
      required: [input_tokens, output_tokens, inference_time_ms]
      properties:
        input_tokens:
          type: number
          example: 1500
        output_tokens:
          type: number
          example: 250
        reasoning_tokens: { type: number }
        cached_input_tokens: { type: number }
        inference_time_ms:
          type: number
          example: 2500
    # Result of an agent run. success, message, actions and completed are
    # required; `metadata` (free-form object) and `usage` are optional.
    AgentResultData:
      type: object
      required: [success, message, actions, completed]
      properties:
        success:
          type: boolean
          description: Whether the agent completed successfully
          example: true
        message:
          type: string
          description: Summary of what the agent accomplished
          example: Successfully logged in and navigated to dashboard
        actions:
          type: array
          items:
            $ref: '#/components/schemas/AgentAction'
        completed:
          type: boolean
          description: Whether the agent finished its task
          example: true
        metadata:
          type: object
          propertyNames: { type: string }
          additionalProperties: {}
        usage:
          $ref: '#/components/schemas/AgentUsage'
    # Per-execution options for the agent. Only `instruction` is required;
    # step limit, cursor highlighting, web search and the per-tool timeout
    # are optional.
    AgentExecuteOptions:
      type: object
      required: [instruction]
      properties:
        instruction:
          type: string
          description: Natural language instruction for the agent
          example: >-
            Log in with username 'demo' and password 'test123', then navigate
            to settings
        maxSteps:
          type: number
          description: Maximum number of steps the agent can take
          example: 20
        highlightCursor:
          type: boolean
          description: Whether to visually highlight the cursor during execution
          example: true
        useSearch:
          type: boolean
          description: >-
            Whether to enable the web search tool powered by Browserbase
            Search API
          example: true
        toolTimeout:
          type: number
          description: Timeout in milliseconds for each agent tool call
          example: 30000
    # Request body for an agent execution. `agentConfig` and
    # `executeOptions` are required; frame targeting, SSE streaming and
    # cache capture are optional.
    AgentExecuteRequest:
      type: object
      required: [agentConfig, executeOptions]
      properties:
        agentConfig:
          $ref: '#/components/schemas/AgentConfig'
        executeOptions:
          $ref: '#/components/schemas/AgentExecuteOptions'
        frameId:
          description: Target frame ID for the agent
          anyOf:
            - { type: string }
            - { type: 'null' }
        streamResponse:
          type: boolean
          description: Whether to stream the response via SSE
          example: true
        shouldCache:
          type: boolean
          description: >-
            If true, the server captures a cache entry and returns it to the
            client
    # Agent execution outcome: the required AgentResultData payload plus an
    # optional AgentCacheEntry.
    AgentExecuteResult:
      type: object
      required: [result]
      properties:
        result:
          $ref: '#/components/schemas/AgentResultData'
        cacheEntry:
          $ref: '#/components/schemas/AgentCacheEntry'
    # Optional navigation settings: Referer header, timeout in milliseconds,
    # and the completion condition (load | domcontentloaded | networkidle).
    NavigateOptions:
      type: object
      properties:
        referer:
          type: string
          description: Referer header to send with the request
        timeout:
          type: number
          description: Timeout in ms for the navigation
          example: 30000
        waitUntil:
          type: string
          description: When to consider navigation complete
          example: networkidle
          enum: [load, domcontentloaded, networkidle]
    # Request body for a navigation. Only `url` is required; options, a
    # nullable target frame ID and the SSE streaming flag are optional.
    NavigateRequest:
      type: object
      required: [url]
      properties:
        url:
          type: string
          description: URL to navigate to
          example: https://example.com
        options:
          $ref: '#/components/schemas/NavigateOptions'
        frameId:
          description: Target frame ID for the navigation
          anyOf:
            - { type: string }
            - { type: 'null' }
        streamResponse:
          type: boolean
          description: Whether to stream the response via SSE
          example: true
    # Navigation outcome. `result` is required and accepts either any value
    # or null (flagged x-stainless-any); `actionId` is an optional tracking ID.
    NavigateResult:
      type: object
      required: [result]
      properties:
        result:
          x-stainless-any: true
          description: Navigation response (Playwright Response object or null)
          anyOf:
            - {}
            - type: 'null'
        actionId:
          type: string
          description: Action ID for tracking
    # Four optional numeric counters: inputTokens, outputTokens, timeMs, cost.
    TokenUsage:
      type: object
      properties:
        inputTokens: { type: number }
        outputTokens: { type: number }
        timeMs: { type: number }
        cost: { type: number }
    # One recorded call within a replay: method name, free-form parameters
    # and result objects, and a numeric timestamp are required; `endTime`
    # and `tokenUsage` are optional.
    ReplayAction:
      type: object
      required: [method, parameters, result, timestamp]
      properties:
        method: { type: string }
        parameters:
          type: object
          propertyNames: { type: string }
          additionalProperties: {}
        result:
          type: object
          propertyNames: { type: string }
          additionalProperties: {}
        timestamp: { type: number }
        endTime: { type: number }
        tokenUsage:
          $ref: '#/components/schemas/TokenUsage'
    # A page entry in a replay: URL, numeric timestamp and duration, and the
    # ReplayAction list recorded for it. All four fields are required.
    ReplayPage:
      type: object
      required: [url, timestamp, duration, actions]
      properties:
        url: { type: string }
        timestamp: { type: number }
        duration: { type: number }
        actions:
          type: array
          items:
            $ref: '#/components/schemas/ReplayAction'
    # Replay payload: a required list of ReplayPage entries and an optional
    # `clientLanguage` string.
    ReplayResult:
      type: object
      required: [pages]
      properties:
        pages:
          type: array
          items:
            $ref: '#/components/schemas/ReplayPage'
        clientLanguage: { type: string }
    # String enum of the five statuses a streaming operation can report.
    StreamEventStatus:
      type: string
      description: Current status of the streaming operation
      enum: [starting, connected, running, finished, error]
    # String enum distinguishing the two stream event kinds: system and log.
    StreamEventType:
      type: string
      description: Type of stream event - system events or log messages
      enum: [system, log]
    # Data carried by a system stream event. `status` is required; `result`
    # (untyped, x-stainless-any) and `error` are optional and, per their
    # descriptions, tied to the 'finished' and 'error' statuses respectively.
    StreamEventSystemData:
      type: object
      required: [status]
      properties:
        status:
          $ref: '#/components/schemas/StreamEventStatus'
        result:
          x-stainless-any: true
          description: Operation result (present when status is 'finished')
        error:
          type: string
          description: Error message (present when status is 'error')
    # Data carried by a log stream event: `status` is pinned to the constant
    # "running" and `message` holds the log text. Both are required.
    StreamEventLogData:
      type: object
      required: [status, message]
      properties:
        status:
          type: string
          const: running
        message:
          type: string
          description: Log message from the operation
    # Closed response envelope: required `success` flag plus a required
    # `data` payload of type SessionStartResultOutput.
    SessionStartResponse:
      type: object
      required: [success, data]
      additionalProperties: false
      properties:
        success:
          type: boolean
          description: Indicates whether the request was successful
        data:
          $ref: '#/components/schemas/SessionStartResultOutput'
    # Closed response envelope carrying only the required `success` flag.
    SessionEndResponse:
      type: object
      required: [success]
      additionalProperties: false
      properties:
        success:
          type: boolean
          description: Indicates whether the request was successful
    # Closed response envelope: required `success` flag plus a required
    # `data` payload of type ActResultOutput.
    ActResponse:
      type: object
      required: [success, data]
      additionalProperties: false
      properties:
        success:
          type: boolean
          description: Indicates whether the request was successful
        data:
          $ref: '#/components/schemas/ActResultOutput'
    # Closed response envelope: required `success` flag plus a required
    # `data` payload of type ExtractResultOutput.
    ExtractResponse:
      type: object
      required: [success, data]
      additionalProperties: false
      properties:
        success:
          type: boolean
          description: Indicates whether the request was successful
        data:
          $ref: '#/components/schemas/ExtractResultOutput'
    # Closed response envelope: required `success` flag plus a required
    # `data` payload of type ObserveResultOutput.
    ObserveResponse:
      type: object
      required: [success, data]
      additionalProperties: false
      properties:
        success:
          type: boolean
          description: Indicates whether the request was successful
        data:
          $ref: '#/components/schemas/ObserveResultOutput'
    # Closed response envelope: required `success` flag plus a required
    # `data` payload of type AgentExecuteResultOutput.
    AgentExecuteResponse:
      type: object
      required: [success, data]
      additionalProperties: false
      properties:
        success:
          type: boolean
          description: Indicates whether the request was successful
        data:
          $ref: '#/components/schemas/AgentExecuteResultOutput'
    # Closed response envelope: required `success` flag plus a required
    # `data` payload of type NavigateResultOutput.
    NavigateResponse:
      type: object
      required: [success, data]
      additionalProperties: false
      properties:
        success:
          type: boolean
          description: Indicates whether the request was successful
        data:
          $ref: '#/components/schemas/NavigateResultOutput'
    # Closed response envelope: required `success` flag plus a required
    # `data` payload of type ReplayResultOutput.
    ReplayResponse:
      type: object
      required: [success, data]
      additionalProperties: false
      properties:
        success:
          type: boolean
          description: Indicates whether the request was successful
        data:
          $ref: '#/components/schemas/ReplayResultOutput'
    # Cache entry returned to the client: an opaque `cacheKey` string and the
    # serialized `entry`. Both are required and the object is closed.
    # `entry` intentionally declares no type; it carries x-stainless-any so
    # it is treated like the other free-form fields in this spec.
    # NOTE(review): confirm the input-side AgentCacheEntry schema is flagged
    # the same way.
    AgentCacheEntryOutput:
      type: object
      required: [cacheKey, entry]
      additionalProperties: false
      properties:
        cacheKey:
          type: string
          description: >-
            Opaque cache identifier computed from instruction, URL, options,
            and config
        entry:
          x-stainless-any: true
          description: Serialized cache entry that can be written to disk
    # Launch options for a locally started browser. Every top-level field is
    # optional and the object is closed. Nested objects:
    #   proxy      - closed object, `server` required.
    #   viewport   - closed object, `width` and `height` both required.
    #   cdpHeaders - string-to-string map.
    # `ignoreDefaultArgs` accepts either a boolean or a list of strings.
    LocalBrowserLaunchOptionsOutput:
      type: object
      additionalProperties: false
      properties:
        args:
          type: array
          items: { type: string }
        executablePath: { type: string }
        port: { type: number }
        userDataDir: { type: string }
        preserveUserDataDir: { type: boolean }
        headless: { type: boolean }
        devtools: { type: boolean }
        chromiumSandbox: { type: boolean }
        ignoreDefaultArgs:
          anyOf:
            - { type: boolean }
            - type: array
              items: { type: string }
        proxy:
          type: object
          required: [server]
          additionalProperties: false
          properties:
            server: { type: string }
            bypass: { type: string }
            username: { type: string }
            password: { type: string }
        locale: { type: string }
        viewport:
          type: object
          required: [width, height]
          additionalProperties: false
          properties:
            width: { type: number }
            height: { type: number }
        deviceScaleFactor: { type: number }
        hasTouch: { type: boolean }
        ignoreHTTPSErrors: { type: boolean }
        cdpUrl: { type: string }
        cdpHeaders:
          type: object
          propertyNames: { type: string }
          additionalProperties: { type: string }
        connectTimeoutMs: { type: number }
        downloadsPath: { type: string }
        acceptDownloads: { type: boolean }
    # Object form of a model configuration. Only `modelName` is required;
    # provider, API key and base URL (format: uri) are optional. Closed object.
    ModelConfigObjectOutput:
      type: object
      required: [modelName]
      additionalProperties: false
      properties:
        provider:
          type: string
          description: AI provider for the model (or provide a baseURL endpoint instead)
          example: openai
          enum: [openai, anthropic, google, microsoft, bedrock]
        modelName:
          type: string
          description: Model name string with provider prefix (e.g., 'openai/gpt-5-nano')
          example: openai/gpt-5-nano
        apiKey:
          type: string
          description: API key for the model provider
          example: sk-some-openai-api-key
        baseURL:
          type: string
          format: uri
          description: Base URL for the model provider
          example: https://api.openai.com/v1
    # Alias: resolves directly to ModelConfigObjectOutput.
    ModelConfigOutput:
      $ref: '#/components/schemas/ModelConfigObjectOutput'
    # Action descriptor. `selector` and `description` are required;
    # backendNodeId, method and the string-array `arguments` are optional.
    # Closed object.
    ActionOutput:
      type: object
      description: Action object returned by observe and used by act
      required: [selector, description]
      additionalProperties: false
      properties:
        selector:
          type: string
          description: CSS selector or XPath for the element
          example: "[data-testid='submit-button']"
        description:
          type: string
          description: Human-readable description of the action
          example: Click the submit button
        backendNodeId:
          type: number
          description: Backend node ID for the element
        method:
          type: string
          description: The method to execute (click, fill, etc.)
          example: click
        arguments:
          type: array
          description: Arguments to pass to the method
          example: [Hello World]
          items: { type: string }
    # Browser selection: `type` (local | browserbase), an optional CDP URL,
    # and optional local launch options. No field is required; closed object.
    BrowserConfigOutput:
      type: object
      additionalProperties: false
      properties:
        type:
          type: string
          description: Browser type to use
          example: local
          enum: [local, browserbase]
        cdpUrl:
          type: string
          description: Chrome DevTools Protocol URL for connecting to existing browser
          example: ws://localhost:9222
        launchOptions:
          $ref: '#/components/schemas/LocalBrowserLaunchOptionsOutput'
    # Viewport dimensions; `width` and `height` are both optional numbers.
    # Closed object.
    BrowserbaseViewportOutput:
      type: object
      additionalProperties: false
      properties:
        width: { type: number }
        height: { type: number }
    # Optional numeric min/max bounds for screen width and height.
    # Closed object.
    BrowserbaseFingerprintScreenOutput:
      type: object
      additionalProperties: false
      properties:
        maxHeight: { type: number }
        maxWidth: { type: number }
        minHeight: { type: number }
        minWidth: { type: number }
    # Fingerprint constraints. All fields are optional: enum-restricted lists
    # of browsers, devices and operating systems, an HTTP version given as
    # the string "1" or "2", a free-form locale list, and screen bounds.
    # Closed object.
    BrowserbaseFingerprintOutput:
      type: object
      additionalProperties: false
      properties:
        browsers:
          type: array
          items:
            type: string
            enum: [chrome, edge, firefox, safari]
        devices:
          type: array
          items:
            type: string
            enum: [desktop, mobile]
        httpVersion:
          type: string
          enum: ['1', '2']
        locales:
          type: array
          items: { type: string }
        operatingSystems:
          type: array
          items:
            type: string
            enum: [android, ios, linux, macos, windows]
        screen:
          $ref: '#/components/schemas/BrowserbaseFingerprintScreenOutput'
    # Context reference: required string `id` and optional boolean `persist`.
    # Closed object.
    BrowserbaseContextOutput:
      type: object
      required: [id]
      additionalProperties: false
      properties:
        id: { type: string }
        persist: { type: boolean }
    # Browser settings for a Browserbase session. All fields are optional:
    # several boolean toggles, an extension ID, and references to the
    # context, fingerprint and viewport schemas. Closed object.
    BrowserbaseBrowserSettingsOutput:
      type: object
      additionalProperties: false
      properties:
        advancedStealth: { type: boolean }
        blockAds: { type: boolean }
        context:
          $ref: '#/components/schemas/BrowserbaseContextOutput'
        extensionId: { type: string }
        fingerprint:
          $ref: '#/components/schemas/BrowserbaseFingerprintOutput'
        logSession: { type: boolean }
        recordSession: { type: boolean }
        solveCaptchas: { type: boolean }
        viewport:
          $ref: '#/components/schemas/BrowserbaseViewportOutput'
    # Proxy geolocation: `country` is required; `city` and `state` are
    # optional. All are strings. Closed object.
    BrowserbaseProxyGeolocationOutput:
      type: object
      required: [country]
      additionalProperties: false
      properties:
        country: { type: string }
        city: { type: string }
        state: { type: string }
    # Proxy variant whose required `type` is the constant "browserbase";
    # domain pattern and geolocation are optional. Closed object.
    BrowserbaseProxyConfigOutput:
      type: object
      required: [type]
      additionalProperties: false
      properties:
        type:
          type: string
          const: browserbase
        domainPattern: { type: string }
        geolocation:
          $ref: '#/components/schemas/BrowserbaseProxyGeolocationOutput'
    # Proxy variant whose required `type` is the constant "external".
    # `server` is also required; domain pattern and credentials are optional.
    # Closed object.
    ExternalProxyConfigOutput:
      type: object
      required: [type, server]
      additionalProperties: false
      properties:
        type:
          type: string
          const: external
        server: { type: string }
        domainPattern: { type: string }
        username: { type: string }
        password: { type: string }
    # Tagged union of the two proxy variants, discriminated on `type`
    # ("browserbase" or "external").
    ProxyConfigOutput:
      type: object
      discriminator:
        propertyName: type
        mapping:
          browserbase: '#/components/schemas/BrowserbaseProxyConfigOutput'
          external: '#/components/schemas/ExternalProxyConfigOutput'
      oneOf:
        - $ref: '#/components/schemas/BrowserbaseProxyConfigOutput'
        - $ref: '#/components/schemas/ExternalProxyConfigOutput'
    # Parameters for creating a Browserbase session. All fields are optional
    # and the object is closed. `proxies` accepts either a boolean or a list
    # of ProxyConfigOutput entries; `userMetadata` is a free-form object.
    BrowserbaseSessionCreateParamsOutput:
      type: object
      additionalProperties: false
      properties:
        projectId: { type: string }
        browserSettings:
          $ref: '#/components/schemas/BrowserbaseBrowserSettingsOutput'
        extensionId: { type: string }
        keepAlive: { type: boolean }
        proxies:
          anyOf:
            - { type: boolean }
            - type: array
              items:
                $ref: '#/components/schemas/ProxyConfigOutput'
        region:
          $ref: '#/components/schemas/BrowserbaseRegion'
        timeout: { type: number }
        userMetadata:
          type: object
          propertyNames: { type: string }
          additionalProperties: {}
    # Result of starting a session. `sessionId` and `available` are required;
    # `cdpUrl` is optional and may be a string or null. Closed object.
    SessionStartResultOutput:
      type: object
      required: [sessionId, available]
      additionalProperties: false
      properties:
        sessionId:
          type: string
          description: Unique Browserbase session identifier
          example: c4dbf3a9-9a58-4b22-8a1c-9f20f9f9e123
        cdpUrl:
          description: >-
            CDP WebSocket URL for connecting to the Browserbase cloud browser
            (present when available)
          example: wss://connect.browserbase.com/?signingKey=abc123
          anyOf:
            - { type: string }
            - { type: 'null' }
        available: { type: boolean }
    # Optional settings for an action: model selection, a string-to-string
    # map of instruction variables, and a timeout in milliseconds.
    # Closed object.
    ActOptionsOutput:
      type: object
      additionalProperties: false
      properties:
        model:
          description: >-
            Model configuration object or model name string
            (e.g., 'openai/gpt-5-nano')
          anyOf:
            - $ref: '#/components/schemas/ModelConfigOutput'
            - type: string
        variables:
          type: object
          description: Variables to substitute in the action instruction
          example: { username: john_doe }
          propertyNames: { type: string }
          additionalProperties: { type: string }
        timeout:
          type: number
          description: Timeout in ms for the action
          example: 30000
    # Outcome of an executed action (closed output form): success flag,
    # result message, description of what was performed, and the executed
    # ActionOutput list. All four fields are required.
    ActResultDataOutput:
      type: object
      required: [success, message, actionDescription, actions]
      additionalProperties: false
      properties:
        success:
          type: boolean
          description: Whether the action completed successfully
          example: true
        message:
          type: string
          description: Human-readable result message
          example: Successfully clicked the login button
        actionDescription:
          type: string
          description: Description of the action that was performed
          example: Clicked button with text 'Login'
        actions:
          type: array
          description: List of actions that were executed
          items:
            $ref: '#/components/schemas/ActionOutput'
    # Pairs the required ActResultDataOutput payload with an optional
    # tracking ID. Closed object.
    ActResultOutput:
      type: object
      required: [result]
      additionalProperties: false
      properties:
        result:
          $ref: '#/components/schemas/ActResultDataOutput'
        actionId:
          type: string
          description: Action ID for tracking
    # Optional extraction settings (closed output form): model selection,
    # timeout in milliseconds, and a scoping CSS selector.
    ExtractOptionsOutput:
      type: object
      additionalProperties: false
      properties:
        model:
          description: >-
            Model configuration object or model name string
            (e.g., 'openai/gpt-5-nano')
          anyOf:
            - $ref: '#/components/schemas/ModelConfigOutput'
            - type: string
        timeout:
          type: number
          description: Timeout in ms for the extraction
          example: 30000
        selector:
          type: string
          description: CSS selector to scope extraction to a specific element
          example: '#main-content'
    # Extraction outcome (closed output form). `result` is required and
    # deliberately untyped (x-stainless-any); `actionId` is optional.
    ExtractResultOutput:
      type: object
      required: [result]
      additionalProperties: false
      properties:
        result:
          x-stainless-any: true
          description: Extracted data matching the requested schema
        actionId:
          type: string
          description: Action ID for tracking
    # Optional observation settings (closed output form): model selection,
    # timeout in milliseconds, and a scoping CSS selector.
    ObserveOptionsOutput:
      type: object
      additionalProperties: false
      properties:
        model:
          description: >-
            Model configuration object or model name string
            (e.g., 'openai/gpt-5-nano')
          anyOf:
            - $ref: '#/components/schemas/ModelConfigOutput'
            - type: string
        timeout:
          type: number
          description: Timeout in ms for the observation
          example: 30000
        selector:
          type: string
          description: CSS selector to scope observation to a specific element
          example: nav
    # Observation outcome (closed output form): a required array of
    # ActionOutput objects plus an optional tracking ID.
    ObserveResultOutput:
      type: object
      required: [result]
      additionalProperties: false
      properties:
        result:
          type: array
          items:
            $ref: '#/components/schemas/ActionOutput'
        actionId:
          type: string
          description: Action ID for tracking
    # Agent configuration (closed output form). Every field is optional.
    #   provider        - legacy provider selector; its description points to `model`.
    #   model           - ModelConfigOutput object or a model name string.
    #   systemPrompt    - custom system prompt.
    #   cua             - deprecated boolean switch, superseded by `mode`; flagged
    #                     `deprecated: true` so tooling surfaces what the
    #                     description already states.
    #   mode            - tool mode (dom | hybrid | cua); overrides `cua` when set.
    #   executionModel  - model used for tool execution; per its description it
    #                     falls back to the main model configuration when omitted.
    AgentConfigOutput:
      type: object
      additionalProperties: false
      properties:
        provider:
          type: string
          description: >-
            AI provider for the agent (legacy, use model: openai/gpt-5-nano
            instead)
          example: openai
          enum: [openai, anthropic, google, microsoft, bedrock]
        model:
          description: >-
            Model configuration object or model name string
            (e.g., 'openai/gpt-5-nano')
          anyOf:
            - $ref: '#/components/schemas/ModelConfigOutput'
            - type: string
        systemPrompt:
          type: string
          description: Custom system prompt for the agent
        cua:
          type: boolean
          deprecated: true
          description: >-
            Deprecated. Use mode: 'cua' instead. If both are provided, mode
            takes precedence.
          example: true
        mode:
          type: string
          description: Tool mode for the agent (dom, hybrid, cua). If set, overrides cua.
          example: cua
          enum: [dom, hybrid, cua]
        executionModel:
          description: >-
            Model configuration object or model name string (e.g.,
            'openai/gpt-5-nano') for tool execution (observe/act calls within
            agent tools). If not specified, inherits from the main model
            configuration.
          anyOf:
            - $ref: '#/components/schemas/ModelConfigOutput'
            - type: string
    # Numeric usage counters for an agent run (closed output form).
    # input_tokens, output_tokens and inference_time_ms are required; the
    # reasoning and cached-input counters are optional.
    AgentUsageOutput:
      type: object
      required: [input_tokens, output_tokens, inference_time_ms]
      additionalProperties: false
      properties:
        input_tokens:
          type: number
          example: 1500
        output_tokens:
          type: number
          example: 250
        reasoning_tokens: { type: number }
        cached_input_tokens: { type: number }
        inference_time_ms:
          type: number
          example: 2500
    # Result of an agent run (closed output form). success, message, actions
    # and completed are required; `metadata` (free-form object) and `usage`
    # are optional. Items of `actions` reference the AgentAction schema.
    AgentResultDataOutput:
      type: object
      required: [success, message, actions, completed]
      additionalProperties: false
      properties:
        success:
          type: boolean
          description: Whether the agent completed successfully
          example: true
        message:
          type: string
          description: Summary of what the agent accomplished
          example: Successfully logged in and navigated to dashboard
        actions:
          type: array
          items:
            $ref: '#/components/schemas/AgentAction'
        completed:
          type: boolean
          description: Whether the agent finished its task
          example: true
        metadata:
          type: object
          propertyNames: { type: string }
          additionalProperties: {}
        usage:
          $ref: '#/components/schemas/AgentUsageOutput'
    # Per-execution options for the agent (closed output form). Only
    # `instruction` is required; step limit, cursor highlighting, web search
    # and the per-tool timeout are optional.
    AgentExecuteOptionsOutput:
      type: object
      required: [instruction]
      additionalProperties: false
      properties:
        instruction:
          type: string
          description: Natural language instruction for the agent
          example: >-
            Log in with username 'demo' and password 'test123', then navigate
            to settings
        maxSteps:
          type: number
          description: Maximum number of steps the agent can take
          example: 20
        highlightCursor:
          type: boolean
          description: Whether to visually highlight the cursor during execution
          example: true
        useSearch:
          type: boolean
          description: >-
            Whether to enable the web search tool powered by Browserbase
            Search API
          example: true
        toolTimeout:
          type: number
          description: Timeout in milliseconds for each agent tool call
          example: 30000
    # Agent execution outcome (closed output form): the required
    # AgentResultDataOutput payload plus an optional AgentCacheEntryOutput.
    AgentExecuteResultOutput:
      type: object
      required: [result]
      additionalProperties: false
      properties:
        result:
          $ref: '#/components/schemas/AgentResultDataOutput'
        cacheEntry:
          $ref: '#/components/schemas/AgentCacheEntryOutput'
    # Optional navigation settings (closed output form): Referer header,
    # timeout in milliseconds, and the completion condition
    # (load | domcontentloaded | networkidle).
    NavigateOptionsOutput:
      type: object
      additionalProperties: false
      properties:
        referer:
          type: string
          description: Referer header to send with the request
        timeout:
          type: number
          description: Timeout in ms for the navigation
          example: 30000
        waitUntil:
          type: string
          description: When to consider navigation complete
          example: networkidle
          enum: [load, domcontentloaded, networkidle]
    # Navigation outcome (closed output form). `result` is required and
    # accepts either any value or null (x-stainless-any); `actionId` is an
    # optional tracking ID.
    NavigateResultOutput:
      type: object
      required: [result]
      additionalProperties: false
      properties:
        result:
          x-stainless-any: true
          description: Navigation response (Playwright Response object or null)
          anyOf:
            - {}
            - type: 'null'
        actionId:
          type: string
          description: Action ID for tracking
    TokenUsageOutput:
      type: object
      properties:
        inputTokens:
          type: number
        outputTokens:
          type: number
        timeMs:
          type: number
        cost:
          type: number
      additionalProperties: false
    ReplayActionOutput:
      type: object
      properties:
        method:
          type: string
        parameters:
          type: object
          propertyNames:
            type: string
          additionalProperties: {}
        result:
          type: object
          propertyNames:
            type: string
          additionalProperties: {}
        timestamp:
          type: number
        endTime:
          type: number
        tokenUsage:
          $ref: "#/components/schemas/TokenUsageOutput"
      required:
        - method
        - parameters
        - result
        - timestamp
      additionalProperties: false
    ReplayPageOutput:
      type: object
      properties:
        url:
          type: string
        timestamp:
          type: number
        duration:
          type: number
        actions:
          type: array
          items:
            $ref: "#/components/schemas/ReplayActionOutput"
      required:
        - url
        - timestamp
        - duration
        - actions
      additionalProperties: false
    ReplayResultOutput:
      type: object
      properties:
        pages:
          type: array
          items:
            $ref: "#/components/schemas/ReplayPageOutput"
        clientLanguage:
          type: string
      required:
        - pages
      additionalProperties: false
    StreamEventSystemDataOutput:
      type: object
      properties:
        status:
          $ref: "#/components/schemas/StreamEventStatus"
        result:
          description: Operation result (present when status is 'finished')
          x-stainless-any: true
        error:
          description: Error message (present when status is 'error')
          type: string
      required:
        - status
      additionalProperties: false
    StreamEventLogDataOutput:
      type: object
      properties:
        status:
          type: string
          const: running
        message:
          description: Log message from the operation
          type: string
      required:
        - status
        - message
      additionalProperties: false
    SessionIdParams:
      type: object
      properties:
        id:
          description: Unique session identifier
          example: c4dbf3a9-9a58-4b22-8a1c-9f20f9f9e123
          type: string
      required:
        - id
      additionalProperties: false
    SessionHeaders:
      type: object
      properties:
        x-stream-response:
          description: Whether to stream the response via SSE
          example: "true"
          type: string
          enum:
            - "true"
            - "false"
      additionalProperties: false
    ErrorResponse:
      type: object
      properties:
        success:
          type: boolean
          const: false
        error:
          type: string
        code:
          type: string
      required:
        - success
        - error
      additionalProperties: false
    SessionEndResult:
      type: object
      properties: {}
      additionalProperties: false
    StreamEvent:
      description: "Server-Sent Event emitted during streaming responses. Events are
        sent as `data: <JSON>\\n\\n`. Key order: data (with status first), type,
        id."
      type: object
      properties:
        data:
          anyOf:
            - $ref: "#/components/schemas/StreamEventSystemDataOutput"
            - $ref: "#/components/schemas/StreamEventLogDataOutput"
        type:
          $ref: "#/components/schemas/StreamEventType"
        id:
          description: Unique identifier for this event
          example: c4dbf3a9-9a58-4b22-8a1c-9f20f9f9e123
          type: string
          format: uuid
          pattern: ^([0-9a-fA-F]{8}-[0-9a-fA-F]{4}-[1-8][0-9a-fA-F]{3}-[89abAB][0-9a-fA-F]{3}-[0-9a-fA-F]{12}|00000000-0000-0000-0000-000000000000|ffffffff-ffff-ffff-ffff-ffffffffffff)$
      required:
        - data
        - type
        - id
      additionalProperties: false
paths:
  /v1/sessions/{id}/act:
    post:
      operationId: SessionAct
      summary: Perform an action
      description: Executes a browser action using natural language instructions or a
        predefined Action object.
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/ActRequest"
        required: true
      parameters:
        - schema:
            description: Unique session identifier
            example: c4dbf3a9-9a58-4b22-8a1c-9f20f9f9e123
            type: string
          in: path
          name: id
          required: true
          description: Unique session identifier
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/ActResponse"
  /v1/sessions/{id}/end:
    post:
      operationId: SessionEnd
      summary: End a browser session
      description: Terminates the browser session and releases all associated resources.
      parameters:
        - schema:
            description: Unique session identifier
            example: c4dbf3a9-9a58-4b22-8a1c-9f20f9f9e123
            type: string
          in: path
          name: id
          required: true
          description: Unique session identifier
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/SessionEndResponse"
  /v1/sessions/{id}/extract:
    post:
      operationId: SessionExtract
      summary: Extract data from the page
      description: Extracts structured data from the current page using AI-powered analysis.
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/ExtractRequest"
        required: true
      parameters:
        - schema:
            description: Unique session identifier
            example: c4dbf3a9-9a58-4b22-8a1c-9f20f9f9e123
            type: string
          in: path
          name: id
          required: true
          description: Unique session identifier
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/ExtractResponse"
  /v1/sessions/{id}/navigate:
    post:
      operationId: SessionNavigate
      summary: Navigate to a URL
      description: Navigates the browser to the specified URL.
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/NavigateRequest"
        required: true
      parameters:
        - schema:
            description: Unique session identifier
            example: c4dbf3a9-9a58-4b22-8a1c-9f20f9f9e123
            type: string
          in: path
          name: id
          required: true
          description: Unique session identifier
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/NavigateResponse"
  /v1/sessions/{id}/observe:
    post:
      operationId: SessionObserve
      summary: Observe available actions
      description: Identifies and returns available actions on the current page that
        match the given instruction.
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/ObserveRequest"
        required: true
      parameters:
        - schema:
            description: Unique session identifier
            example: c4dbf3a9-9a58-4b22-8a1c-9f20f9f9e123
            type: string
          in: path
          name: id
          required: true
          description: Unique session identifier
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/ObserveResponse"
  /v1/sessions/{id}/replay:
    get:
      operationId: SessionReplay
      summary: Replay session metrics
      description: Retrieves replay metrics for a session.
      parameters:
        - schema:
            description: Unique session identifier
            example: c4dbf3a9-9a58-4b22-8a1c-9f20f9f9e123
            type: string
          in: path
          name: id
          required: true
          description: Unique session identifier
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/ReplayResponse"
  /v1/sessions/start:
    post:
      operationId: SessionStart
      summary: Start a new browser session
      description: Creates a new browser session with the specified configuration.
        Returns a session ID used for all subsequent operations.
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/SessionStartRequest"
        required: true
      parameters:
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/SessionStartResponse"
  /v1/sessions/{id}/agentExecute:
    post:
      operationId: SessionAgentExecute
      summary: Execute an AI agent
      description: Runs an autonomous AI agent that can perform complex multi-step
        browser tasks.
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/AgentExecuteRequest"
        required: true
      parameters:
        - schema:
            description: Unique session identifier
            example: c4dbf3a9-9a58-4b22-8a1c-9f20f9f9e123
            type: string
          in: path
          name: id
          required: true
          description: Unique session identifier
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/AgentExecuteResponse"
servers:
  - url: https://api.stagehand.browserbase.com
security:
  - BrowserbaseApiKey: []
    BrowserbaseProjectId: []
    ModelApiKey: []


================================================
FILE: packages/server-v3/package.json
================================================
{
  "name": "@browserbasehq/stagehand-server-v3",
  "version": "3.6.1",
  "description": "Stagehand API server v3",
  "type": "module",
  "private": true,
  "scripts": {
    "build": "pnpm --filter @browserbasehq/stagehand-server-v3 run --parallel \"/^(build:esm-tests|build:server:dist|gen:openapi|build:sea:esm)$/\"",
    "dev": "tsx watch src/server.ts",
    "build:esm-tests": "pnpm -w --dir ../.. exec tsc -p packages/server-v3/tsconfig.tests.json",
    "build:server:dist": "pnpm -w --dir ../.. exec tsc -p packages/server-v3/tsconfig.json && pnpm -w --dir ../.. exec tsc-alias -p packages/server-v3/tsconfig.json",
    "build:sea:esm": "tsx scripts/build-sea.ts --mode=esm",
    "build:sea:cjs": "tsx scripts/build-sea.ts --mode=cjs",
    "lint": "cd ../.. && prettier --check packages/server-v3 && cd packages/server-v3 && eslint . && pnpm run typecheck",
    "typecheck": "pnpm -w --dir ../.. exec tsc -p packages/server-v3/tsconfig.json --noEmit",
    "test": "pnpm -w --dir ../.. exec turbo run test:server --filter=@browserbasehq/stagehand-server-v3 --",
    "test:server": "tsx scripts/test-server.ts",
    "test:integration": "pnpm run test:server -- packages/server-v3/dist/tests/integration",
    "test:integration:local": "STAGEHAND_SERVER_TARGET=local pnpm run test:server -- packages/server-v3/dist/tests/integration",
    "test:integration:sea": "STAGEHAND_SERVER_TARGET=sea pnpm run test:server -- packages/server-v3/dist/tests/integration",
    "gen:openapi": "tsx scripts/gen-openapi.ts"
  },
  "dependencies": {
    "@browserbasehq/sdk": "^2.7.0",
    "@browserbasehq/stagehand": "workspace:*",
    "@fastify/cors": "^11.0.1",
    "@fastify/swagger": "^9.6.1",
    "@fastify/swagger-ui": "^5.2.3",
    "@t3-oss/env-core": "^0.13.8",
    "fastify": "^5.3.2",
    "fastify-metrics": "^12.1.0",
    "fastify-plugin": "^4.5.1",
    "fastify-zod-openapi": "^5.5.0",
    "http-status-codes": "^2.3.0",
    "pino": "^9.7.0",
    "pino-pretty": "^11.3.0",
    "playwright": "1.52.0",
    "uuid": "^11.0.5",
    "zod": "^4.2.1"
  },
  "devDependencies": {
    "@types/node": "22.13.1",
    "eslint": "10.0.2",
    "eslint-plugin-security": "^3.0.1",
    "openai": "4.87.1",
    "postject": "1.0.0-alpha.6",
    "prettier": "^3.2.5",
    "source-map": "^0.7.4",
    "tsc-alias": "^1.8.10",
    "tsx": "*",
    "vitest": "^4.0.8"
  },
  "repository": {
    "type": "git",
    "url": "git+https://github.com/browserbase/stagehand.git",
    "directory": "packages/server-v3"
  },
  "bugs": {
    "url": "https://github.com/browserbase/stagehand/issues"
  },
  "homepage": "https://stagehand.dev"
}


================================================
FILE: packages/server-v3/scripts/build-sea.ts
================================================
#!/usr/bin/env node
/**
 * Build SEA binary from ESM (test) or CJS (release) bundles.
 *
 * Prereqs:
 * - CJS mode: runs core CJS build via Turbo if dist is missing.
 * - ESM mode: core dist/esm available (pnpm run build:esm).
 * - postject installed; tar available for non-Windows downloads.
 *
 * Args: --mode=esm|cjs --target-platform=<platform> --target-arch=<arch> --binary-name=<name>
 *       --include-sourcemaps=<bool>
 * Env: SEA_BUILD_MODE, SEA_TARGET_PLATFORM, SEA_TARGET_ARCH, SEA_BINARY_NAME,
 *      SEA_INCLUDE_SOURCEMAPS.
 * Example: pnpm run build:sea:cjs -- --target-platform=linux --target-arch=arm64
 */
import { spawnSync } from "node:child_process";
import { createHash } from "node:crypto";
import fs from "node:fs";
import os from "node:os";
import path from "node:path";
import https from "node:https";
import { pathToFileURL } from "node:url";
import esbuild from "esbuild";
import { getRepoRootDir } from "./runtimePaths.js";

// Repository root; every path built in this script is anchored here.
const repoDir = getRepoRootDir();
// Sentinel string handed to postject via --sentinel-fuse and searched for in
// candidate Node binaries (see hasSeaFuse) before they are used for injection.
const seaFuse = "NODE_SEA_FUSE_fce680ab2cc467b6e072b8b5df1996b2";

/**
 * Looks up a command-line option in `process.argv`.
 *
 * Both `--name value` and `--name=value` spellings are recognised; the first
 * matching token (scanning left to right) wins. A bare `--name` with no
 * following token is ignored.
 *
 * @param name Option name without the leading dashes.
 * @returns The option's value, or `undefined` when it is not present.
 */
const argValue = (name: string) => {
  const flag = `--${name}`;
  const inlinePrefix = `${flag}=`;
  const argv = process.argv;

  for (const [index, token] of argv.entries()) {
    if (token === flag) {
      const following = argv[index + 1];
      if (following) return following;
    }
    if (token.startsWith(inlinePrefix)) {
      return token.slice(inlinePrefix.length);
    }
  }
  return undefined;
};

// Build mode, lower-cased. Precedence: --mode argument, then the
// SEA_BUILD_MODE environment variable, then the "esm" default.
const mode = (
  argValue("mode") ??
  process.env.SEA_BUILD_MODE ??
  "esm"
).toLowerCase();
/**
 * Interprets a textual on/off switch.
 *
 * Matching is case-insensitive. `1`, `true`, `yes` and `on` mean true;
 * `0`, `false`, `no` and `off` mean false.
 *
 * @param value Raw text, or `undefined` when the option was not supplied.
 * @param fallback Result to use when `value` is `undefined`.
 * @returns The parsed boolean.
 * @throws Error when `value` is present but not one of the accepted spellings.
 */
const parseBoolean = (
  value: string | undefined,
  fallback: boolean,
): boolean => {
  if (value === undefined) return fallback;

  switch (value.toLowerCase()) {
    case "1":
    case "true":
    case "yes":
    case "on":
      return true;
    case "0":
    case "false":
    case "no":
    case "off":
      return false;
    default:
      throw new Error(
        `Invalid boolean value "${value}" for --include-sourcemaps / SEA_INCLUDE_SOURCEMAPS`,
      );
  }
};
// Target platform. Precedence: --target-platform, --platform,
// SEA_TARGET_PLATFORM, then the host's process.platform.
const targetPlatform =
  argValue("target-platform") ??
  argValue("platform") ??
  process.env.SEA_TARGET_PLATFORM ??
  process.platform;
// Target CPU architecture. Precedence: --target-arch, --arch,
// SEA_TARGET_ARCH, then the host's process.arch.
const targetArch =
  argValue("target-arch") ??
  argValue("arch") ??
  process.env.SEA_TARGET_ARCH ??
  process.arch;
// Output file name. Defaults to stagehand-server-v3-<platform>-<arch>, with
// an ".exe" suffix when the target platform is win32.
const binaryName =
  argValue("binary-name") ??
  process.env.SEA_BINARY_NAME ??
  `stagehand-server-v3-${targetPlatform}-${targetArch}${targetPlatform === "win32" ? ".exe" : ""}`;
// Whether the ESM bundle carries an inline sourcemap; off unless requested via
// --include-sourcemaps or SEA_INCLUDE_SOURCEMAPS.
const includeSourcemaps = parseBoolean(
  argValue("include-sourcemaps") ?? process.env.SEA_INCLUDE_SOURCEMAPS,
  false,
);

/**
 * Runs a command synchronously with its stdio attached to this process.
 *
 * @param cmd Executable to launch.
 * @param args Arguments passed to the executable.
 * @param opts Optional settings; `cwd` sets the working directory.
 * @throws Error when the process cannot be started or its exit status is not 0.
 */
const run = (cmd: string, args: string[], opts: { cwd?: string } = {}) => {
  const commandLine = `${cmd} ${args.join(" ")}`;
  const { error, status } = spawnSync(cmd, args, {
    stdio: "inherit",
    ...opts,
  });

  if (error) {
    throw new Error(
      `Command failed to start: ${commandLine}\n${String(error)}`,
    );
  }
  if (status === 0) return;

  throw new Error(`Command failed: ${commandLine}`);
};

/**
 * Executes a JavaScript file with the Node binary that is running this script
 * (`process.execPath`), delegating process handling to `run`.
 *
 * @param scriptPath Path of the script to execute.
 * @param args Arguments forwarded to the script.
 * @param opts Optional settings; `cwd` sets the working directory.
 */
const runNodeScript = (
  scriptPath: string,
  args: string[],
  opts: { cwd?: string } = {},
) => {
  const nodeArgs = [scriptPath].concat(args);
  return run(process.execPath, nodeArgs, opts);
};

/**
 * Picks the first path in `paths` that exists on disk.
 *
 * @param paths Candidate locations, in priority order.
 * @returns The first candidate for which `fs.existsSync` is true.
 * @throws Error listing every candidate when none of them exist.
 */
const resolveFirstExisting = (paths: string[]): string => {
  const found = paths.find((candidate) => fs.existsSync(candidate));
  if (found === undefined) {
    throw new Error(`Missing tool script. Tried: ${paths.join(", ")}`);
  }
  return found;
};

/**
 * Best-effort command execution: output is discarded and neither a failed
 * launch nor a non-zero exit status is reported to the caller.
 *
 * @param cmd Executable to launch.
 * @param args Arguments passed to the executable.
 * @param opts Optional settings; `cwd` sets the working directory.
 */
const runOptional = (
  cmd: string,
  args: string[],
  opts: { cwd?: string } = {},
): void => {
  const spawnOptions = { stdio: "ignore" as const, ...opts };
  spawnSync(cmd, args, spawnOptions);
};

/**
 * Reports whether the file at `binaryPath` contains the SEA sentinel string.
 *
 * @param binaryPath File to inspect.
 * @returns `true` when the sentinel bytes are found; `false` when they are
 *   absent or the file cannot be read.
 */
const hasSeaFuse = (binaryPath: string): boolean => {
  let contents: Buffer;
  try {
    contents = fs.readFileSync(binaryPath);
  } catch {
    return false;
  }
  return contents.indexOf(Buffer.from(seaFuse)) !== -1;
};

/**
 * Downloads `url` over HTTPS into the file at `dest`, following redirects.
 *
 * - A `Location` header may be a relative reference, so it is resolved against
 *   the URL that produced the redirect before being followed.
 * - At most `redirectsLeft` redirects are followed, so a redirect loop cannot
 *   recurse forever.
 * - If the transfer fails after `dest` has been opened, the partial file is
 *   removed. resolveNodeBinary skips the download when the archive already
 *   exists, so a truncated leftover would otherwise be reused on the next run.
 *
 * @param url Absolute https URL to fetch.
 * @param dest Path of the file to write.
 * @param redirectsLeft Remaining redirect budget (defaults to 10).
 * @returns A promise that resolves once the file is fully written and closed.
 *   It rejects on network errors, non-200 responses, invalid or excessive
 *   redirects, and write errors.
 */
const download = (
  url: string,
  dest: string,
  redirectsLeft = 10,
): Promise<void> =>
  new Promise((resolve, reject) => {
    https
      .get(url, (res) => {
        const status = res.statusCode ?? 0;
        if (status >= 300 && status < 400) {
          // The redirect body is never needed; drain it so the socket is freed.
          res.resume();
          const location = res.headers.location;
          if (!location) {
            reject(new Error(`Redirect without location: ${url}`));
            return;
          }
          if (redirectsLeft <= 0) {
            reject(new Error(`Too many redirects: ${url}`));
            return;
          }
          let nextUrl: string;
          try {
            nextUrl = new URL(location, url).href;
          } catch {
            reject(
              new Error(`Invalid redirect location "${location}" from ${url}`),
            );
            return;
          }
          download(nextUrl, dest, redirectsLeft - 1).then(resolve, reject);
          return;
        }
        if (status !== 200) {
          reject(new Error(`Download failed (${res.statusCode}) ${url}`));
          res.resume();
          return;
        }

        const file = fs.createWriteStream(dest);
        let failed = false;
        const fail = (error: Error) => {
          if (failed) return;
          failed = true;
          res.unpipe(file);
          file.destroy();
          // Best-effort cleanup; the original error is what the caller sees.
          fs.rm(dest, { force: true }, () => reject(error));
        };

        res.on("error", fail);
        file.on("error", fail);
        file.on("finish", () => {
          file.close((closeError) => {
            if (closeError) {
              reject(closeError);
              return;
            }
            resolve();
          });
        });
        res.pipe(file);
      })
      .on("error", reject);
  });

/**
 * Locates a Node executable that can be used as the base of the SEA binary.
 *
 * The running Node binary is used when the target architecture matches the
 * host and the binary contains the SEA sentinel. Otherwise the distribution
 * matching `process.version` is fetched from nodejs.org into a directory under
 * the OS temp dir (reused on later runs), unpacked, and checked for the
 * sentinel.
 *
 * @returns Path of the Node executable to copy.
 * @throws Error when the target platform differs from the host, when the
 *   unpacked binary is missing, or when it lacks the SEA sentinel.
 */
const resolveNodeBinary = async (): Promise<string> => {
  if (targetPlatform !== process.platform) {
    throw new Error(
      `Cross-platform builds are not supported. Host=${process.platform}, target=${targetPlatform}`,
    );
  }

  if (targetArch === process.arch) {
    if (hasSeaFuse(process.execPath)) return process.execPath;
    console.warn(
      `Current Node binary at ${process.execPath} does not include ${seaFuse}; falling back to the official ${process.version} distribution for SEA injection.`,
    );
  }

  const nodeVersion = process.version;
  const isWindowsDist = targetPlatform === "win32";
  const distPlatform = isWindowsDist ? "win" : targetPlatform;
  const archiveBase = `node-${nodeVersion}-${distPlatform}-${targetArch}`;
  const archiveExt = isWindowsDist ? "zip" : "tar.xz";
  const tmpRoot = `${os.tmpdir()}/stagehand-server-v3-sea/${archiveBase}`;
  const archivePath = `${tmpRoot}/${archiveBase}.${archiveExt}`;
  const extractRoot = `${tmpRoot}/${archiveBase}`;
  const binaryPath = `${extractRoot}/${isWindowsDist ? "node.exe" : "bin/node"}`;

  // Shared sentinel check for both the cached and the freshly unpacked binary.
  const requireSeaFuse = () => {
    if (hasSeaFuse(binaryPath)) return;
    throw new Error(
      `Node binary at ${binaryPath} does not include ${seaFuse}; unable to build SEA binary. Delete ${tmpRoot} and retry.`,
    );
  };

  // A previous run already unpacked this distribution: reuse it.
  if (fs.existsSync(binaryPath)) {
    requireSeaFuse();
    return binaryPath;
  }

  fs.mkdirSync(tmpRoot, { recursive: true });
  if (!fs.existsSync(archivePath)) {
    await download(
      `https://nodejs.org/dist/${nodeVersion}/${archiveBase}.${archiveExt}`,
      archivePath,
    );
  }

  if (archiveExt !== "zip") {
    run("tar", ["-xf", archivePath, "-C", tmpRoot]);
  } else {
    if (process.platform !== "win32") {
      throw new Error("Windows binaries must be built on Windows runners.");
    }
    run("powershell", [
      "-Command",
      `Expand-Archive -Path '${archivePath}' -DestinationPath '${tmpRoot}' -Force`,
    ]);
  }

  if (!fs.existsSync(binaryPath)) {
    throw new Error(`Missing Node binary at ${binaryPath}`);
  }
  requireSeaFuse();
  return binaryPath;
};

/**
 * Writes `dist/sea/sea-config-<mode>.json` for the server-v3 package.
 *
 * `main` and `output` are stored relative to the package directory with
 * forward slashes; `execArgvExtension` is included only when a non-empty value
 * is supplied.
 *
 * @param mainPath Path of the script to embed.
 * @param outputPath Path where the SEA blob should be produced.
 * @param execArgvExtension Optional value for the config's `execArgvExtension`.
 * @returns Path of the written config file.
 */
const writeSeaConfig = (
  mainPath: string,
  outputPath: string,
  execArgvExtension?: string,
) => {
  const packageDir = `${repoDir}/packages/server-v3`;
  const relativeToPackage = (target: string) =>
    path.relative(packageDir, target).replaceAll("\\", "/");

  const config: { main: string; output: string; execArgvExtension?: string } =
    {
      main: relativeToPackage(mainPath),
      output: relativeToPackage(outputPath),
    };
  if (execArgvExtension) {
    config.execArgvExtension = execArgvExtension;
  }

  const configPath = `${packageDir}/dist/sea/sea-config-${mode}.json`;
  fs.writeFileSync(configPath, JSON.stringify(config, null, 2));
  return configPath;
};

/**
 * Produces the CommonJS bundle used as the SEA main script.
 *
 * Runs the `build:cjs` Turbo task for `@browserbasehq/stagehand`, then bundles
 * `packages/server-v3/src/sea-entry.ts` with esbuild into
 * `dist/sea/bundle.cjs`.
 *
 * @returns Path of the generated bundle.
 */
const buildCjsBundle = () => {
  const turboCli = resolveFirstExisting([
    `${repoDir}/node_modules/turbo/bin/turbo`,
  ]);
  const turboArgs = ["run", "build:cjs", "--filter", "@browserbasehq/stagehand"];
  runNodeScript(turboCli, turboArgs, { cwd: repoDir });

  const seaDir = `${repoDir}/packages/server-v3/dist/sea`;
  fs.mkdirSync(seaDir, { recursive: true });

  const outfile = `${seaDir}/bundle.cjs`;
  esbuild.buildSync({
    absWorkingDir: repoDir,
    entryPoints: ["packages/server-v3/src/sea-entry.ts"],
    outfile,
    bundle: true,
    platform: "node",
    format: "cjs",
    logLevel: "warning",
  });
  return outfile;
};

/**
 * Produces the SEA main script for ESM mode.
 *
 * Steps:
 * 1. Bundle `packages/server-v3/src/sea-entry.ts` with esbuild into
 *    `dist/app.mjs` (ESM, tree shaking disabled), resolving
 *    `@browserbasehq/stagehand` to the prebuilt core ESM entry.
 * 2. When sourcemaps are enabled, rewrite the inline sourcemap so every source
 *    is a repo-relative path under a `file://` sourceRoot pointing at the repo.
 * 3. Emit `dist/sea/sea-bootstrap.cjs`, a CommonJS script that embeds the
 *    bundle as base64, unpacks it into a cache directory at runtime, and
 *    dynamically imports it.
 *
 * @returns Path of the generated bootstrap script.
 * @throws Error when the core ESM build is missing, or when sourcemaps are
 *   enabled but no inline sourcemap is found in the bundle.
 */
const buildEsmBundle = () => {
  // The bundle aliases the core package to its ESM dist, so that must exist.
  if (!fs.existsSync(`${repoDir}/packages/core/dist/esm/index.js`)) {
    throw new Error(
      `Missing ${repoDir}/packages/core/dist/esm/index.js. Run pnpm run build:esm first.`,
    );
  }

  fs.mkdirSync(`${repoDir}/packages/server-v3/dist/sea`, { recursive: true });
  const appBundlePath = `${repoDir}/packages/server-v3/dist/app.mjs`;
  esbuild.buildSync({
    entryPoints: ["packages/server-v3/src/sea-entry.ts"],
    bundle: true,
    platform: "node",
    format: "esm",
    treeShaking: false,
    outfile: appBundlePath,
    alias: {
      "@browserbasehq/stagehand": `${repoDir}/packages/core/dist/esm/index.js`,
    },
    sourcemap: includeSourcemaps ? "inline" : false,
    sourcesContent: includeSourcemaps,
    ...(includeSourcemaps ? { sourceRoot: repoDir } : {}),
    // Defines a `require` function inside the ESM output via createRequire.
    banner: {
      js: 'import { createRequire as __createRequire } from "node:module"; const require = __createRequire(import.meta.url);',
    },
    logLevel: "warning",
    absWorkingDir: repoDir,
  });

  const appSource = fs.readFileSync(appBundlePath, "utf8");
  let finalAppSource = appSource;

  if (includeSourcemaps) {
    // The inline map is expected as a trailing base64 data URL.
    const mapMatch = appSource.match(
      /sourceMappingURL=data:application\/json;base64,([A-Za-z0-9+/=]+)\s*$/,
    );
    if (!mapMatch) {
      throw new Error("Missing inline sourcemap in dist/app.mjs");
    }
    const mapJson = Buffer.from(mapMatch[1], "base64").toString("utf8");
    const map = JSON.parse(mapJson) as {
      sourceRoot?: string;
      sources: string[];
      sourcesContent?: string[];
    };
    // Normalises Windows separators to forward slashes.
    const toPosix = (value: string) => value.replaceAll("\\", "/");
    // Converts a file:// URL to a path, dropping the leading slash in front of
    // a drive letter ("/C:/..." -> "C:/...").
    const fileUrlToPathSafe = (value: string) => {
      const parsed = new URL(value);
      let pathname = decodeURIComponent(parsed.pathname);
      if (/^\/[A-Za-z]:/.test(pathname)) {
        pathname = pathname.slice(1);
      }
      return pathname;
    };
    // Maps one sourcemap `sources` entry to a repo-relative POSIX path where
    // possible; entries that cannot be placed inside the repo are returned
    // with separators normalised only.
    const toRepoRelative = (source: string) => {
      let sourcePath = source;
      if (source.startsWith("file://")) {
        sourcePath = fileUrlToPathSafe(source);
      }

      if (path.isAbsolute(sourcePath)) {
        const normalizedSourcePath = toPosix(sourcePath);
        // NOTE(review): this prefix test assumes repoDir itself uses forward
        // slashes — confirm what getRepoRootDir returns on Windows.
        if (normalizedSourcePath.startsWith(`${repoDir}/`)) {
          return toPosix(path.relative(repoDir, normalizedSourcePath));
        }
        return normalizedSourcePath;
      }

      // Known relative prefixes are rewritten to their repo-relative location.
      if (sourcePath.startsWith("../src/")) {
        const rel = sourcePath.slice("../src/".length);
        return `packages/server-v3/src/${rel}`;
      }
      if (sourcePath.startsWith("../../core/")) {
        const rel = sourcePath.slice("../../core/".length);
        return `packages/core/${rel}`;
      }
      if (sourcePath.startsWith("../../../node_modules/")) {
        const rel = sourcePath.slice("../../../node_modules/".length);
        return `node_modules/${rel}`;
      }
      if (sourcePath.startsWith("src/")) {
        const rel = sourcePath.slice("src/".length);
        return `packages/server-v3/src/${rel}`;
      }
      if (sourcePath.startsWith("../node_modules/")) {
        const rel = sourcePath.slice("../node_modules/".length);
        return `node_modules/${rel}`;
      }
      if (sourcePath.startsWith("../core/")) {
        const rel = sourcePath.slice("../core/".length);
        return `packages/core/${rel}`;
      }
      if (sourcePath.startsWith("core/")) {
        return `packages/core/${sourcePath.slice("core/".length)}`;
      }
      // Already repo-relative.
      if (
        sourcePath.startsWith("packages/") ||
        sourcePath.startsWith("node_modules/")
      ) {
        return toPosix(sourcePath);
      }

      // Fallback: interpret the path relative to the server-v3 package dir.
      const resolved = toPosix(
        path.resolve(`${repoDir}/packages/server-v3`, sourcePath),
      );
      if (resolved.startsWith(`${repoDir}/`)) {
        return toPosix(path.relative(repoDir, resolved));
      }

      return toPosix(sourcePath);
    };

    map.sourceRoot = pathToFileURL(`${repoDir}/`).href;
    map.sources = map.sources.map(toRepoRelative);
    const updatedMap = Buffer.from(JSON.stringify(map)).toString("base64");
    // Swaps the original base64 payload for the rewritten one and persists it.
    // NOTE(review): String.prototype.replace with a string pattern replaces
    // only the first occurrence; this relies on the payload appearing once.
    finalAppSource = appSource.replace(mapMatch[1], updatedMap);
    fs.writeFileSync(appBundlePath, finalAppSource);
  }

  const appBytes = Buffer.from(finalAppSource);
  // First 12 hex characters of the bundle's SHA-256; the bootstrap uses it as
  // the name of its per-bundle cache directory.
  const bundleHash = createHash("sha256")
    .update(appBytes)
    .digest("hex")
    .slice(0, 12);
  const bootstrapPath = `${repoDir}/packages/server-v3/dist/sea/sea-bootstrap.cjs`;
  // Bootstrap source. At runtime it writes the embedded bundle to
  // <cacheRoot>/<bundleHash>/app.mjs (cacheRoot is STAGEHAND_SEA_CACHE_DIR or a
  // folder under the OS temp dir) unless a file of the same size is already
  // there, then imports it. The write goes to a temp file followed by a rename.
  const bootstrap = `/* eslint-disable */
const fs = require("node:fs");
const os = require("node:os");
const { pathToFileURL } = require("node:url");

const bundleBase64 = ${JSON.stringify(appBytes.toString("base64"))};
const bundleLength = ${appBytes.length};
const bundleHash = ${JSON.stringify(bundleHash)};

const cacheRoot =
  process.env.STAGEHAND_SEA_CACHE_DIR ||
  \`\${os.tmpdir()}/stagehand-server-v3-sea\`;
const cacheDir = \`\${cacheRoot}/\${bundleHash}\`;
const appPath = \`\${cacheDir}/app.mjs\`;

fs.mkdirSync(cacheDir, { recursive: true });
let needsWrite = true;
try {
  const stat = fs.statSync(appPath);
  needsWrite = stat.size !== bundleLength;
} catch {}

if (needsWrite) {
  const tmpPath =
    \`\${cacheDir}/app.mjs.tmp-\${process.pid}-\${Date.now().toString(16)}\`;
  fs.writeFileSync(tmpPath, Buffer.from(bundleBase64, "base64"));
  try {
    fs.renameSync(tmpPath, appPath);
  } catch (err) {
    if (!fs.existsSync(appPath)) throw err;
  }
  try {
    fs.chmodSync(appPath, 0o500);
  } catch {}
}

(async () => {
  await import(pathToFileURL(appPath).href);
})().catch((err) => {
  console.error(err);
  process.exitCode = 1;
});
`;
  fs.writeFileSync(bootstrapPath, bootstrap);
  return bootstrapPath;
};

/**
 * Entry point: builds the bundle for the selected mode, generates the SEA
 * blob, copies a Node executable to `dist/sea/<binaryName>`, and injects the
 * blob into it with postject.
 *
 * The blob is generated with `process.execPath` rather than whichever `node`
 * is first on PATH. The executable that receives the blob is derived from the
 * running Node (`process.execPath` or a download of `process.version`), so
 * generating the blob with the same Node keeps the two versions from
 * diverging.
 *
 * @throws Error for an unknown build mode, a missing blob after generation, or
 *   any failing build step.
 */
const main = async () => {
  const serverDir = `${repoDir}/packages/server-v3`;
  const seaDir = `${serverDir}/dist/sea`;
  const blobPath = `${seaDir}/sea-prep.blob`;

  fs.mkdirSync(seaDir, { recursive: true });

  let mainPath: string;
  let execArgvExtension: string | undefined;

  if (mode === "cjs") {
    mainPath = buildCjsBundle();
  } else if (mode === "esm") {
    mainPath = buildEsmBundle();
    execArgvExtension = "cli";
  } else {
    throw new Error(`Unknown SEA build mode: ${mode}`);
  }

  const seaConfigPath = writeSeaConfig(mainPath, blobPath, execArgvExtension);

  // Config paths are relative to the package dir, so run from there.
  run(process.execPath, ["--experimental-sea-config", seaConfigPath], {
    cwd: serverDir,
  });
  if (!fs.existsSync(blobPath)) {
    throw new Error(`Missing ${blobPath}; SEA blob generation failed.`);
  }

  const nodeBinary = await resolveNodeBinary();
  const outPath = `${seaDir}/${binaryName}`;
  fs.copyFileSync(nodeBinary, outPath);
  if (targetPlatform !== "win32") {
    fs.chmodSync(outPath, 0o755);
  }

  const isDarwin = targetPlatform === "darwin";

  // On macOS the existing signature is stripped before injection and the
  // binary is ad-hoc re-signed afterwards; both steps are best-effort.
  if (isDarwin) {
    runOptional("codesign", ["--remove-signature", outPath]);
  }

  const postjectCliPath = resolveFirstExisting([
    `${serverDir}/node_modules/postject/dist/cli.js`,
    `${repoDir}/node_modules/postject/dist/cli.js`,
  ]);
  const postjectArgs = [
    outPath,
    "NODE_SEA_BLOB",
    blobPath,
    "--sentinel-fuse",
    seaFuse,
  ];
  if (isDarwin) {
    postjectArgs.push("--macho-segment-name", "NODE_SEA");
  }
  runNodeScript(postjectCliPath, postjectArgs, { cwd: serverDir });

  if (isDarwin) {
    runOptional("codesign", ["--sign", "-", outPath]);
  }
};

// Run the build; on failure print only the error message (no stack trace) and
// exit with status 1.
main().catch((err) => {
  console.error(err instanceof Error ? err.message : String(err));
  process.exit(1);
});


================================================
FILE: packages/server-v3/scripts/gen-openapi.ts
================================================
import { writeFile } from "node:fs/promises";
import path from "node:path";
import { getCurrentDirPath } from "./runtimePaths.js";

import fastify from "fastify";
import fastifySwagger from "@fastify/swagger";
import {
  fastifyZodOpenApiPlugin,
  fastifyZodOpenApiTransformers,
  serializerCompiler,
  validatorCompiler,
  type FastifyZodOpenApiTypeProvider,
} from "fastify-zod-openapi";
import { Api } from "@browserbasehq/stagehand";

// Routes
import actRoute from "../src/routes/v1/sessions/_id/act.js";
import agentExecuteRoute from "../src/routes/v1/sessions/_id/agentExecute.js";
import endRoute from "../src/routes/v1/sessions/_id/end.js";
import extractRoute from "../src/routes/v1/sessions/_id/extract.js";
import navigateRoute from "../src/routes/v1/sessions/_id/navigate.js";
import observeRoute from "../src/routes/v1/sessions/_id/observe.js";
import replayRoute from "../src/routes/v1/sessions/_id/replay.js";
import startRoute from "../src/routes/v1/sessions/start.js";
import healthcheckRoute from "../src/routes/healthcheck.js";
import readinessRoute from "../src/routes/readiness.js";

// Destination of the generated spec: `openapi.v3.yaml` one level above the directory
// returned by getCurrentDirPath() (the directory of the calling file, i.e. this script).
const OUTPUT_PATH = path.resolve(getCurrentDirPath(), "../openapi.v3.yaml");

/**
 * Generates the OpenAPI document for the v3 server and writes it to OUTPUT_PATH.
 *
 * Builds a throwaway Fastify instance (never listening on a port), registers the
 * zod-openapi plugin with every shared schema as a named component, registers
 * @fastify/swagger with the document metadata, mounts the route definitions, and
 * finally serializes the resulting spec as YAML.
 *
 * Rejects if any plugin registration, `app.ready()`, or the file write fails;
 * the caller at the bottom of this file turns that into a non-zero exit code.
 */
async function main() {
  const app = fastify({
    logger: false,
  }).withTypeProvider<FastifyZodOpenApiTypeProvider>();

  // Use the zod-aware validator/serializer provided by fastify-zod-openapi.
  app.setValidatorCompiler(validatorCompiler);
  app.setSerializerCompiler(serializerCompiler);

  // Register all API schemas as components so fastify-zod-openapi can create $ref links
  const components = {
    schemas: {
      // Region support
      BrowserbaseRegion: Api.BrowserbaseRegionSchema,
      // Shared components
      LocalBrowserLaunchOptions: Api.LocalBrowserLaunchOptionsSchema,
      ModelConfigObject: Api.ModelConfigObjectSchema,
      ModelConfig: Api.ModelConfigSchema,
      Action: Api.ActionSchema,
      SessionIdParams: Api.SessionIdParamsSchema,
      BrowserConfig: Api.BrowserConfigSchema,
      SessionHeaders: Api.SessionHeadersSchema,
      ErrorResponse: Api.ErrorResponseSchema,
      // Browserbase schemas
      BrowserbaseViewport: Api.BrowserbaseViewportSchema,
      BrowserbaseFingerprintScreen: Api.BrowserbaseFingerprintScreenSchema,
      BrowserbaseFingerprint: Api.BrowserbaseFingerprintSchema,
      BrowserbaseContext: Api.BrowserbaseContextSchema,
      BrowserbaseBrowserSettings: Api.BrowserbaseBrowserSettingsSchema,
      BrowserbaseProxyGeolocation: Api.BrowserbaseProxyGeolocationSchema,
      BrowserbaseProxyConfig: Api.BrowserbaseProxyConfigSchema,
      ExternalProxyConfig: Api.ExternalProxyConfigSchema,
      ProxyConfig: Api.ProxyConfigSchema,
      BrowserbaseSessionCreateParams: Api.BrowserbaseSessionCreateParamsSchema,
      // Session Start
      SessionStartRequest: Api.SessionStartRequestSchema,
      SessionStartResult: Api.SessionStartResultSchema,
      SessionStartResponse: Api.SessionStartResponseSchema,
      // Session End
      SessionEndResult: Api.SessionEndResultSchema,
      SessionEndResponse: Api.SessionEndResponseSchema,
      // Act
      ActOptions: Api.ActOptionsSchema,
      ActRequest: Api.ActRequestSchema,
      ActResultData: Api.ActResultDataSchema,
      ActResult: Api.ActResultSchema,
      ActResponse: Api.ActResponseSchema,
      // Extract
      ExtractOptions: Api.ExtractOptionsSchema,
      ExtractRequest: Api.ExtractRequestSchema,
      ExtractResult: Api.ExtractResultSchema,
      ExtractResponse: Api.ExtractResponseSchema,
      // Observe
      ObserveOptions: Api.ObserveOptionsSchema,
      ObserveRequest: Api.ObserveRequestSchema,
      ObserveResult: Api.ObserveResultSchema,
      ObserveResponse: Api.ObserveResponseSchema,
      // Agent Execute
      AgentConfig: Api.AgentConfigSchema,
      AgentAction: Api.AgentActionSchema,
      AgentUsage: Api.AgentUsageSchema,
      AgentResultData: Api.AgentResultDataSchema,
      AgentExecuteOptions: Api.AgentExecuteOptionsSchema,
      AgentExecuteRequest: Api.AgentExecuteRequestSchema,
      AgentExecuteResult: Api.AgentExecuteResultSchema,
      AgentExecuteResponse: Api.AgentExecuteResponseSchema,
      // Navigate
      NavigateOptions: Api.NavigateOptionsSchema,
      NavigateRequest: Api.NavigateRequestSchema,
      NavigateResult: Api.NavigateResultSchema,
      NavigateResponse: Api.NavigateResponseSchema,
      // Replay
      TokenUsage: Api.TokenUsageSchema,
      ReplayAction: Api.ReplayActionSchema,
      ReplayPage: Api.ReplayPageSchema,
      ReplayResult: Api.ReplayResultSchema,
      ReplayResponse: Api.ReplayResponseSchema,
      // SSE Stream Events
      StreamEventStatus: Api.StreamEventStatusSchema,
      StreamEventType: Api.StreamEventTypeSchema,
      StreamEventSystemData: Api.StreamEventSystemDataSchema,
      StreamEventLogData: Api.StreamEventLogDataSchema,
      StreamEvent: Api.StreamEventSchema,
    },
  };

  await app.register(fastifyZodOpenApiPlugin, { components });

  // Document-level metadata; the transformers spread at the end are supplied by
  // fastify-zod-openapi.
  await app.register(fastifySwagger, {
    openapi: {
      info: {
        title: "Stagehand API",
        version: "3.1.0",
        description: `Stagehand SDK for AI browser automation [ALPHA]. This API allows clients to
execute browser automation tasks remotely on the Browserbase cloud.
All endpoints except /sessions/start require an active session ID.
Responses are streamed using Server-Sent Events (SSE) when the
\`x-stream-response: true\` header is provided.

This SDK is currently ALPHA software and is not production ready!
Please try it and give us your feedback, stay tuned for upcoming release announcements!`,
        contact: {
          name: "Browserbase",
          url: "https://browserbase.com",
        },
      },
      openapi: "3.1.0",
      servers: [
        {
          url: "https://api.stagehand.browserbase.com",
        },
      ],
      components: {
        securitySchemes: Api.openApiSecuritySchemes,
        links: Api.openApiLinks,
      },
      security: [
        { BrowserbaseApiKey: [], BrowserbaseProjectId: [], ModelApiKey: [] },
      ],
    },
    ...fastifyZodOpenApiTransformers,
  });

  // Session routes are mounted under the /v1 prefix; health/readiness routes below
  // are registered on the root instance without a prefix.
  await app.register(
    (instance, _opts, done) => {
      instance.route(actRoute);
      instance.route(endRoute);
      instance.route(extractRoute);
      instance.route(navigateRoute);
      instance.route(observeRoute);
      instance.route(replayRoute);
      instance.route(startRoute);
      instance.route(agentExecuteRoute);
      done();
    },
    { prefix: "/v1" },
  );

  app.route(healthcheckRoute);
  app.route(readinessRoute);

  // All plugins and routes must be loaded before the spec can be produced.
  await app.ready();

  const yaml = app.swagger({ yaml: true });
  // Mintlify expects OpenAPI version fields to be strings, so quote them here.
  // Both patterns lack the `g` flag, so only the first match is rewritten: the
  // top-level `openapi:` line, and the first `version:` line indented by exactly two
  // spaces. Values that already start with a quote are left untouched.
  const fixedYaml = yaml
    .replace(/^openapi:\s*(?!['"])([^#\s]+)\s*$/m, 'openapi: "$1"')
    .replace(/^ {2}version:\s*(?!['"])([^#\s]+)\s*$/m, '  version: "$1"');

  await writeFile(OUTPUT_PATH, fixedYaml, "utf8");

  await app.close();
  console.log(`OpenAPI spec written to ${OUTPUT_PATH}`);
}

// Any failure while generating the spec is logged in full and reported through a
// non-zero exit code.
main().catch((error) => {
  console.error(error);
  process.exit(1);
});


================================================
FILE: packages/server-v3/scripts/runtimePaths.ts
================================================
/**
 * Keep this file in sync with:
 * - /packages/core/lib/v3/runtimePaths.ts
 * - /packages/server-v3/scripts/runtimePaths.ts
 * - /packages/evals/runtimePaths.ts
 * - /packages/docs/scripts/runtimePaths.js
 */
import path from "node:path";
import { fileURLToPath } from "node:url";
import { createRequire } from "node:module";

// Path fragment identifying files that belong to this package. Caller resolution
// prefers stack frames whose normalized path contains it, and repo-root detection
// slices the path at its last occurrence.
const PACKAGE_SEGMENT = "/packages/server-v3/";
// File names treated as "no real file" when reading a stack frame.
const EVAL_FRAMES = new Set(["[eval]", "[eval]-wrapper"]);
// Names of this module's own functions. Frames carrying one of these names are
// skipped so that the resolved "caller" is the code that invoked this module,
// not the module itself. Any helper that ends up on the stack during resolution
// must be listed here.
const INTERNAL_FRAME_NAMES = new Set([
  "readCallsites",
  "readCallsitePath",
  "resolveCallerFilePath",
  "getCurrentFilePath",
  "getCurrentDirPath",
  "getRepoRootDir",
  "getPackageRootDir",
  "createRequireFromCaller",
  "isMainModule",
]);

/**
 * Converts a filesystem path or `file://` URL into an absolute path that uses
 * forward slashes only.
 */
const normalizePath = (value: string): string => {
  let fsPath = value;
  if (value.startsWith("file://")) {
    fsPath = fileURLToPath(value);
  }
  const absolute = path.resolve(fsPath);
  // Equivalent to replacing every backslash with a forward slash.
  return absolute.split("\\").join("/");
};

/**
 * Captures the current call stack as structured CallSite objects.
 *
 * Temporarily swaps `Error.prepareStackTrace` for a hook that returns the raw
 * frame array, reads `.stack` from a fresh Error, and always restores the
 * previous hook. Returns an empty array if no stack is available.
 */
const readCallsites = (): NodeJS.CallSite[] => {
  const originalPrepare = Error.prepareStackTrace;
  Error.prepareStackTrace = (_error, frames) => frames;
  try {
    const captured = new Error().stack as unknown as
      | NodeJS.CallSite[]
      | undefined;
    return captured ?? [];
  } finally {
    Error.prepareStackTrace = originalPrepare;
  }
};

// Some frames expose their location only through this optional accessor.
type CallSiteWithScriptName = NodeJS.CallSite & {
  getScriptNameOrSourceURL?: () => string | null;
};

/**
 * Returns the normalized file path of a stack frame, or null when the frame has
 * no usable location (missing name, `node:` built-in, or an eval frame).
 */
const readCallsitePath = (callsite: NodeJS.CallSite): string | null => {
  const location =
    callsite.getFileName() ??
    (callsite as CallSiteWithScriptName).getScriptNameOrSourceURL?.();
  if (!location) return null;

  const isNodeBuiltin = location.startsWith("node:");
  if (isNodeBuiltin || EVAL_FRAMES.has(location)) return null;

  return normalizePath(location);
};

/**
 * Tells whether a stack frame belongs to one of this module's own helpers,
 * judged by its function name, its method name, or its rendered text.
 */
const isInternalCallsite = (callsite: NodeJS.CallSite): boolean => {
  const isInternalName = (name: string | null | undefined): boolean =>
    name != null && INTERNAL_FRAME_NAMES.has(name);

  if (isInternalName(callsite.getFunctionName())) return true;
  if (isInternalName(callsite.getMethodName())) return true;

  // Fall back to the rendered frame text. Looking for "<name> (" also covers the
  // ".<name> (" form, since the latter always contains the former.
  const rendered = callsite.toString();
  return [...INTERNAL_FRAME_NAMES].some((frameName) =>
    rendered.includes(`${frameName} (`),
  );
};

/**
 * Finds the file that called into this module.
 *
 * Walks the stack from the innermost frame outwards, ignoring frames without a
 * usable path and frames belonging to this module's helpers. The first frame
 * located under PACKAGE_SEGMENT wins; if there is none, the first remaining
 * frame is used.
 *
 * @throws Error when no candidate frame exists.
 */
const resolveCallerFilePath = (): string => {
  let firstOutsidePackage: string | undefined;

  for (const callsite of readCallsites()) {
    const filePath = readCallsitePath(callsite);
    if (!filePath || isInternalCallsite(callsite)) continue;

    // The earliest in-package frame is the answer; no need to look further.
    if (filePath.includes(PACKAGE_SEGMENT)) return filePath;

    firstOutsidePackage ??= filePath;
  }

  if (firstOutsidePackage) return firstOutsidePackage;

  throw new Error("Unable to resolve caller file path.");
};

/**
 * Returns the normalized absolute path of the file that called this function,
 * as determined from the call stack by resolveCallerFilePath().
 * The function's name is listed in INTERNAL_FRAME_NAMES, so its own frame is skipped.
 */
export const getCurrentFilePath = (): string => resolveCallerFilePath();

/** Returns the directory containing the calling file (dirname of getCurrentFilePath()). */
export const getCurrentDirPath = (): string =>
  path.dirname(getCurrentFilePath());

/**
 * Returns the repository root: everything in the caller's path that precedes the
 * last occurrence of PACKAGE_SEGMENT.
 *
 * @throws Error when the caller's path does not contain PACKAGE_SEGMENT.
 */
export const getRepoRootDir = (): string => {
  const callerPath = getCurrentFilePath();
  const segmentStart = callerPath.lastIndexOf(PACKAGE_SEGMENT);
  if (segmentStart >= 0) {
    return callerPath.slice(0, segmentStart);
  }
  throw new Error(
    `Unable to determine repo root from ${callerPath} (missing ${PACKAGE_SEGMENT}).`,
  );
};

/**
 * Returns the package root: the repo root followed by PACKAGE_SEGMENT with its
 * trailing slash removed.
 */
export const getPackageRootDir = (): string =>
  `${getRepoRootDir()}${PACKAGE_SEGMENT.slice(0, -1)}`;

/** Builds a `require` function whose resolution base is the calling file. */
export const createRequireFromCaller = () =>
  createRequire(getCurrentFilePath());

/**
 * Reports whether the calling file is the script Node was started with, by
 * comparing the normalized `process.argv[1]` with the caller's path.
 * Returns false when there is no entry script.
 */
export const isMainModule = (): boolean => {
  const [, entryScript] = process.argv;
  if (!entryScript) return false;

  const entryPath = normalizePath(entryScript);
  const callerPath = getCurrentFilePath();
  return entryPath === callerPath;
};


================================================
FILE: packages/server-v3/scripts/test-server.ts
================================================
/**
 * Server unit + integration tests on dist/esm + SEA/local server targets.
 *
 * Prereqs:
 * - pnpm run build (packages/server-v3/dist/tests + packages/server-v3/dist/server.js).
 * - SEA integration still requires build:sea when STAGEHAND_SERVER_TARGET=sea.
 *
 * Args: [test paths...] -- [node --test args...] | --list (prints JSON matrix)
 * Env: STAGEHAND_SERVER_TARGET=sea|local|remote, STAGEHAND_BASE_URL, SEA_BINARY_NAME,
 *      NODE_TEST_CONSOLE_REPORTER, NODE_TEST_REPORTER, NODE_TEST_REPORTER_DESTINATION,
 *      NODE_V8_COVERAGE; writes CTRF to ctrf/node-test-*.xml by default.
 * Example: STAGEHAND_SERVER_TARGET=sea pnpm run test:server -- packages/server-v3/dist/tests/integration/v3/start.test.js
 */
import fs from "node:fs";
import path from "node:path";
import { spawn, spawnSync } from "node:child_process";
import { getRepoRootDir } from "./runtimePaths.js";

/** Creates the directory that will contain `filePath`, including missing ancestors. */
const ensureParentDir = (filePath: string) => {
  const parentDir = path.dirname(filePath);
  fs.mkdirSync(parentDir, { recursive: true });
};

/**
 * Splits CLI arguments into test paths and extra `node --test` arguments.
 *
 * Layout understood: `[--] [leading flags...] [--] [paths...] [-- extra...]`.
 * A leading flag without `=` also consumes the following token as its value,
 * unless that token is empty or itself starts with `-`. Leading flags and
 * everything after the final separator are returned together as `extra`.
 */
const splitArgs = (args: string[]) => {
  const isSeparator = (token: string | undefined) => token === "--";

  let cursor = 0;
  while (isSeparator(args[cursor])) cursor += 1;

  const leadingExtra: string[] = [];
  while (cursor < args.length && args[cursor].startsWith("-")) {
    const flag = args[cursor];
    cursor += 1;
    // A bare separator ends the leading-flag section (and is consumed).
    if (isSeparator(flag)) break;
    leadingExtra.push(flag);

    const candidate = args[cursor];
    const takesValue =
      !flag.includes("=") &&
      candidate !== undefined &&
      candidate !== "" &&
      !candidate.startsWith("-");
    if (takesValue) {
      leadingExtra.push(candidate);
      cursor += 1;
    }
  }

  while (isSeparator(args[cursor])) cursor += 1;

  const remaining = args.slice(cursor);
  const separatorAt = remaining.indexOf("--");
  if (separatorAt === -1) {
    return { paths: remaining, extra: [...leadingExtra] };
  }
  return {
    paths: remaining.slice(0, separatorAt),
    extra: [...leadingExtra, ...remaining.slice(separatorAt + 1)],
  };
};

// Makes a test name usable as a single path/identifier component by turning
// every forward slash or backslash into a hyphen.
const toSafeName = (name: string) => name.split(/[\\/]/).join("-");

/**
 * Lists every regular file under `dir` (searched recursively) whose name ends
 * with `suffix`. Paths are built as `<parent>/<name>` and returned sorted.
 * A missing `dir` yields an empty list.
 */
const collectFiles = (dir: string, suffix: string) => {
  const matches: string[] = [];
  if (!fs.existsSync(dir)) return matches;

  // Explicit work list instead of recursion; the final sort makes visit order irrelevant.
  const pending: string[] = [dir];
  for (
    let current = pending.pop();
    current !== undefined;
    current = pending.pop()
  ) {
    const entries = fs.readdirSync(current, { withFileTypes: true });
    for (const entry of entries) {
      const entryPath = `${current}/${entry.name}`;
      if (entry.isDirectory()) {
        pending.push(entryPath);
      } else if (entry.isFile() && entry.name.endsWith(suffix)) {
        matches.push(entryPath);
      }
    }
  }

  return matches.sort();
};

// Repository root, derived from this script's own location via getRepoRootDir().
// Every path below is built from it.
const repoRoot = getRepoRootDir();

/**
 * Converts a JUnit XML report into a CTRF JSON report placed next to it.
 *
 * Does nothing when the JUnit file is missing or empty. The output name swaps a
 * trailing `.xml` for `.json` (or appends `.json` when there is no such suffix).
 * A failed conversion only produces a warning.
 *
 * @param junitPath Path to the JUnit XML file.
 * @param tool Tool name passed to `junit-to-ctrf -t`.
 */
const writeCtrfFromJunit = (junitPath: string, tool: string) => {
  const hasReport =
    fs.existsSync(junitPath) && fs.statSync(junitPath).size > 0;
  if (!hasReport) return;

  const xmlSuffix = /\.xml$/i;
  const ctrfPath = xmlSuffix.test(junitPath)
    ? junitPath.replace(xmlSuffix, ".json")
    : `${junitPath}.json`;

  const converterArgs = [
    "exec",
    "junit-to-ctrf",
    junitPath,
    "-o",
    ctrfPath,
    "-t",
    tool,
  ];
  const { status: exitStatus } = spawnSync("pnpm", converterArgs, {
    stdio: "inherit",
    cwd: repoRoot,
  });
  if (exitStatus !== 0) {
    console.warn(`CTRF conversion failed for ${junitPath}.`);
  }
};

// TypeScript test sources (scanned by --list to build the test matrix).
const sourceTestsDir = `${repoRoot}/packages/server-v3/test`;
const sourceUnitDir = `${sourceTestsDir}/unit`;
const sourceIntegrationDir = `${sourceTestsDir}/integration`;
// Compiled test output (what actually gets executed by `node --test`).
const unitDir = `${repoRoot}/packages/server-v3/dist/tests/unit`;
const integrationDir = `${repoRoot}/packages/server-v3/dist/tests/integration`;
const allTestsDir = `${repoRoot}/packages/server-v3/dist/tests`;

// Absolute paths are returned untouched; anything else is resolved against the repo root.
const resolveRepoRelative = (value: string) => {
  if (path.isAbsolute(value)) return value;
  return path.resolve(repoRoot, value);
};

/**
 * Removes `--test-reporter` / `--test-reporter-destination` options from an
 * argument list, in both `--flag value` and `--flag=value` forms.
 *
 * @returns `filtered` (the remaining arguments, order preserved) and `removed`
 *          (true when at least one reporter option was dropped).
 */
const stripNodeReporterArgs = (argsList: string[]) => {
  const reporterFlags = ["--test-reporter", "--test-reporter-destination"];
  const filtered: string[] = [];
  let removed = false;

  let index = 0;
  while (index < argsList.length) {
    const current = argsList[index];
    index += 1;

    const isBareFlag = reporterFlags.includes(current);
    const isInlineFlag = reporterFlags.some((flag) =>
      current.startsWith(`${flag}=`),
    );
    if (!isBareFlag && !isInlineFlag) {
      filtered.push(current);
      continue;
    }

    removed = true;
    // The bare form carries its value in the next token; drop that as well.
    if (isBareFlag && argsList[index]) {
      index += 1;
    }
  }

  return { filtered, removed };
};

/**
 * Derives a short test name from a compiled test path: the path relative to
 * `root` (forward slashes) when the file lives under `root`, otherwise just the
 * file name. In both cases a trailing `.test.js` is removed.
 */
const toTestName = (testPath: string, root: string) => {
  const testSuffix = /\.test\.js$/i;
  const absolutePath = resolveRepoRelative(testPath);
  const relativeToRoot = path
    .relative(root, absolutePath)
    .split("\\")
    .join("/");
  const label = relativeToRoot.startsWith("..")
    ? path.basename(absolutePath)
    : relativeToRoot;
  return label.replace(testSuffix, "");
};

// Arguments after the script name. `--list` switches to matrix-listing mode.
const rawArgs = process.argv.slice(2);
const listRequested = rawArgs.includes("--list");

// --list: print a JSON array describing every test found in the SOURCE tree
// (`*.test.ts`), each mapped to the path of its compiled `*.test.js` counterpart,
// then exit without running anything.
if (listRequested) {
  // Unit tests are named by file basename only.
  const unitTests = collectFiles(sourceUnitDir, ".test.ts").map((file) => {
    const relSource = path.relative(sourceTestsDir, file).replaceAll("\\", "/");
    const distPath = `${repoRoot}/packages/server-v3/dist/tests/${relSource.replace(/\.test\.ts$/, ".test.js")}`;
    const name = path.basename(file, ".test.ts");
    return {
      path: path.relative(repoRoot, distPath).replaceAll("\\", "/"),
      name,
      safe_name: toSafeName(name),
    };
  });
  // Integration tests are named by their path relative to the integration
  // directory, so files in different subdirectories keep distinct names.
  const integrationTests = collectFiles(sourceIntegrationDir, ".test.ts").map(
    (file) => {
      const relSource = path
        .relative(sourceTestsDir, file)
        .replaceAll("\\", "/");
      const distPath = `${repoRoot}/packages/server-v3/dist/tests/${relSource.replace(/\.test\.ts$/, ".test.js")}`;
      const rel = path
        .relative(sourceIntegrationDir, file)
        .replaceAll("\\", "/")
        .replace(/\.test\.ts$/, "");
      return {
        path: path.relative(repoRoot, distPath).replaceAll("\\", "/"),
        name: rel,
        safe_name: toSafeName(rel),
      };
    },
  );
  console.log(JSON.stringify([...unitTests, ...integrationTests]));
  process.exit(0);
}

// Separate test paths from extra `node --test` flags, then drop any reporter
// flags the user passed: this script always supplies its own reporters.
const { paths, extra } = splitArgs(rawArgs);
const { filtered: extraArgs, removed: removedReporterOverride } =
  stripNodeReporterArgs(extra);
if (removedReporterOverride) {
  console.warn(
    "Ignoring node --test reporter overrides to preserve console + JUnit output.",
  );
}

// Tests run from compiled output only; bail out early if it has not been built.
if (!fs.existsSync(allTestsDir)) {
  console.error(
    "Missing packages/server-v3/dist/tests. Run pnpm run build first.",
  );
  process.exit(1);
}

// Which server the integration tests talk to; defaults to "sea" when unset.
// startServer() treats "remote" and "local" specially and anything else as SEA.
const serverTarget = (
  process.env.STAGEHAND_SERVER_TARGET ?? "sea"
).toLowerCase();
const explicitBaseUrl = process.env.STAGEHAND_BASE_URL;
const baseUrl = explicitBaseUrl ?? "http://stagehand-api.localhost:3106"; // different than server-v4 to avoid clash

// A remote target has no sensible default URL.
if (serverTarget === "remote" && !explicitBaseUrl) {
  console.error("Missing STAGEHAND_BASE_URL for remote server target.");
  process.exit(1);
}

// A local target runs the compiled server entry point, which must exist.
if (
  serverTarget === "local" &&
  !fs.existsSync(`${repoRoot}/packages/server-v3/dist/server.js`)
) {
  console.error(
    "Missing packages/server-v3/dist/server.js. Run pnpm run build first.",
  );
  process.exit(1);
}

// Derive the port from the base URL, falling back to the scheme's default port
// when the URL does not name one.
const parsedBaseUrl = new URL(baseUrl);
const port =
  parsedBaseUrl.port || (parsedBaseUrl.protocol === "https:" ? "443" : "80");

// These are written to this process's environment and are therefore inherited by
// the spawned server and test processes (both spread `process.env`).
process.env.PORT = port;
process.env.STAGEHAND_API_URL = baseUrl;
process.env.BB_ENV = process.env.BB_ENV ?? "local";

// Append source-map support to whatever NODE_OPTIONS the caller already set.
const baseNodeOptions = "--enable-source-maps";
const nodeOptions = [process.env.NODE_OPTIONS, baseNodeOptions]
  .filter(Boolean)
  .join(" ");

// Tests to run: the paths given on the command line (resolved against the repo
// root), or every compiled unit + integration test when none were given.
const allPaths =
  paths.length > 0
    ? paths.map(resolveRepoRelative)
    : [
        ...collectFiles(unitDir, ".test.js"),
        ...collectFiles(integrationDir, ".test.js"),
      ];

// Classify by location. A path that lies under neither directory ends up in
// neither list and is therefore not executed.
const unitPaths = allPaths.filter((p) =>
  p.replaceAll("\\", "/").includes("/packages/server-v3/dist/tests/unit/"),
);
const integrationPaths = allPaths.filter((p) =>
  p
    .replaceAll("\\", "/")
    .includes("/packages/server-v3/dist/tests/integration/"),
);

// When exactly one test file is selected, coverage goes to a directory named
// after that test; otherwise a shared "server" directory is used.
// NOTE(review): unlike the filters above, these startsWith checks do not normalize
// backslashes, so on Windows they may not match and fall through to "server" — confirm.
const singlePath = allPaths.length === 1 ? allPaths[0] : null;
const coverageSuffix =
  singlePath &&
  singlePath.startsWith(`${repoRoot}/packages/server-v3/dist/tests/unit/`)
    ? `server-unit/${path.basename(singlePath).replace(/\.test\.js$/, "")}`
    : singlePath &&
        singlePath.startsWith(
          `${repoRoot}/packages/server-v3/dist/tests/integration/`,
        )
      ? `server-integration/${path
          .relative(integrationDir, singlePath)
          .replace(/\.test\.js$/, "")
          .replaceAll("\\", "/")}`
      : "server";

// NODE_V8_COVERAGE, when set, overrides the coverage root. Test processes and
// the server process write to separate subdirectories.
const coverageRoot = resolveRepoRelative(
  process.env.NODE_V8_COVERAGE ?? `${repoRoot}/coverage/${coverageSuffix}`,
);
const testsCoverage = `${coverageRoot}/tests`;
const serverCoverage = `${coverageRoot}/server`;
fs.mkdirSync(testsCoverage, { recursive: true });
fs.mkdirSync(serverCoverage, { recursive: true });

// Reporter configuration: one reporter for the console and one written to a file
// (see reporterArgsFor). An explicit destination from the environment applies to
// every run.
const consoleReporter = process.env.NODE_TEST_CONSOLE_REPORTER ?? "spec";
const defaultReporter = process.env.NODE_TEST_REPORTER ?? "junit";
const envDestination = process.env.NODE_TEST_REPORTER_DESTINATION
  ? resolveRepoRelative(process.env.NODE_TEST_REPORTER_DESTINATION)
  : null;

/**
 * Builds the `node --test` reporter flags for one run and makes sure the report
 * file's directory exists.
 *
 * The file destination is the environment override when present; otherwise
 * `<repo>/ctrf/server-unit|server-integration/<testName>.xml`, or `all.xml` when
 * no test name is given.
 *
 * @returns `args` (two reporter/destination pairs: console to stdout, file
 *          reporter to `destination`) and the resolved `destination`.
 */
const reporterArgsFor = (kind: "unit" | "integration", testName?: string) => {
  const suiteDir = kind === "unit" ? "server-unit" : "server-integration";
  const reportFile = testName ? `${testName}.xml` : "all.xml";
  const destination =
    envDestination ?? `${repoRoot}/ctrf/${suiteDir}/${reportFile}`;
  ensureParentDir(destination);

  const args = [
    `--test-reporter=${consoleReporter}`,
    `--test-reporter=${defaultReporter}`,
    "--test-reporter-destination=stdout",
    `--test-reporter-destination=${destination}`,
  ];
  return { args, destination };
};

/**
 * Runs `node --test` synchronously on the given files with the current Node
 * binary, inheriting stdio. Extra CLI flags come first, then the reporter flags,
 * then the files. Coverage for the test process goes to the tests coverage dir.
 */
const runNodeTests = (files: string[], reporterArgs: string[]) => {
  const nodeArgs = ["--test", ...extraArgs, ...reporterArgs, ...files];
  const childEnv = {
    ...process.env,
    NODE_OPTIONS: nodeOptions,
    NODE_V8_COVERAGE: testsCoverage,
  };
  return spawnSync(process.execPath, nodeArgs, {
    stdio: "inherit",
    env: childEnv,
  });
};

/**
 * Polls `url` until it answers with a successful (2xx) status.
 *
 * Each attempt is aborted after 2 seconds, and attempts are spaced 1 second
 * apart. Network errors and non-OK responses are treated as "not ready yet".
 *
 * @param url Endpoint to probe.
 * @param timeoutMs Overall budget; no new attempt starts once it has elapsed.
 * @returns true as soon as one attempt succeeds, false when the budget runs out.
 */
const waitForServer = async (url: string, timeoutMs = 30_000) => {
  const start = Date.now();
  while (Date.now() - start < timeoutMs) {
    const controller = new AbortController();
    const timer = setTimeout(() => controller.abort(), 2_000);
    try {
      const res = await fetch(url, { signal: controller.signal });
      if (res.ok) return true;
    } catch {
      // retry
    } finally {
      // Always release the abort timer, including when fetch rejects (e.g.
      // connection refused), so failed attempts do not leave timers pending.
      clearTimeout(timer);
    }
    await new Promise((resolve) => setTimeout(resolve, 1_000));
  }
  return false;
};

/**
 * Starts the server the integration tests will talk to.
 *
 * - "remote": nothing is started; resolves to null.
 * - "local": runs the compiled `dist/server.js` with the current Node binary.
 * - anything else: runs the SEA binary from `dist/sea` (name from
 *   SEA_BINARY_NAME or a platform/arch default). Exits the process with code 1
 *   when the binary is missing.
 *
 * The spawned process inherits stdio and writes coverage to the server
 * coverage directory.
 */
const startServer = async () => {
  if (serverTarget === "remote") return null;

  if (serverTarget === "local") {
    const localEnv = {
      ...process.env,
      NODE_ENV: "development",
      NODE_OPTIONS: nodeOptions,
      NODE_V8_COVERAGE: serverCoverage,
    };
    const serverEntry = `${repoRoot}/packages/server-v3/dist/server.js`;
    return spawn(process.execPath, [serverEntry], {
      stdio: "inherit",
      env: localEnv,
    });
  }

  const exeSuffix = process.platform === "win32" ? ".exe" : "";
  const defaultName = `stagehand-server-v3-${process.platform}-${process.arch}${exeSuffix}`;
  const binaryName = process.env.SEA_BINARY_NAME ?? defaultName;
  const seaBinary = `${repoRoot}/packages/server-v3/dist/sea/${binaryName}`;

  if (!fs.existsSync(seaBinary)) {
    console.error(`SEA binary not found at ${seaBinary}`);
    process.exit(1);
  }

  const seaCacheDir =
    process.env.STAGEHAND_SEA_CACHE_DIR ?? `${repoRoot}/.stagehand-sea`;
  const seaEnv = {
    ...process.env,
    NODE_ENV: "production",
    NODE_V8_COVERAGE: serverCoverage,
    STAGEHAND_SEA_CACHE_DIR: seaCacheDir,
  };
  return spawn(seaBinary, ["--node-options=--no-lazy --enable-source-maps"], {
    stdio: "inherit",
    env: seaEnv,
  });
};

// ---------------------------------------------------------------------------
// Orchestration: run unit tests, then (only if they passed) start the server and
// run integration tests, then shut the server down and exit with the final status.
// ---------------------------------------------------------------------------
let serverProc: ReturnType<typeof spawn> | null = null;
let status = 0;

if (unitPaths.length > 0) {
  // A single selected file gets its own report name; multiple files share "all".
  const unitName =
    unitPaths.length === 1 ? toTestName(unitPaths[0], unitDir) : undefined;
  const reporter = reporterArgsFor("unit", unitName);
  const result = runNodeTests(unitPaths, reporter.args);
  // A null status means the test process was killed by a signal; count it as failure.
  status = result.status ?? 1;
  writeCtrfFromJunit(reporter.destination, "node-test");
}

if (status === 0 && integrationPaths.length > 0) {
  serverProc = await startServer();
  const ready = await waitForServer(`${process.env.STAGEHAND_API_URL}/healthz`);
  if (!ready) {
    console.error("Server failed to start within 30 seconds.");
    status = 1;
  } else {
    const integrationName =
      integrationPaths.length === 1
        ? toTestName(integrationPaths[0], integrationDir)
        : undefined;
    const reporter = reporterArgsFor("integration", integrationName);
    const result = runNodeTests(integrationPaths, reporter.args);
    status = result.status ?? 1;
    writeCtrfFromJunit(reporter.destination, "node-test");
  }
}

if (serverProc) {
  const proc = serverProc;
  proc.kill("SIGTERM");
  // Wait (at most 10 s) for the server to exit.
  await new Promise<void>((resolve) => {
    // A child that already terminated will never emit "exit" again. exitCode
    // stays null when the child was ended by a signal, so signalCode must be
    // checked too; otherwise an already-dead server costs the full 10 s timeout.
    if (proc.exitCode !== null || proc.signalCode !== null) return resolve();
    const timer = setTimeout(resolve, 10_000);
    proc.once("exit", () => {
      clearTimeout(timer);
      resolve();
    });
  });
  // Fixed grace period after shutdown — presumably to let coverage output
  // finish flushing; TODO confirm.
  await new Promise((resolve) => setTimeout(resolve, 5_000));
}

process.exit(status);


================================================
FILE: packages/server-v3/src/lib/InMemorySessionStore.ts
================================================
import { randomUUID } from "crypto";
import type { V3Options, LogLine } from "@browserbasehq/stagehand";
import { V3 } from "@browserbasehq/stagehand";
import type {
  SessionStore,
  CreateSessionParams,
  RequestContext,
  SessionCacheConfig,
  SessionStartResult,
} from "./SessionStore.js";

const DEFAULT_MAX_CAPACITY = 100;
const DEFAULT_TTL_MS = 0; // 0 = infinite (no TTL-based eviction)

/**
 * Internal node for LRU linked list
 */
interface LruNode {
  sessionId: string;
  params: CreateSessionParams;
  /** Initialized V3 instance, or null until first use (lazy). */
  stagehand: V3 | null;
  /** In-flight lazy initialization, shared by concurrent callers; null otherwise. */
  initPromise: Promise<V3> | null;
  /** Mutable holder so the logger can be swapped per request. */
  loggerRef: { current?: (message: LogLine) => void };
  /** Epoch milliseconds after which the session is expired (Infinity = never). */
  expiry: number;
  prev: LruNode | null;
  next: LruNode | null;
}

/**
 * In-memory implementation of SessionStore with full caching support.
 *
 * Features:
 * - LRU eviction when at capacity
 * - TTL-based expiration
 * - Lazy V3 instance creation
 * - Dynamic logger updates for streaming
 * - Automatic cleanup of evicted sessions
 *
 * Sessions live in a Map (lookup by id) and in a doubly linked list ordered from
 * least recently used (`first`) to most recently used (`last`).
 *
 * This is the default implementation used when no custom store is provided.
 * For stateless pod architectures, use a database-backed implementation.
 */
export class InMemorySessionStore implements SessionStore {
  private first: LruNode | null = null;
  private last: LruNode | null = null;
  private items: Map<string, LruNode> = new Map();
  private maxCapacity: number;
  private ttlMs: number;
  private cleanupInterval: NodeJS.Timeout | null = null;

  /**
   * @param config Optional limits. `maxCapacity` defaults to 100 (a value of 0
   *               disables capacity-based eviction); `ttlMs` defaults to 0,
   *               which disables TTL-based expiry.
   */
  constructor(config?: SessionCacheConfig) {
    this.maxCapacity = config?.maxCapacity ?? DEFAULT_MAX_CAPACITY;
    this.ttlMs = config?.ttlMs ?? DEFAULT_TTL_MS;
    this.startCleanupInterval();
  }

  /**
   * Start periodic cleanup of expired sessions
   */
  private startCleanupInterval(): void {
    // Run cleanup every minute
    this.cleanupInterval = setInterval(() => {
      // Never leave the returned promise floating: a rejection inside a timer
      // callback would otherwise surface as an unhandled rejection.
      this.cleanupExpired().catch(console.error);
    }, 60_000);
    // Allow process to exit gracefully even if this timer is still active
    this.cleanupInterval.unref();
  }

  /**
   * Cleanup expired sessions
   */
  private async cleanupExpired(): Promise<void> {
    const now = Date.now();
    const expiredIds: string[] = [];

    // Collect first, delete afterwards, so the map is not mutated mid-iteration.
    for (const [sessionId, node] of this.items.entries()) {
      if (this.ttlMs > 0 && node.expiry <= now) {
        expiredIds.push(sessionId);
      }
    }

    for (const sessionId of expiredIds) {
      await this.deleteSession(sessionId);
    }
  }

  /**
   * Bump a node to the end of the LRU list (most recently used)
   * and refresh its expiry.
   */
  private bumpNode(node: LruNode): void {
    // Update expiry
    node.expiry = this.ttlMs > 0 ? Date.now() + this.ttlMs : Infinity;

    if (this.last === node) {
      return; // Already most recent
    }

    const { prev, next } = node;

    // Unlink from current position
    if (prev) prev.next = next;
    if (next) next.prev = prev;
    if (this.first === node) this.first = next;

    // Link to end
    node.prev = this.last;
    node.next = null;
    if (this.last) this.last.next = node;
    this.last = node;

    if (!this.first) this.first = node;
  }

  /**
   * Remove a node from the linked list and clear its links so that a stale
   * reference can never be used to re-link neighbours later.
   */
  private detachNode(node: LruNode): void {
    const { prev, next } = node;
    if (prev) prev.next = next;
    if (next) next.prev = prev;
    if (this.first === node) this.first = next;
    if (this.last === node) this.last = prev;
    node.prev = null;
    node.next = null;
  }

  /**
   * Evict the least recently used session
   */
  private async evictLru(): Promise<void> {
    const lruNode = this.first;
    if (!lruNode) return;

    await this.deleteSession(lruNode.sessionId);
  }

  /**
   * Registers a new session and returns its id.
   * The id is the provided Browserbase session id when present, otherwise a
   * fresh UUID. `cdpUrl` echoes `params.connectUrl` (empty string when absent).
   *
   * @throws Error if a session with the resulting id already exists.
   */
  async startSession(params: CreateSessionParams): Promise<SessionStartResult> {
    // Generate session ID or use provided browserbase session ID
    const sessionId = params.browserbaseSessionID ?? randomUUID();

    // Store the session
    await this.createSession(sessionId, params);

    return {
      sessionId,
      cdpUrl: params.connectUrl ?? "",
      available: true,
    };
  }

  /** Ends a session; equivalent to deleteSession(). */
  async endSession(sessionId: string): Promise<void> {
    await this.deleteSession(sessionId);
  }

  /**
   * Reports whether a live (non-expired) session exists.
   * An expired session is deleted as a side effect. Does not refresh LRU order.
   */
  async hasSession(sessionId: string): Promise<boolean> {
    const node = this.items.get(sessionId);
    if (!node) return false;

    // Check if expired
    if (this.ttlMs > 0 && node.expiry <= Date.now()) {
      await this.deleteSession(sessionId);
      return false;
    }

    return true;
  }

  /**
   * Returns the V3 instance for a session, creating and initializing it on
   * first use. Marks the session as most recently used and, when the request
   * carries a logger, routes the session's log output to it.
   *
   * Concurrent first-use calls share a single initialization instead of each
   * creating (and leaking) their own V3 instance.
   *
   * @throws Error if the session does not exist, has expired, was deleted while
   *         initializing, or if V3 initialization fails.
   */
  async getOrCreateStagehand(
    sessionId: string,
    ctx: RequestContext,
  ): Promise<V3> {
    const node = this.items.get(sessionId);

    if (!node) {
      throw new Error(`Session not found: ${sessionId}`);
    }

    // Check if expired
    if (this.ttlMs > 0 && node.expiry <= Date.now()) {
      await this.deleteSession(sessionId);
      throw new Error(`Session expired: ${sessionId}`);
    }

    // Bump to most recently used
    this.bumpNode(node);

    // Update logger reference for this request
    if (ctx.logger) {
      node.loggerRef.current = ctx.logger;
    }

    // If V3 instance exists, return it
    if (node.stagehand) {
      return node.stagehand;
    }

    // Create V3 instance (lazy initialization), or join one already in flight.
    if (!node.initPromise) {
      const pending = this.initStagehand(node, ctx);
      node.initPromise = pending;
      // Forget the promise once settled so a failed init can be retried.
      const clearPending = () => {
        if (node.initPromise === pending) node.initPromise = null;
      };
      pending.then(clearPending, clearPending);
    }
    return node.initPromise;
  }

  /**
   * Creates and initializes the V3 instance for `node`.
   * On init failure the instance is closed (best effort) and the error is
   * rethrown. If the session was removed while init was running, the fresh
   * instance is closed and an error is thrown instead of attaching it to a
   * node nobody can reach any more.
   */
  private async initStagehand(node: LruNode, ctx: RequestContext): Promise<V3> {
    const options = this.buildV3Options(node.params, ctx, node.loggerRef);
    const stagehand = new V3(options);
    try {
      await stagehand.init();
    } catch (error) {
      try {
        await stagehand.close();
      } catch {
        // best-effort cleanup for failed init attempts
      }
      throw error;
    }

    if (this.items.get(node.sessionId) !== node) {
      try {
        await stagehand.close();
      } catch (error) {
        console.error(
          `Error closing stagehand for session ${node.sessionId}:`,
          error,
        );
      }
      throw new Error(`Session not found: ${node.sessionId}`);
    }

    node.stagehand = stagehand;
    return stagehand;
  }

  /**
   * Build V3Options from stored params and request context
   */
  private buildV3Options(
    params: CreateSessionParams,
    ctx: RequestContext,
    loggerRef: { current?: (message: LogLine) => void },
  ): V3Options {
    const isBrowserbase = params.browserType === "browserbase";

    const options: V3Options = {
      env: isBrowserbase ? "BROWSERBASE" : "LOCAL",
      model: {
        modelName: params.modelName,
        apiKey: ctx.modelApiKey,
      },
      verbose: params.verbose,
      systemPrompt: params.systemPrompt,
      selfHeal: params.selfHeal,
      domSettleTimeout: params.domSettleTimeoutMs,
      experimental: params.experimental,
      // Wrap logger to use the ref so it can be updated per-request
      logger: (message: LogLine) => {
        if (loggerRef.current) {
          loggerRef.current(message);
        }
      },
    };

    if (isBrowserbase) {
      options.apiKey = params.browserbaseApiKey;
      options.projectId = params.browserbaseProjectId;

      if (params.browserbaseSessionID) {
        options.browserbaseSessionID = params.browserbaseSessionID;
      }

      if (params.browserbaseSessionCreateParams) {
        options.browserbaseSessionCreateParams =
          params.browserbaseSessionCreateParams;
      }
    } else if (params.localBrowserLaunchOptions) {
      options.localBrowserLaunchOptions = params.localBrowserLaunchOptions;
    }

    return options;
  }

  /**
   * Stores a new session as the most recently used entry, evicting the least
   * recently used one first when the store is at capacity.
   *
   * @throws Error if `sessionId` is already present.
   */
  async createSession(
    sessionId: string,
    params: CreateSessionParams,
  ): Promise<void> {
    // Check if already exists
    if (this.items.has(sessionId)) {
      throw new Error(`Session already exists: ${sessionId}`);
    }

    // Evict LRU if at capacity
    if (this.maxCapacity > 0 && this.items.size >= this.maxCapacity) {
      await this.evictLru();
    }

    // Create new node
    const node: LruNode = {
      sessionId,
      params,
      stagehand: null, // Lazy initialization
      initPromise: null,
      loggerRef: {},
      expiry: this.ttlMs > 0 ? Date.now() + this.ttlMs : Infinity,
      prev: this.last,
      next: null,
    };

    this.items.set(sessionId, node);

    // Link to end of list
    if (this.last) this.last.next = node;
    this.last = node;
    if (!this.first) this.first = node;
  }

  /**
   * Removes a session and closes its V3 instance if one was created.
   * Unknown ids are ignored. Errors from closing are logged, not thrown.
   *
   * The session is removed from the map and the LRU list synchronously, BEFORE
   * the (asynchronous) close. This matters in two situations:
   * - several fire-and-forget evictions issued back to back each pick a
   *   different head node instead of all targeting the same one;
   * - concurrent deletes of the same id cannot both unlink the node, which
   *   would re-link neighbours through stale pointers.
   */
  async deleteSession(sessionId: string): Promise<void> {
    const node = this.items.get(sessionId);
    if (!node) return;

    // Remove from map and unlink from list first (see above).
    this.items.delete(sessionId);
    this.detachNode(node);

    // Close V3 instance if it exists
    const stagehand = node.stagehand;
    node.stagehand = null;
    if (!stagehand) return;

    try {
      await stagehand.close();
    } catch (error) {
      console.error(
        `Error closing stagehand for session ${sessionId}:`,
        error,
      );
    }
  }

  /**
   * Returns the parameters the session was created with.
   * Does not check expiry and does not refresh LRU order.
   *
   * @throws Error if the session does not exist.
   */
  async getSessionConfig(sessionId: string): Promise<CreateSessionParams> {
    const node = this.items.get(sessionId);

    if (!node) {
      throw new Error(`Session not found: ${sessionId}`);
    }

    // Return the stored params (contains browser metadata needed downstream)
    return node.params;
  }

  /**
   * Updates capacity and/or TTL at runtime.
   * If the store holds more sessions than the new capacity allows, the least
   * recently used ones are evicted in the background. A new TTL applies to a
   * session the next time its expiry is refreshed.
   *
   * @throws Error if `maxCapacity` is provided and is not greater than 0.
   */
  updateCacheConfig(config: SessionCacheConfig): void {
    if (config.maxCapacity !== undefined) {
      if (config.maxCapacity <= 0) {
        throw new Error("Max capacity must be greater than 0");
      }
      this.maxCapacity = config.maxCapacity;

      // Evict excess if the store now holds more than allowed. Comparing against
      // the current size (rather than the previous capacity) also covers a store
      // that was previously unlimited (capacity 0).
      const excess = this.items.size - this.maxCapacity;
      for (let i = 0; i < excess; i++) {
        // Fire and forget - don't await to match cloud behavior
        this.evictLru().catch(console.error);
      }
    }

    if (config.ttlMs !== undefined) {
      this.ttlMs = config.ttlMs;
    }
  }

  /** Returns the current capacity and TTL settings. */
  getCacheConfig(): SessionCacheConfig {
    return {
      maxCapacity: this.maxCapacity,
      ttlMs: this.ttlMs,
    };
  }

  /**
   * Stops the periodic cleanup and deletes every session, closing all V3
   * instances in parallel.
   */
  async destroy(): Promise<void> {
    // Stop cleanup interval
    if (this.cleanupInterval) {
      clearInterval(this.cleanupInterval);
      this.cleanupInterval = null;
    }

    // Close all V3 instances
    const sessionIds = Array.from(this.items.keys());
    await Promise.all(sessionIds.map((id) => this.deleteSession(id)));
  }

  /**
   * Get the number of cached sessions
   */
  get size(): number {
    return this.items.size;
  }
}


================================================
FILE: packages/server-v3/src/lib/SessionStore.ts
================================================
import type {
  Api,
  LocalBrowserLaunchOptions,
  LogLine,
  V3,
} from "@browserbasehq/stagehand";

/**
 * Result from SessionStore.startSession().
 * Alias of `Api.SessionStartResult` exported by `@browserbasehq/stagehand`.
 */
export type SessionStartResult = Api.SessionStartResult;

/**
 * Parameters for creating a new session.
 * This is what gets persisted - a subset of StartSessionParams
 * that excludes runtime-only values like modelApiKey.
 *
 * Includes cloud-specific fields that pass through to cloud implementations.
 * The library ignores fields it doesn't need, but they're available to SessionStore.
 *
 * Only `browserType` and `modelName` are required; every other field is optional.
 */
export interface CreateSessionParams {
  /** Browser choice for this session: a local browser or a Browserbase session */
  browserType: "local" | "browserbase";
  /** Model name (e.g., "openai/gpt-4o") */
  modelName: string;
  /** Verbosity level (0, 1, or 2) */
  verbose?: 0 | 1 | 2;
  /** Custom system prompt */
  systemPrompt?: string;
  /** Enable self-healing for failed actions */
  selfHeal?: boolean;
  /** DOM settle timeout in milliseconds */
  domSettleTimeoutMs?: number;
  /** Enable experimental features */
  experimental?: boolean;

  // Browserbase-specific (used by cloud implementations)
  /** Browserbase API key */
  browserbaseApiKey?: string;
  /** Browserbase project ID */
  browserbaseProjectId?: string;
  /** Existing Browserbase session ID to connect to */
  browserbaseSessionID?: string;
  /** Wait for captcha solves */
  waitForCaptchaSolves?: boolean;
  /** Browserbase session creation params (untyped key/value bag) */
  browserbaseSessionCreateParams?: Record<string, unknown>;
  /** Local browser launch overrides when browserType is local */
  localBrowserLaunchOptions?: LocalBrowserLaunchOptions;

  /** WebSocket URL for connecting to the browser (returned to client) */
  connectUrl?: string;

  // Cloud-specific metadata fields
  /** Act timeout in milliseconds */
  actTimeoutMs?: number;
  /** Client language (typescript, python, playground) */
  clientLanguage?: string;
  /** SDK version */
  sdkVersion?: string;
}

/**
 * Request-time context passed when resolving a session.
 * Contains values that come from the incoming request rather than storage.
 */
export interface RequestContext {
  /**
   * Model API key supplied with the request (the request body's
   * `options.model.apiKey`, or else the x-model-api-key header).
   */
  modelApiKey?: string;
  /** Logger function for this request; optional */
  logger?: (message: LogLine) => void;
}

/**
 * Configuration options for session cache behavior.
 * Both fields are optional.
 */
export interface SessionCacheConfig {
  /** Maximum number of sessions to cache. Default: 100 */
  maxCapacity?: number;
  /** TTL for cached sessions in milliseconds. Default: 300000 (5 minutes) */
  ttlMs?: number;
}

/**
 * SessionStore interface for managing session lifecycle and V3 instances.
 *
 * The library provides an InMemorySessionStore as the default implementation
 * with full caching support (TTL, LRU eviction, etc.).
 *
 * Cloud environments can implement this interface to:
 * - Persist session config to a database
 * - Use custom caching strategies (e.g., LaunchDarkly-driven config)
 * - Add eviction hooks for cleanup
 * - Handle platform-specific session lifecycle (e.g., Browserbase)
 *
 * This enables stateless pod architectures where any pod can handle any request.
 *
 * Every method except `updateCacheConfig` and `getCacheConfig` is required.
 */
export interface SessionStore {
  /**
   * Start a new session.
   *
   * This is the main entry point for session creation. Implementations can:
   * - Create platform-specific resources (e.g., Browserbase session)
   * - Persist session config to storage
   * - Check feature flags for availability
   *
   * @param params - Session configuration
   * @returns Session ID and availability status
   */
  startSession(params: CreateSessionParams): Promise<SessionStartResult>;

  /**
   * End a session and cleanup all resources.
   *
   * This is the main entry point for session cleanup. Implementations can:
   * - Close platform-specific resources (e.g., Browserbase session)
   * - Evict V3 instance from cache
   * - Update session status in storage
   *
   * @param sessionId - The session identifier
   */
  endSession(sessionId: string): Promise<void>;

  /**
   * Check if a session exists.
   * @param sessionId - The session identifier
   * @returns true if the session exists
   */
  hasSession(sessionId: string): Promise<boolean>;

  /**
   * Get or create a V3 instance for a session.
   *
   * This method handles:
   * - Checking the cache for an existing V3 instance
   * - On cache miss: loading config, creating V3, caching it
   * - Updating the logger reference for streaming
   *
   * @param sessionId - The session identifier
   * @param ctx - Request-time context containing values from headers
   * @returns The V3 instance ready for use
   * @throws Error if session not found
   */
  getOrCreateStagehand(sessionId: string, ctx: RequestContext): Promise<V3>;

  /**
   * Create a new session with the given parameters.
   * Lower-level than startSession - just stores the config.
   * @param sessionId - The session identifier
   * @param params - Session configuration to persist
   */
  createSession(sessionId: string, params: CreateSessionParams): Promise<void>;

  /**
   * Delete a session from cache and close V3 instance.
   * Lower-level than endSession - just handles cache cleanup.
   * @param sessionId - The session identifier
   */
  deleteSession(sessionId: string): Promise<void>;

  /**
   * Retrieve the stored session configuration for a given session.
   * @param sessionId - The session identifier
   * @returns The session parameters held for that session
   */
  getSessionConfig(sessionId: string): Promise<CreateSessionParams>;

  /**
   * Update cache configuration dynamically.
   * Optional: implementations may omit this method, so callers must check
   * that it exists before invoking it.
   * @param config - New cache configuration values
   */
  updateCacheConfig?(config: SessionCacheConfig): void;

  /**
   * Get current cache configuration.
   * Optional: implementations may omit this method, so callers must check
   * that it exists before invoking it.
   * @returns Current cache config
   */
  getCacheConfig?(): SessionCacheConfig;

  /**
   * Cleanup all resources (close all V3 instances, stop timers).
   * Called when shutting down the server.
   */
  destroy(): Promise<void>;
}


================================================
FILE: packages/server-v3/src/lib/auth.ts
================================================
import type { FastifyRequest } from "fastify";

/**
 * Decides whether a request may proceed.
 *
 * The request is not inspected at the moment: the outcome is whatever
 * `isAuthenticated()` resolves to, because authentication is disabled until
 * a real auth backend is wired up.
 *
 * @param request - The incoming Fastify request (currently unused)
 * @returns Resolves to true when the request is allowed
 */
export const authMiddleware = async (
  // eslint-disable-next-line @typescript-eslint/no-unused-vars
  request: FastifyRequest,
): Promise<boolean> => {
  const allowed = await isAuthenticated();
  return allowed;
};

// TODO: Temporarily disable auth until setup in supabase
// Placeholder check: always resolves to true, so every caller is treated as authenticated.
const isAuthenticated = async (): Promise<boolean> => true;


================================================
FILE: packages/server-v3/src/lib/env.ts
================================================
import { createEnv } from "@t3-oss/env-core";
import { z } from "zod/v4";

// Temporarily defining here until browserbase zod package is updated to 3.25.0+
// Allowed values for BB_ENV.
const bbEnvSchema = z.enum(["local", "dev", "prod"]);

/**
 * Validated environment configuration for the server.
 *
 * - NODE_ENV must be one of "development", "production", "staging" or "test";
 *   "production" is used when the process variable is unset.
 * - BB_ENV must be one of "local", "dev" or "prod"; "local" is used when the
 *   process variable is unset.
 *
 * No client-side variables are declared (`client` is empty).
 */
export const env = createEnv({
  server: {
    NODE_ENV: z.enum(["development", "production", "staging", "test"]),
    BB_ENV: bbEnvSchema,
  },
  client: {},
  clientPrefix: "PUBLIC_",
  runtimeEnv: {
    // `??` only substitutes the default when the variable is null/undefined
    NODE_ENV: process.env.NODE_ENV ?? "production",
    BB_ENV: process.env.BB_ENV ?? "local",
  },
});


================================================
FILE: packages/server-v3/src/lib/errorHandler.ts
================================================
import type {
  FastifyReply,
  FastifyRequest,
  RouteGenericInterface,
} from "fastify";
import { StatusCodes } from "http-status-codes";

import { error } from "./response.js";

/**
 * Error carrying an HTTP status code plus a flag that says whether its
 * message must be hidden from clients.
 */
export class AppError extends Error {
  statusCode: number;
  isInternal: boolean;

  /**
   * @param message - Error message
   * @param statusCode - HTTP status to respond with; defaults to `StatusCodes.BAD_REQUEST`
   * @param isInternal - When true, `getClientMessage()` replaces the message with a generic one
   */
  constructor(
    message: string,
    statusCode = StatusCodes.BAD_REQUEST,
    isInternal = false,
  ) {
    super(message);
    this.statusCode = statusCode;
    this.isInternal = isInternal;
    // Use the concrete class name so subclasses report their own name
    this.name = this.constructor.name;
    Error.captureStackTrace(this, this.constructor);
  }

  /**
   * Produces the text that may be sent to clients.
   *
   * Errors not flagged as internal expose their own message. Internal errors
   * return a generic sentence chosen by status code: one wording at or above
   * `StatusCodes.INTERNAL_SERVER_ERROR`, another below it.
   */
  getClientMessage(): string {
    if (!this.isInternal) {
      return this.message;
    }

    if (this.statusCode >= StatusCodes.INTERNAL_SERVER_ERROR) {
      return "An internal server error occurred";
    }
    return "An error occurred while processing your request";
  }
}

/**
 * Decorates a route handler so that anything it throws becomes an error reply.
 *
 * The thrown value is logged through `request.log.error`. An `AppError` is
 * answered with its client-safe message and its own status code; any other
 * value is answered with a generic 500 response.
 *
 * @param handler The route handler to wrap
 * @returns A handler with the same parameters that never rejects because of `handler`
 */
export function withErrorHandling<
  T extends RouteGenericInterface = RouteGenericInterface,
  R = unknown,
>(handler: (request: FastifyRequest<T>, reply: FastifyReply) => Promise<R>) {
  return async (
    request: FastifyRequest<T>,
    reply: FastifyReply,
  ): Promise<R | FastifyReply> => {
    try {
      return await handler(request, reply);
    } catch (thrown) {
      request.log.error(thrown);

      if (!(thrown instanceof AppError)) {
        return error(
          reply,
          "An internal server error occurred",
          StatusCodes.INTERNAL_SERVER_ERROR,
        );
      }

      return error(reply, thrown.getClientMessage(), thrown.statusCode);
    }
  };
}


================================================
FILE: packages/server-v3/src/lib/header.ts
================================================
import type { FastifyRequest } from "fastify";

import { MissingHeaderError } from "../types/error.js";

/**
 * Reads a required request header.
 *
 * The lookup is case-insensitive: `request.headers` stores header names
 * lower-cased, so the requested name is lower-cased before the lookup. When
 * the header has several values, the first one is returned.
 *
 * @param request - The incoming Fastify request
 * @param header - Header name, in any letter case
 * @returns The header value (never empty)
 * @throws MissingHeaderError if the header is absent or its value is empty
 */
export const dangerouslyGetHeader = (
  request: FastifyRequest,
  header: string,
): string => {
  const rawValue = request.headers[header.toLowerCase()];
  const value = Array.isArray(rawValue) ? rawValue[0] : rawValue;

  if (!value) {
    // Report the name exactly as the caller wrote it
    throw new MissingHeaderError(header);
  }
  return value;
};

/**
 * Reads an optional request header.
 *
 * The lookup is case-insensitive: `request.headers` stores header names
 * lower-cased, so the requested name is lower-cased before the lookup. When
 * the header has several values, the first one is returned.
 *
 * @param request - The incoming Fastify request
 * @param header - Header name, in any letter case
 * @returns The header value, or undefined when it is absent or empty
 */
export const getOptionalHeader = (
  request: FastifyRequest,
  header: string,
): string | undefined => {
  const rawValue = request.headers[header.toLowerCase()];
  const value = Array.isArray(rawValue) ? rawValue[0] : rawValue;

  // Empty strings are treated the same as a missing header
  return value || undefined;
};

/**
 * Extracts the model name from the request body.
 *
 * Candidates are checked in this order, and the first non-empty string wins:
 * 1. V3 structure: body.options.model.modelName
 * 2. Top-level body.modelName
 *
 * @returns The model name, or undefined when neither location holds one
 */
export function getModelName(request: FastifyRequest): string | undefined {
  const body = request.body as Record<string, unknown> | undefined;
  const options = body?.options as Record<string, unknown> | undefined;
  const model = options?.model as Record<string, unknown> | undefined;

  const candidates: unknown[] = [model?.modelName, body?.modelName];
  return candidates.find(
    (candidate): candidate is string =>
      typeof candidate === "string" && candidate.length > 0,
  );
}

/**
 * Resolves the model API key for a request.
 *
 * Precedence:
 * 1. A non-empty string at body.options.model.apiKey (V3 body structure)
 * 2. The x-model-api-key request header
 *
 * @returns The API key, or undefined when neither source provides one
 */
export function getModelApiKey(request: FastifyRequest): string | undefined {
  const body = request.body as Record<string, unknown> | undefined;
  const options = body?.options as Record<string, unknown> | undefined;
  const model = options?.model as Record<string, unknown> | undefined;
  const bodyKey = model?.apiKey;

  if (typeof bodyKey !== "string" || bodyKey === "") {
    return getOptionalHeader(request, "x-model-api-key");
  }
  return bodyKey;
}

/**
 * Decides whether the response should be streamed as Server-Sent Events.
 *
 * The body's `streamResponse` wins when it is a boolean or a string (a
 * string counts as true only if it equals "true", ignoring case). Otherwise
 * the x-stream-response header is consulted with the same string rule.
 * With neither present the answer is false (non-streaming).
 */
export function shouldRespondWithSSE(request: FastifyRequest): boolean {
  const body = request.body as Record<string, unknown> | undefined;
  const requested = body?.streamResponse;

  switch (typeof requested) {
    case "boolean":
      return requested;
    case "string":
      return requested.toLowerCase() === "true";
    default: {
      const streamHeader = getOptionalHeader(request, "x-stream-response");
      return streamHeader ? streamHeader.toLowerCase() === "true" : false;
    }
  }
}


================================================
FILE: packages/server-v3/src/lib/logging/index.ts
================================================
import { FastifyInstance } from "fastify";

import { env } from "../../lib/env.js";

// Probe endpoints whose request logs are skipped when BB_ENV is "local"
const ignoredRoutes = ["/healthz", "/readyz"];

// A request is logged unless we run locally AND its URL is exactly one of the ignored routes
const shouldLog = (url: string) => {
  if (env.BB_ENV !== "local") {
    return true;
  }
  return !ignoredRoutes.includes(url);
};

/**
 * Registers request/response logging hooks on the Fastify instance.
 *
 * Each hook writes one info-level entry through the request's logger, unless
 * `shouldLog` rejects the request URL. Both hooks always call `done()`.
 */
const logging = (app: FastifyInstance) => {
  // Emitted when a request arrives
  app.addHook("onRequest", (req, _reply, done) => {
    if (!shouldLog(req.url)) {
      done();
      return;
    }

    const requestInfo = {
      host: req.hostname,
      method: req.method,
      remoteAddress: req.ip,
      remotePort: req.socket.remotePort,
      url: req.url,
    };
    req.log.info({ req: requestInfo, reqId: req.id }, "incoming request");
    done();
  });

  // Emitted once the response has been sent; adds status code and elapsed time
  app.addHook("onResponse", (req, reply, done) => {
    if (!shouldLog(req.url)) {
      done();
      return;
    }

    const requestInfo = {
      host: req.hostname,
      method: req.method,
      remoteAddress: req.ip,
      remotePort: req.socket.remotePort,
      url: req.url,
    };
    req.log.info(
      {
        reqId: req.id,
        req: requestInfo,
        res: { statusCode: reply.statusCode },
        responseTime: reply.elapsedTime,
      },
      "request completed",
    );
    done();
  });
};

export { logging };


================================================
FILE: packages/server-v3/src/lib/response.ts
================================================
import type { FastifyReply } from "fastify";
import { StatusCodes } from "http-status-codes";

/** Body shape of a successful reply: `success` is the literal true and `data` holds the payload. */
interface SuccessResponse<T> {
  success: true;
  data: T;
}

/** Body shape of a failed reply: `success` is the literal false and `message` describes the failure. */
interface ErrorResponse {
  success: false;
  message: string;
}

/** Either reply shape; the `success` field discriminates between the two. */
type ApiResponse<T> = SuccessResponse<T> | ErrorResponse;

/**
 * Sends a success envelope (`{ success: true, data }`) on the given reply.
 *
 * @param reply - Fastify reply to send on
 * @param data - Payload placed under `data`
 * @param status - HTTP status code; defaults to `StatusCodes.OK`
 * @returns Whatever `reply.status(...).send(...)` returns
 */
export function success<T>(
  reply: FastifyReply,
  data: T,
  status = StatusCodes.OK,
): FastifyReply {
  const payload = { success: true, data };
  return reply.status(status).send(payload);
}

/**
 * Sends an error envelope (`{ success: false, message }`) on the given reply.
 *
 * @param reply - Fastify reply to send on
 * @param message - Text placed under `message`
 * @param status - HTTP status code; defaults to `StatusCodes.BAD_REQUEST`
 * @returns Whatever `reply.status(...).send(...)` returns
 */
export function error(
  reply: FastifyReply,
  message: string,
  status = StatusCodes.BAD_REQUEST,
): FastifyReply {
  const payload = { success: false, message };
  return reply.status(status).send(payload);
}

/** Type guard: narrows an API response to the success shape by reading its `success` flag. */
export function isSuccessResponse<T>(
  response: ApiResponse<T>,
): response is SuccessResponse<T> {
  const { success: succeeded } = response;
  return succeeded;
}

/** Type guard: narrows an API response to the error shape by negating its `success` flag. */
export function isErrorResponse(
  response: ApiResponse<unknown>,
): response is ErrorResponse {
  const { success: succeeded } = response;
  return !succeeded;
}


================================================
FILE: packages/server-v3/src/lib/sessionStoreManager.ts
================================================
import { InMemorySessionStore } from "./InMemorySessionStore.js";
import type { SessionCacheConfig, SessionStore } from "./SessionStore.js";

// Module-wide session store; stays null until initializeSessionStore() runs
let sessionStore: SessionStore | null = null;

/**
 * Returns the shared session store, creating an InMemorySessionStore on the
 * first call.
 *
 * `config` is only used when the store is created; if a store already
 * exists it is returned unchanged and `config` is ignored.
 */
export function initializeSessionStore(
  config?: SessionCacheConfig,
): SessionStore {
  sessionStore ??= new InMemorySessionStore(config);
  return sessionStore;
}

/**
 * Returns the shared session store.
 *
 * @throws Error if no store is currently set
 */
export function getSessionStore(): SessionStore {
  if (sessionStore) {
    return sessionStore;
  }
  throw new Error("Session store has not been initialized");
}

/**
 * Destroys the shared session store, if one exists, and clears the module
 * reference once `destroy()` has resolved. Does nothing when no store is set.
 */
export async function destroySessionStore(): Promise<void> {
  if (!sessionStore) {
    return;
  }

  await sessionStore.destroy();
  sessionStore = null;
}


================================================
FILE: packages/server-v3/src/lib/stream.ts
================================================
import type { FastifyReply, FastifyRequest } from "fastify";
import { StatusCodes } from "http-status-codes";
import type { Stagehand as V3Stagehand } from "@browserbasehq/stagehand";
import { v4 } from "uuid";
import { z } from "zod/v4";

import { AppError } from "./errorHandler.js";
import {
  getModelApiKey,
  getModelName,
  getOptionalHeader,
  shouldRespondWithSSE,
} from "./header.js";
import { error, success } from "./response.js";
import { getSessionStore } from "./sessionStoreManager.js";
import type { RequestContext } from "./SessionStore.js";

/**
 * Arguments accepted by createStreamingResponse.
 * `TV3` is the type produced by parsing the request body with `schema`.
 */
interface StreamingResponseOptions<TV3> {
  /** Identifier of the session the operation runs against */
  sessionId: string;
  /** Incoming Fastify request (body and headers are read from it) */
  request: FastifyRequest;
  /** Fastify reply used to send the JSON response or the event stream */
  reply: FastifyReply;
  /** Zod schema the request body is validated against */
  schema: z.ZodType<TV3>;
  /**
   * Performs the operation with the resolved Stagehand instance and the
   * parsed body. Its `result` is returned to the client.
   */
  handler: (ctx: {
    stagehand: V3Stagehand;
    data: TV3;
  }) => Promise<{ result: unknown; actionId?: string }>;
  /** Label used in failure logs and generic error messages; "operation" is used when omitted */
  operation?: string;
}

/**
 * Runs a session operation and answers either with a single JSON response or,
 * when the client asked for it, with a Server-Sent Events stream.
 *
 * Steps, in order:
 * 1. Load the stored session config. For "browserbase" sessions, require a
 *    Browserbase API key and project ID (stored config first, then the
 *    x-bb-api-key / x-bb-project-id headers); reply 400 if either is missing.
 * 2. Validate the request body against `schema`; reply 400 on failure.
 * 3. When streaming, write the SSE response headers on the raw response.
 * 4. Resolve the Stagehand instance for the session via the session store.
 * 5. Invoke `handler` and report its result or failure.
 *
 * In streaming mode progress is reported as `system` / `log` events and the
 * raw response is ended by this function. In non-streaming mode the outcome
 * is sent through the `success` / `error` helpers.
 *
 * @returns The Fastify reply
 */
export async function createStreamingResponse<TV3>({
  sessionId,
  request,
  reply,
  schema,
  handler,
  operation,
}: StreamingResponseOptions<TV3>) {
  const shouldStreamResponse = shouldRespondWithSSE(request);
  const modelApiKey = getModelApiKey(request);

  const sessionStore = getSessionStore();
  const sessionConfig = await sessionStore.getSessionConfig(sessionId);
  const browserType = sessionConfig.browserType ?? "local";

  let browserbaseApiKey = sessionConfig.browserbaseApiKey;
  let browserbaseProjectId = sessionConfig.browserbaseProjectId;

  // Browserbase credentials: the stored config wins, request headers are the fallback.
  // Past this check the two values are only used for the diagnostic flags in the failure log below.
  if (browserType === "browserbase") {
    browserbaseApiKey =
      browserbaseApiKey ?? getOptionalHeader(request, "x-bb-api-key");
    browserbaseProjectId =
      browserbaseProjectId ?? getOptionalHeader(request, "x-bb-project-id");

    if (!browserbaseApiKey || !browserbaseProjectId) {
      return reply.status(StatusCodes.BAD_REQUEST).send({
        error:
          "Browserbase API key and project ID are required for browserbase sessions",
      });
    }
  }

  // Parse data using V3 schema
  let parsedData: TV3;

  try {
    const json: unknown = request.body;
    parsedData = await schema.parseAsync(json);
  } catch (err) {
    const parseError = err as Error | z.ZodError;

    if (parseError instanceof z.ZodError) {
      // Only the first segment of each issue path is reported to the client
      return reply.status(StatusCodes.BAD_REQUEST).send({
        error: parseError.issues.map((issue) => ({
          path: issue.path[0],
          message: issue.message,
        })),
      });
    }

    return reply
      .status(StatusCodes.BAD_REQUEST)
      .send({ error: parseError.message });
  }

  // Streaming mode: the SSE headers are written directly on the raw response.
  // From here on, streaming replies are produced with reply.raw.write / reply.raw.end.
  if (shouldStreamResponse) {
    try {
      reply.raw.writeHead(StatusCodes.OK, {
        "Content-Type": "text/event-stream",
        "Cache-Control": "no-cache, no-transform",
        Connection: "keep-alive",
        "Transfer-Encoding": "chunked",
        "X-Accel-Buffering": "no",
        "Access-Control-Allow-Origin": "*",
        "Access-Control-Allow-Methods": "GET, POST, PUT, DELETE, OPTIONS",
        "Access-Control-Allow-Headers": "*",
      });
      // eslint-disable-next-line @typescript-eslint/no-unused-vars
    } catch (_err) {
      return error(
        reply,
        "Failed to write head",
        StatusCodes.INTERNAL_SERVER_ERROR,
      );
    }
  }

  // Writes one SSE event as `data: {"data":…,"type":…,"id":…}` followed by a blank line.
  // No-op in non-streaming mode, so callers below can invoke it unconditionally.
  const sendData = (type: string, data: object) => {
    if (!shouldStreamResponse) {
      return;
    }

    reply.raw.write(`data: ${JSON.stringify({ data, type, id: v4() })}\n\n`);
  };

  // Identifier reported with the final result.
  // NOTE(review): the optional `actionId` returned by `handler` is never read in this function - confirm that is intended.
  const actionId = v4();

  sendData("system", { status: "starting" });

  // A logger is only passed along when streaming; it forwards each log line as a `log` event.
  const requestContext: RequestContext = {
    modelApiKey,
    logger: shouldStreamResponse
      ? (message) => {
          sendData("log", { status: "running", message });
        }
      : undefined,
  };

  let stagehand: V3Stagehand;
  try {
    stagehand = (await sessionStore.getOrCreateStagehand(
      sessionId,
      requestContext,
    )) as V3Stagehand;
  } catch (err) {
    const loadError = err instanceof Error ? err : new Error(String(err));

    // The raw error message is reported to the client here (it is not passed through getClientMessage)
    sendData("system", { status: "error", error: loadError.message });

    if (shouldStreamResponse) {
      reply.raw.end();
      return reply;
    }

    return error(
      reply,
      loadError.message,
      loadError instanceof AppError
        ? loadError.statusCode
        : StatusCodes.INTERNAL_SERVER_ERROR,
    );
  }

  sendData("system", { status: "connected" });

  let result: Awaited<ReturnType<typeof handler>> | null = null;
  let handlerError: Error | null = null;

  // Handler failures are captured rather than rethrown so they can be logged once
  // and then reported in whichever response mode is active.
  try {
    result = await handler({ stagehand, data: parsedData });
  } catch (err) {
    handlerError = err instanceof Error ? err : new Error("Unknown error");
    // Only boolean "has…" flags are logged for the keys, never the key values themselves
    request.log.error(
      {
        err: handlerError,
        operation: operation ?? "operation",
        sessionId,
        browserType,
        modelName: getModelName(request),
        hasModelApiKey: Boolean(modelApiKey),
        hasBrowserbaseApiKey: Boolean(browserbaseApiKey),
        hasBrowserbaseProjectId: Boolean(browserbaseProjectId),
      },
      "operation handler failed",
    );
  }

  if (handlerError) {
    // AppError supplies its own client-safe text; anything else gets a generic "<operation> failed"
    const clientMessage =
      handlerError instanceof AppError
        ? handlerError.getClientMessage()
        : `${operation ?? "operation"} failed`;

    sendData("system", { status: "error", error: clientMessage });

    if (shouldStreamResponse) {
      reply.raw.end();
      return reply;
    }

    const statusCode =
      handlerError instanceof AppError
        ? handlerError.statusCode
        : StatusCodes.INTERNAL_SERVER_ERROR;
    return error(reply, clientMessage, statusCode);
  }

  // Success: the final `finished` event (streaming) or the JSON body (non-streaming)
  // carries the handler's result and the locally generated actionId.
  sendData("system", {
    status: "finished",
    result: result?.result,
    actionId,
  });

  if (shouldStreamResponse) {
    reply.raw.end();
    return reply;
  }

  return success(reply, { result: result?.result, actionId });
}


================================================
FILE: packages/server-v3/src/lib/utils.ts
================================================
import { StatusCodes } from "http-status-codes";
import { z } from "zod/v3";
import type { ZodTypeAny } from "zod/v3";

import { LegacyModel, LegacyProvider } from "../types/model.js";
import { AppError } from "./errorHandler.js";

/**
 * The subset of JSON Schema keywords accepted by jsonSchemaToZod.
 * Every field is optional.
 */
interface JSONSchema {
  /** A single type name, or a list of alternative type names */
  type?: string | string[];
  /** Sub-schemas for object properties, keyed by property name */
  properties?: Record<string, JSONSchema>;
  /** Names of the object properties that must be present */
  required?: string[];
  /** Human-readable description */
  description?: string;
  /** Schema for array elements */
  items?: JSONSchema;
  /** Allowed string values */
  enum?: string[];
  /** Lower bound for numbers */
  minimum?: number;
  /** Upper bound for numbers */
  maximum?: number;
  /** String format */
  format?: "uri" | "url" | "email" | "uuid";
  /** Alternative sub-schemas */
  anyOf?: JSONSchema[];
  /** Alternative sub-schemas */
  oneOf?: JSONSchema[];
  /** NOTE(review): declared here, but jsonSchemaToZod in this file has no branch that reads `allOf` */
  allOf?: JSONSchema[];
}

/**
 * Collapses a list of alternative Zod schemas into a single schema:
 * no alternatives -> `z.any()`, one alternative -> that schema,
 * two or more -> a `z.union` of all of them.
 */
function combineAlternatives(alternatives: ZodTypeAny[]): ZodTypeAny {
  const [first] = alternatives;
  if (alternatives.length === 0 || !first) {
    return z.any();
  }
  if (alternatives.length === 1) {
    return first;
  }
  return z.union(alternatives as [ZodTypeAny, ZodTypeAny, ...ZodTypeAny[]]);
}

/**
 * Converts a JSON Schema object to a Zod schema.
 *
 * Handling, in order of precedence:
 * - `type` given as a list: each entry is converted on its own (with the
 *   remaining keywords copied over) and the results are combined as alternatives.
 * - `anyOf`, then `oneOf`: the sub-schemas are converted and combined as
 *   alternatives. `oneOf` is treated exactly like `anyOf`.
 * - Otherwise the single `type` selects the conversion: "object", "array",
 *   "string", "integer"/"number", "boolean" or "null". Any other or missing
 *   type yields `z.any()`.
 *
 * For objects with a `required` list, every property is first made optional
 * and then the listed ones are made required; without a `required` list the
 * object is left as built by `z.object`.
 *
 * `description` is attached to objects with properties, arrays with `items`,
 * and all primitive types, including strings restricted by `enum`.
 * `allOf` is not interpreted.
 *
 * @param schema The JSON Schema object to convert
 * @returns A Zod schema equivalent to the input JSON Schema
 * @throws AppError (400) if an object property maps to a missing sub-schema
 */
export function jsonSchemaToZod(schema: JSONSchema): ZodTypeAny {
  if (Array.isArray(schema.type)) {
    return combineAlternatives(
      schema.type.map((singleType) =>
        jsonSchemaToZod({ ...schema, type: singleType }),
      ),
    );
  }

  if (schema.anyOf && Array.isArray(schema.anyOf)) {
    return combineAlternatives(schema.anyOf.map((sub) => jsonSchemaToZod(sub)));
  }

  if (schema.oneOf && Array.isArray(schema.oneOf)) {
    return combineAlternatives(schema.oneOf.map((sub) => jsonSchemaToZod(sub)));
  }

  switch (schema.type) {
    case "object":
      if (schema.properties) {
        const shape: Record<string, ZodTypeAny> = {};
        for (const key in schema.properties) {
          const subSchema = schema.properties[key];
          if (!subSchema) {
            throw new AppError(
              `Property ${key} is not defined in the schema`,
              StatusCodes.BAD_REQUEST,
            );
          }
          shape[key] = jsonSchemaToZod(subSchema);
        }
        let zodObject = z.object(shape);

        if (schema.required && Array.isArray(schema.required)) {
          // Build the { key: true } mask expected by `.required(...)`
          const requiredFields = schema.required.reduce<Record<string, true>>(
            (acc, key) => {
              acc[key] = true;
              return acc;
            },
            {},
          );
          // Make everything optional first, then re-require only the listed keys
          zodObject = zodObject.partial().required(requiredFields);
        }

        if (schema.description) {
          zodObject = zodObject.describe(schema.description);
        }
        return zodObject;
      }

      return z.object({});

    case "array":
      if (schema.items) {
        let zodArray = z.array(jsonSchemaToZod(schema.items));
        if (schema.description) {
          zodArray = zodArray.describe(schema.description);
        }
        return zodArray;
      }
      return z.array(z.any());

    case "string": {
      if (schema.enum) {
        const zodEnum = z
          .string()
          .refine((val) => schema.enum?.includes(val) ?? false);
        // Keep the description on enum strings, like every other primitive branch
        return schema.description
          ? zodEnum.describe(schema.description)
          : zodEnum;
      }
      let zodString = z.string();

      switch (schema.format) {
        case "uri":
        case "url":
          zodString = zodString.url();
          break;
        case "email":
          zodString = zodString.email();
          break;
        case "uuid":
          zodString = zodString.uuid();
          break;
        default:
      }

      if (schema.description) {
        zodString = zodString.describe(schema.description);
      }
      return zodString;
    }

    case "integer": // integer is a subset of number
    case "number": {
      let zodNumber = z.number();
      if (schema.minimum !== undefined) {
        zodNumber = zodNumber.min(schema.minimum);
      }
      if (schema.maximum !== undefined) {
        zodNumber = zodNumber.max(schema.maximum);
      }
      if (schema.description) {
        zodNumber = zodNumber.describe(schema.description);
      }
      return zodNumber;
    }

    case "boolean": {
      let zodBoolean = z.boolean();
      if (schema.description) {
        zodBoolean = zodBoolean.describe(schema.description);
      }
      return zodBoolean;
    }

    case "null": {
      let zodNull = z.null();
      if (schema.description) {
        zodNull = zodNull.describe(schema.description);
      }
      return zodNull;
    }

    default:
      // fallback if no recognized schema.type is present
      return z.any();
  }
}

// Legacy model names grouped by the provider that serves them
const OPENAI_LEGACY_MODELS: readonly string[] = [
  "gpt-4o",
  "gpt-4o-mini",
  "gpt-4o-2024-08-06",
  "gpt-4o-2024-05-13",
  "o1-mini",
  "o1-preview",
  "gpt-4.5-preview",
  "o3-mini",
];
const GOOGLE_LEGACY_MODELS: readonly string[] = [
  "gemini-1.5-flash",
  "gemini-1.5-pro",
  "gemini-1.5-flash-8b",
  "gemini-2.0-flash-lite",
  "gemini-2.0-flash",
  "gemini-2.5-pro-preview-03-25",
  "gemini-2.5-flash-preview-04-17",
];
// Recognized names that are rejected because the provider is not supported yet
const CEREBRAS_LEGACY_MODELS: readonly string[] = [
  "cerebras-llama-3.3-70b",
  "cerebras-llama-3.1-8b",
];
const GROQ_LEGACY_MODELS: readonly string[] = [
  "groq-llama-3.3-70b-specdec",
  "groq-llama-3.3-70b-versatile",
];

// This function is legacy and will not be required after complete AISDK migration
/**
 * Maps a legacy model name to its provider.
 *
 * @returns "openai" or "google" for the supported model names
 * @throws AppError (400) for Cerebras and Groq models, and for unknown names
 */
export function mapModelToProvider(model: LegacyModel): LegacyProvider {
  if (OPENAI_LEGACY_MODELS.includes(model)) {
    return "openai";
  }
  if (GOOGLE_LEGACY_MODELS.includes(model)) {
    return "google";
  }
  if (CEREBRAS_LEGACY_MODELS.includes(model)) {
    throw new AppError(
      "Cerebras models are not supported yet",
      StatusCodes.BAD_REQUEST,
    );
  }
  if (GROQ_LEGACY_MODELS.includes(model)) {
    throw new AppError(
      "Groq models are not supported yet",
      StatusCodes.BAD_REQUEST,
    );
  }

  const errorMessage = `Unknown model: ${String(model)}`;
  throw new AppError(errorMessage, StatusCodes.BAD_REQUEST);
}


================================================
FILE: packages/server-v3/src/routes/healthcheck.ts
================================================
import type { RouteOptions } from "fastify";
import { z } from "zod/v4";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import { withErrorHandling } from "../lib/errorHandler.js";

// Shape of the 200 response body; `.strict()` disallows additional keys
const healthcheckResponseSchema = z
  .object({
    status: z.string(),
    timestamp: z.string(),
  })
  .strict();

/**
 * GET /healthz - liveness probe.
 * Replies with `status: "ok"` and the current time as an ISO-8601 string.
 * Route logging is silenced and the route is hidden from the OpenAPI spec.
 */
const healthcheckRoute: RouteOptions = {
  method: "GET",
  url: "/healthz",
  logLevel: "silent",
  schema: {
    hide: true, // Hide from OpenAPI spec - utility endpoint
    response: {
      200: healthcheckResponseSchema,
    },
  } satisfies FastifyZodOpenApiSchema,
  handler: withErrorHandling(async () => ({
    status: "ok",
    timestamp: new Date().toISOString(),
  })),
};

export default healthcheckRoute;


================================================
FILE: packages/server-v3/src/routes/readiness.ts
================================================
import type { RouteOptions } from "fastify";
import { StatusCodes } from "http-status-codes";
import { z } from "zod/v4";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import { withErrorHandling } from "../lib/errorHandler.js";

// Readiness flag for this module; false until setReady() is called
let isReady = false;

/**
 * Reports the current readiness state of the server.
 * @returns Whether the server is marked ready to accept requests
 */
export const getIsReady = (): boolean => isReady;

/**
 * Flags the server as ready to accept requests.
 */
export const setReady = (): void => {
  isReady = true;
};

/**
 * Flags the server as not ready to accept requests.
 * Used during graceful shutdown to stop accepting new requests.
 */
export const setUnready = (): void => {
  isReady = false;
};

/**
 * GET /readyz - readiness probe.
 * Replies 200 "Ready" while the readiness flag is set, and
 * 503 "Service Unavailable" otherwise.
 * Route logging is silenced and the route is hidden from the OpenAPI spec.
 */
const readinessRoute: RouteOptions = {
  method: "GET",
  url: "/readyz",
  logLevel: "silent",
  schema: {
    hide: true, // Hide from OpenAPI spec - utility endpoint
    response: {
      200: z.string(),
      503: z.string(),
    },
  } satisfies FastifyZodOpenApiSchema,
  handler: withErrorHandling(async (_request, reply) =>
    isReady
      ? reply.code(StatusCodes.OK).send("Ready")
      : reply.code(StatusCodes.SERVICE_UNAVAILABLE).send("Service Unavailable"),
  ),
};

export default readinessRoute;


================================================
FILE: packages/server-v3/src/routes/v1/sessions/_id/act.ts
================================================
import type { RouteHandlerMethod, RouteOptions } from "fastify";
import { StatusCodes } from "http-status-codes";
import type { ActResult, Action } from "@browserbasehq/stagehand";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";
import { Api } from "@browserbasehq/stagehand";

import { authMiddleware } from "../../../../lib/auth.js";
import { AppError, withErrorHandling } from "../../../../lib/errorHandler.js";
import { createStreamingResponse } from "../../../../lib/stream.js";
import { getSessionStore } from "../../../../lib/sessionStoreManager.js";

/**
 * Handler for POST /sessions/:id/act.
 *
 * Rejects unauthenticated requests (401), empty session ids (400) and
 * unknown sessions (404). Otherwise it delegates to createStreamingResponse,
 * which validates the body and calls `stagehand.act` on the page selected by
 * `frameId` (or on the active page when no frame id is given).
 */
const actRouteHandler: RouteHandlerMethod = withErrorHandling(
  async (request, reply) => {
    const isAuthorized = await authMiddleware(request);
    if (!isAuthorized) {
      return reply
        .status(StatusCodes.UNAUTHORIZED)
        .send({ error: "Unauthorized" });
    }

    const { id: sessionId } = request.params as Api.SessionIdParams;
    if (sessionId.length === 0) {
      return reply.status(StatusCodes.BAD_REQUEST).send({
        message: "Missing session id",
      });
    }

    const sessionExists = await getSessionStore().hasSession(sessionId);
    if (!sessionExists) {
      return reply.status(StatusCodes.NOT_FOUND).send({
        message: "Session not found",
      });
    }

    return createStreamingResponse<Api.ActRequest>({
      sessionId,
      request,
      reply,
      schema: Api.ActRequestSchema,
      operation: "act",
      handler: async ({ stagehand, data }) => {
        // Pick the target page: an explicit frame id wins over the active page
        const { frameId: targetFrameId } = data;
        const page = targetFrameId
          ? stagehand.context.resolvePageByMainFrameId(targetFrameId)
          : await stagehand.context.awaitActivePage();

        if (!page) {
          throw new AppError(
            "Page not found",
            StatusCodes.INTERNAL_SERVER_ERROR,
          );
        }

        // Accept the model either as a bare name or as an object;
        // objects without a modelName fall back to "gpt-4o"
        const requestedModel = data.options?.model;
        const normalizedModel =
          typeof requestedModel === "string"
            ? { modelName: requestedModel }
            : requestedModel
              ? {
                  ...requestedModel,
                  modelName: requestedModel.modelName ?? "gpt-4o",
                }
              : undefined;

        const safeOptions = {
          ...data.options,
          model: normalizedModel,
          page,
        };

        // Separate calls for string instructions and Action objects
        const result: ActResult =
          typeof data.input === "string"
            ? await stagehand.act(data.input, safeOptions)
            : await stagehand.act(data.input as Action, safeOptions);

        return { result };
      },
    });
  },
);

/** Header, param, body and 200-response schemas for the act endpoint. */
const actRouteSchema = {
  ...Api.Operations.SessionAct,
  headers: Api.SessionHeadersSchema,
  params: Api.SessionIdParamsSchema,
  body: Api.ActRequestSchema,
  response: {
    200: Api.ActResponseSchema,
  },
} satisfies FastifyZodOpenApiSchema;

/** Route definition for `POST /sessions/:id/act`. */
const actRoute: RouteOptions = {
  url: "/sessions/:id/act",
  method: "POST",
  handler: actRouteHandler,
  schema: actRouteSchema,
};

export default actRoute;


================================================
FILE: packages/server-v3/src/routes/v1/sessions/_id/agentExecute.ts
================================================
import type { RouteHandlerMethod, RouteOptions } from "fastify";
import { StatusCodes } from "http-status-codes";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";
import { Api } from "@browserbasehq/stagehand";

import { authMiddleware } from "../../../../lib/auth.js";
import { AppError, withErrorHandling } from "../../../../lib/errorHandler.js";
import { createStreamingResponse } from "../../../../lib/stream.js";
import { getSessionStore } from "../../../../lib/sessionStoreManager.js";

/**
 * Handler for `POST /sessions/:id/agentExecute`.
 *
 * Replies 401 / 400 / 404 for failed auth, an empty session id or an unknown
 * session. Otherwise delegates to `createStreamingResponse`; the inner handler
 * resolves the page, normalizes the agent model config and runs
 * `stagehand.agent(...).execute(...)`. Any failure of that call is rethrown as
 * an `AppError` with status 422 carrying the original message.
 */
const agentExecuteRouteHandler: RouteHandlerMethod = withErrorHandling(
  async (request, reply) => {
    const isAuthorized = await authMiddleware(request);
    if (!isAuthorized) {
      return reply
        .status(StatusCodes.UNAUTHORIZED)
        .send({ error: "Unauthorized" });
    }

    const { id: sessionId } = request.params as Api.SessionIdParams;
    if (!sessionId.length) {
      return reply.status(StatusCodes.BAD_REQUEST).send({
        message: "Missing session id",
      });
    }

    const store = getSessionStore();
    const sessionExists = await store.hasSession(sessionId);
    if (!sessionExists) {
      return reply.status(StatusCodes.NOT_FOUND).send({
        message: "Session not found",
      });
    }

    return createStreamingResponse<Api.AgentExecuteRequest>({
      operation: "agentExecute",
      sessionId,
      request,
      reply,
      schema: Api.AgentExecuteRequestSchema,
      handler: async ({ stagehand, data }) => {
        const { agentConfig, executeOptions, frameId } = data;

        const targetPage = frameId
          ? stagehand.context.resolvePageByMainFrameId(frameId)
          : await stagehand.context.awaitActivePage();
        if (!targetPage) {
          throw new AppError(
            "Page not found",
            StatusCodes.INTERNAL_SERVER_ERROR,
          );
        }

        // Model may be a bare name or an object; object form without a
        // modelName falls back to "gpt-4o".
        const requestedModel = agentConfig.model;
        const resolveModel = () => {
          if (typeof requestedModel === "string") {
            return { modelName: requestedModel };
          }
          if (!requestedModel) {
            return undefined;
          }
          return {
            ...requestedModel,
            modelName: requestedModel.modelName ?? "gpt-4o",
          };
        };
        const agentOptions = {
          ...agentConfig,
          model: resolveModel(),
        };

        const { instruction, ...otherExecuteOptions } = executeOptions;
        const executeArgs = {
          instruction,
          ...otherExecuteOptions,
          page: targetPage,
        };

        try {
          const result = await stagehand
            .agent(agentOptions)
            .execute(executeArgs);
          return { result };
        } catch (err) {
          const message = err instanceof Error ? err.message : String(err);
          throw new AppError(message, StatusCodes.UNPROCESSABLE_ENTITY);
        }
      },
    });
  },
);

/** Header, param, body and 200-response schemas for the agentExecute endpoint. */
const agentExecuteRouteSchema = {
  ...Api.Operations.SessionAgentExecute,
  headers: Api.SessionHeadersSchema,
  params: Api.SessionIdParamsSchema,
  body: Api.AgentExecuteRequestSchema,
  response: {
    200: Api.AgentExecuteResponseSchema,
  },
} satisfies FastifyZodOpenApiSchema;

/** Route definition for `POST /sessions/:id/agentExecute`. */
const agentExecuteRoute: RouteOptions = {
  url: "/sessions/:id/agentExecute",
  method: "POST",
  handler: agentExecuteRouteHandler,
  schema: agentExecuteRouteSchema,
};

export default agentExecuteRoute;


================================================
FILE: packages/server-v3/src/routes/v1/sessions/_id/end.ts
================================================
import type { RouteHandlerMethod, RouteOptions } from "fastify";
import { StatusCodes } from "http-status-codes";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";
import { Api } from "@browserbasehq/stagehand";

import { authMiddleware } from "../../../../lib/auth.js";
import { withErrorHandling } from "../../../../lib/errorHandler.js";
import { error } from "../../../../lib/response.js";
import { getSessionStore } from "../../../../lib/sessionStoreManager.js";

/**
 * Handler for `POST /sessions/:id/end`.
 *
 * Replies 401 when auth fails, 400 when a non-empty body is supplied and 404
 * when the session store does not know the id. Otherwise ends the session and
 * replies `{ success: true }` with status 200.
 */
const endRouteHandler: RouteHandlerMethod = withErrorHandling(
  async (request, reply) => {
    const isAuthorized = await authMiddleware(request);
    if (!isAuthorized) {
      return error(reply, "Unauthorized", StatusCodes.UNAUTHORIZED);
    }

    // The endpoint takes no body. A missing body or an object without keys is
    // accepted; anything else (primitives, buffers, populated objects) is
    // rejected so misconfigured clients are noticed.
    const payload = (request as { body?: unknown }).body;
    const isAcceptableBody =
      payload == null ||
      (typeof payload === "object" &&
        !Buffer.isBuffer(payload) &&
        Object.keys(payload as Record<string, unknown>).length === 0);
    if (!isAcceptableBody) {
      return error(
        reply,
        "Request body must be empty",
        StatusCodes.BAD_REQUEST,
      );
    }

    const { id: sessionId } = request.params as Api.SessionIdParams;
    const store = getSessionStore();
    if (!(await store.hasSession(sessionId))) {
      return error(reply, "Session not found", StatusCodes.NOT_FOUND);
    }

    await store.endSession(sessionId);
    return reply.status(StatusCodes.OK).send({ success: true });
  },
);

/** Header, param and 200-response schemas for the end endpoint (no body schema). */
const endRouteSchema = {
  ...Api.Operations.SessionEnd,
  headers: Api.SessionHeadersSchema,
  params: Api.SessionIdParamsSchema,
  response: {
    200: Api.SessionEndResponseSchema,
  },
} satisfies FastifyZodOpenApiSchema;

/** Route definition for `POST /sessions/:id/end`. */
const endRoute: RouteOptions = {
  url: "/sessions/:id/end",
  method: "POST",
  handler: endRouteHandler,
  schema: endRouteSchema,
};

export default endRoute;


================================================
FILE: packages/server-v3/src/routes/v1/sessions/_id/extract.ts
================================================
import type { RouteHandlerMethod, RouteOptions } from "fastify";
import { StatusCodes } from "http-status-codes";
import type { ZodTypeAny } from "zod/v3";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";
import { Api } from "@browserbasehq/stagehand";

import { authMiddleware } from "../../../../lib/auth.js";
import { AppError, withErrorHandling } from "../../../../lib/errorHandler.js";
import { createStreamingResponse } from "../../../../lib/stream.js";
import { jsonSchemaToZod } from "../../../../lib/utils.js";
import { getSessionStore } from "../../../../lib/sessionStoreManager.js";

/**
 * Handler for `POST /sessions/:id/extract`.
 *
 * Replies 401 / 400 / 404 for failed auth, an empty session id or an unknown
 * session. Otherwise delegates to `createStreamingResponse`; the inner handler
 * resolves the page, normalizes the optional model option and calls
 * `stagehand.extract` with whichever of instruction / schema were supplied.
 */
const extractRouteHandler: RouteHandlerMethod = withErrorHandling(
  async (request, reply) => {
    const isAuthorized = await authMiddleware(request);
    if (!isAuthorized) {
      return reply
        .status(StatusCodes.UNAUTHORIZED)
        .send({ error: "Unauthorized" });
    }

    const { id: sessionId } = request.params as Api.SessionIdParams;
    if (!sessionId.length) {
      return reply.status(StatusCodes.BAD_REQUEST).send({
        message: "Missing session id",
      });
    }

    const store = getSessionStore();
    const sessionExists = await store.hasSession(sessionId);
    if (!sessionExists) {
      return reply.status(StatusCodes.NOT_FOUND).send({
        message: "Session not found",
      });
    }

    return createStreamingResponse<Api.ExtractRequest>({
      operation: "extract",
      sessionId,
      request,
      reply,
      schema: Api.ExtractRequestSchema,
      handler: async ({ stagehand, data }) => {
        const targetPage = data.frameId
          ? stagehand.context.resolvePageByMainFrameId(data.frameId)
          : await stagehand.context.awaitActivePage();

        if (!targetPage) {
          throw new AppError(
            "Page not found",
            StatusCodes.INTERNAL_SERVER_ERROR,
          );
        }

        // Model may be a bare name or an object; object form without a
        // modelName falls back to "gpt-4o".
        const requestedModel = data.options?.model;
        const resolveModel = () => {
          if (typeof requestedModel === "string") {
            return { modelName: requestedModel };
          }
          if (!requestedModel) {
            return undefined;
          }
          return {
            ...requestedModel,
            modelName: requestedModel.modelName ?? "gpt-4o",
          };
        };

        const extractOptions = {
          ...data.options,
          model: resolveModel(),
          page: targetPage,
        };

        const extract = stagehand.extract.bind(stagehand);

        // Pick the call shape from what the request carries: options only,
        // instruction + options, or instruction + schema + options.
        const runExtract = async (): Promise<unknown> => {
          if (!data.instruction) {
            return extract(extractOptions);
          }
          if (!data.schema) {
            return extract(data.instruction, extractOptions);
          }
          const zodSchema = jsonSchemaToZod(data.schema) as ZodTypeAny;
          return extract(data.instruction, zodSchema, extractOptions);
        };

        const result = await runExtract();
        return { result };
      },
    });
  },
);

/** Header, param, body and 200-response schemas for the extract endpoint. */
const extractRouteSchema = {
  ...Api.Operations.SessionExtract,
  headers: Api.SessionHeadersSchema,
  params: Api.SessionIdParamsSchema,
  body: Api.ExtractRequestSchema,
  response: {
    200: Api.ExtractResponseSchema,
  },
} satisfies FastifyZodOpenApiSchema;

/** Route definition for `POST /sessions/:id/extract`. */
const extractRoute: RouteOptions = {
  url: "/sessions/:id/extract",
  method: "POST",
  handler: extractRouteHandler,
  schema: extractRouteSchema,
};

export default extractRoute;


================================================
FILE: packages/server-v3/src/routes/v1/sessions/_id/navigate.ts
================================================
import type { RouteHandlerMethod, RouteOptions } from "fastify";
import { StatusCodes } from "http-status-codes";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";
import { Api } from "@browserbasehq/stagehand";

import { authMiddleware } from "../../../../lib/auth.js";
import { AppError, withErrorHandling } from "../../../../lib/errorHandler.js";
import { createStreamingResponse } from "../../../../lib/stream.js";
import { getSessionStore } from "../../../../lib/sessionStoreManager.js";

/**
 * Handler for `POST /sessions/:id/navigate`.
 *
 * Replies 401 / 400 / 404 for failed auth, an empty session id or an unknown
 * session. Otherwise delegates to `createStreamingResponse`; the inner handler
 * resolves the page (throwing a 404 `AppError` when none is found) and calls
 * `page.goto` with the requested URL and options.
 */
const navigateRouteHandler: RouteHandlerMethod = withErrorHandling(
  async (request, reply) => {
    const isAuthorized = await authMiddleware(request);
    if (!isAuthorized) {
      return reply
        .status(StatusCodes.UNAUTHORIZED)
        .send({ error: "Unauthorized" });
    }

    const { id: sessionId } = request.params as Api.SessionIdParams;
    if (!sessionId.length) {
      return reply.status(StatusCodes.BAD_REQUEST).send({
        message: "Missing session id",
      });
    }

    const store = getSessionStore();
    const sessionExists = await store.hasSession(sessionId);
    if (!sessionExists) {
      return reply.status(StatusCodes.NOT_FOUND).send({
        message: "Session not found",
      });
    }

    return createStreamingResponse<Api.NavigateRequest>({
      operation: "navigate",
      sessionId,
      request,
      reply,
      schema: Api.NavigateRequestSchema,
      handler: async ({ stagehand, data }) => {
        const { frameId, url, options } = data;

        const targetPage = frameId
          ? stagehand.context.resolvePageByMainFrameId(frameId)
          : await stagehand.context.awaitActivePage();

        if (!targetPage) {
          throw new AppError("Page not found", StatusCodes.NOT_FOUND);
        }

        return { result: await targetPage.goto(url, options) };
      },
    });
  },
);

/** Header, param, body and 200-response schemas for the navigate endpoint. */
const navigateRouteSchema = {
  ...Api.Operations.SessionNavigate,
  headers: Api.SessionHeadersSchema,
  params: Api.SessionIdParamsSchema,
  body: Api.NavigateRequestSchema,
  response: {
    200: Api.NavigateResponseSchema,
  },
} satisfies FastifyZodOpenApiSchema;

/** Route definition for `POST /sessions/:id/navigate`. */
const navigateRoute: RouteOptions = {
  url: "/sessions/:id/navigate",
  method: "POST",
  handler: navigateRouteHandler,
  schema: navigateRouteSchema,
};

export default navigateRoute;


================================================
FILE: packages/server-v3/src/routes/v1/sessions/_id/observe.ts
================================================
import type { RouteHandlerMethod, RouteOptions } from "fastify";
import { StatusCodes } from "http-status-codes";
import type { Action } from "@browserbasehq/stagehand";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";
import { Api } from "@browserbasehq/stagehand";

import { authMiddleware } from "../../../../lib/auth.js";
import { AppError, withErrorHandling } from "../../../../lib/errorHandler.js";
import { createStreamingResponse } from "../../../../lib/stream.js";
import { getSessionStore } from "../../../../lib/sessionStoreManager.js";

/**
 * Handler for `POST /sessions/:id/observe`.
 *
 * Replies 401 / 400 / 404 for failed auth, an empty session id or an unknown
 * session. Otherwise delegates to `createStreamingResponse`; the inner handler
 * resolves the page, normalizes the optional model option and calls
 * `stagehand.observe`, with the instruction when one was supplied.
 */
const observeRouteHandler: RouteHandlerMethod = withErrorHandling(
  async (request, reply) => {
    const isAuthorized = await authMiddleware(request);
    if (!isAuthorized) {
      return reply
        .status(StatusCodes.UNAUTHORIZED)
        .send({ error: "Unauthorized" });
    }

    const { id: sessionId } = request.params as Api.SessionIdParams;
    if (!sessionId.length) {
      return reply.status(StatusCodes.BAD_REQUEST).send({
        message: "Missing session id",
      });
    }

    const store = getSessionStore();
    const sessionExists = await store.hasSession(sessionId);
    if (!sessionExists) {
      return reply.status(StatusCodes.NOT_FOUND).send({
        message: "Session not found",
      });
    }

    return createStreamingResponse<Api.ObserveRequest>({
      operation: "observe",
      sessionId,
      request,
      reply,
      schema: Api.ObserveRequestSchema,
      handler: async ({ stagehand, data }) => {
        const targetPage = data.frameId
          ? stagehand.context.resolvePageByMainFrameId(data.frameId)
          : await stagehand.context.awaitActivePage();

        if (!targetPage) {
          throw new AppError(
            "Page not found",
            StatusCodes.INTERNAL_SERVER_ERROR,
          );
        }

        // Model may be a bare name or an object; object form without a
        // modelName falls back to "gpt-4o".
        const requestedModel = data.options?.model;
        const resolveModel = () => {
          if (typeof requestedModel === "string") {
            return { modelName: requestedModel };
          }
          if (!requestedModel) {
            return undefined;
          }
          return {
            ...requestedModel,
            modelName: requestedModel.modelName ?? "gpt-4o",
          };
        };

        const observeOptions = {
          ...data.options,
          model: resolveModel(),
          page: targetPage,
        };

        const result: Action[] = data.instruction
          ? await stagehand.observe(data.instruction, observeOptions)
          : await stagehand.observe(observeOptions);

        return { result };
      },
    });
  },
);

/** Header, param, body and 200-response schemas for the observe endpoint. */
const observeRouteSchema = {
  ...Api.Operations.SessionObserve,
  headers: Api.SessionHeadersSchema,
  params: Api.SessionIdParamsSchema,
  body: Api.ObserveRequestSchema,
  response: {
    200: Api.ObserveResponseSchema,
  },
} satisfies FastifyZodOpenApiSchema;

/** Route definition for `POST /sessions/:id/observe`. */
const observeRoute: RouteOptions = {
  url: "/sessions/:id/observe",
  method: "POST",
  handler: observeRouteHandler,
  schema: observeRouteSchema,
};

export default observeRoute;


================================================
FILE: packages/server-v3/src/routes/v1/sessions/_id/replay.ts
================================================
import type { RouteHandlerMethod, RouteOptions } from "fastify";
import { StatusCodes } from "http-status-codes";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";
import { Api } from "@browserbasehq/stagehand";

import { authMiddleware } from "../../../../lib/auth.js";
import { withErrorHandling } from "../../../../lib/errorHandler.js";
import { error, success } from "../../../../lib/response.js";

/**
 * Handler for `GET /sessions/:id/replay`.
 *
 * Replies 401 when auth fails. Otherwise logs a warning that replay is not
 * implemented here and responds with an empty replay (`pages: []`).
 */
const replayRouteHandler: RouteHandlerMethod = withErrorHandling(
  async (request, reply) => {
    const isAuthorized = await authMiddleware(request);
    if (!isAuthorized) {
      return error(reply, "Unauthorized", StatusCodes.UNAUTHORIZED);
    }

    reply.log.warn("Replay endpoint not implemented for local server.");

    const emptyReplay: Api.ReplayResult = { pages: [] };
    return success(reply, emptyReplay);
  },
);

/** Header, param and 200-response schemas for the replay endpoint. */
const replayRouteSchema = {
  ...Api.Operations.SessionReplay,
  headers: Api.SessionHeadersSchema,
  params: Api.SessionIdParamsSchema,
  response: {
    200: Api.ReplayResponseSchema,
  },
} satisfies FastifyZodOpenApiSchema;

/** Route definition for `GET /sessions/:id/replay`. */
const replayRoute: RouteOptions = {
  url: "/sessions/:id/replay",
  method: "GET",
  handler: replayRouteHandler,
  schema: replayRouteSchema,
};

export default replayRoute;


================================================
FILE: packages/server-v3/src/routes/v1/sessions/start.ts
================================================
import type { RouteHandler, RouteOptions } from "fastify";
import { StatusCodes } from "http-status-codes";
import Browserbase from "@browserbasehq/sdk";
import { Api } from "@browserbasehq/stagehand";
import type { SessionRetrieveResponse } from "@browserbasehq/sdk/resources/sessions/sessions";
import { type FastifyZodOpenApiSchema } from "fastify-zod-openapi";
import { z } from "zod/v4";

import { authMiddleware } from "../../../lib/auth.js";
import { withErrorHandling } from "../../../lib/errorHandler.js";
import { getModelApiKey, getOptionalHeader } from "../../../lib/header.js";
import { error, success } from "../../../lib/response.js";
import { getSessionStore } from "../../../lib/sessionStoreManager.js";
import { AISDK_PROVIDERS } from "../../../types/model.js";

/**
 * Request-body schema for `POST /sessions/start`.
 *
 * Wraps `Api.SessionStartRequestSchema` with two additions:
 *  - a preprocess step that turns `verbose` given as the string "0", "1" or
 *    "2" into the corresponding number before the base schema runs;
 *  - a refinement that reports an issue on `browser` when `browser.type` is
 *    "local" but neither `browser.cdpUrl` nor `browser.launchOptions` is set.
 */
const startBodySchema = z
  .preprocess((value) => {
    // Non-object input is passed through untouched for the base schema to reject.
    if (!value || typeof value !== "object") {
      return value;
    }
    const record = value as Record<string, unknown>;
    if (
      typeof record.verbose === "string" &&
      ["0", "1", "2"].includes(record.verbose)
    ) {
      return { ...record, verbose: Number(record.verbose) };
    }
    return value;
  }, Api.SessionStartRequestSchema)
  .superRefine((value, ctx) => {
    if (value.browser?.type === "local") {
      const hasConnect = Boolean(value.browser.cdpUrl);
      const hasLaunch = Boolean(value.browser.launchOptions);
      if (!hasConnect && !hasLaunch) {
        ctx.addIssue({
          // String literal instead of the deprecated `z.ZodIssueCode.custom`
          // (same value, "custom").
          code: "custom",
          path: ["browser"],
          message:
            "When browser.type is 'local', provide either browser.cdpUrl or browser.launchOptions.",
        });
      }
    }
  });

/**
 * Handler for `POST /sessions/start`.
 *
 * Steps, in order:
 *  1. Reject unauthenticated requests (401) and unknown `x-language` values (400).
 *  2. Require `modelName`; for `provider/model` names, require the provider
 *     to be listed in `AISDK_PROVIDERS`.
 *  3. For browserbase sessions (the default when `browser.type` is absent),
 *     require the `x-bb-api-key` header, then either retrieve the session
 *     named by `browserbaseSessionID` or create a new one.
 *  4. Register the session in the session store.
 *  5. For local sessions given `launchOptions` but no `cdpUrl`, initialize
 *     Stagehand right away so the response can carry its connect URL.
 *
 * Responds with `{ sessionId, available, cdpUrl }` on success.
 */
const startRouteHandler: RouteHandler = withErrorHandling(
  async (request, reply) => {
    if (!(await authMiddleware(request))) {
      return error(reply, "Unauthorized", StatusCodes.UNAUTHORIZED);
    }

    const sdkVersion = getOptionalHeader(request, "x-sdk-version");

    // The language header is optional, but when present it must be a known client.
    const clientLanguage = request.headers["x-language"] as string | undefined;
    if (
      clientLanguage &&
      !["typescript", "python", "playground"].includes(clientLanguage)
    ) {
      return error(
        reply,
        "Invalid client language header",
        StatusCodes.BAD_REQUEST,
      );
    }

    // Use the validated request body directly - fields come from Api.SessionStartRequestSchema
    const body = request.body as Api.SessionStartRequest;
    const {
      modelName,
      domSettleTimeoutMs,
      verbose,
      systemPrompt,
      browserbaseSessionCreateParams,
      selfHeal,
      waitForCaptchaSolves,
      browserbaseSessionID,
      experimental,
      browser,
    } = body;
    if (!modelName) {
      // No explicit status: uses error()'s default.
      // NOTE(review): confirm which status code that default is.
      return error(reply, "Missing required model name");
    }

    // TODO: Remove this after complete AISDK migration. Validation should be done stagehand-side
    if (modelName.includes("/")) {
      // Only the segment before the first "/" is inspected.
      const [providerName] = modelName.split("/", 1);
      if (!providerName) {
        return error(
          reply,
          `Invalid model: ${modelName}`,
          StatusCodes.BAD_REQUEST,
        );
      }
      if (!(AISDK_PROVIDERS as readonly string[]).includes(providerName)) {
        return error(
          reply,
          `Invalid provider: ${providerName}`,
          StatusCodes.BAD_REQUEST,
        );
      }
    }

    // Sessions are browserbase-backed unless the body says otherwise.
    const browserType = browser?.type ?? "browserbase";

    let bbApiKey: string | undefined;
    let bbProjectId: string | undefined;
    let browserbaseSessionId: string | undefined;
    let connectUrl: string | undefined;

    if (browserType === "browserbase") {
      bbApiKey = getOptionalHeader(request, "x-bb-api-key");
      bbProjectId = getOptionalHeader(request, "x-bb-project-id");

      // Only the API key is mandatory; the project id header stays optional.
      if (!bbApiKey) {
        return error(
          reply,
          "Missing required headers for browserbase sessions",
        );
      }

      const bb = new Browserbase({ apiKey: bbApiKey });

      if (browserbaseSessionID) {
        // Attach to an existing Browserbase session.
        const existing = await bb.sessions.retrieve(browserbaseSessionID);
        browserbaseSessionId = existing?.id;
        connectUrl = existing?.connectUrl;
        if (!browserbaseSessionId) {
          return error(reply, "Failed to retrieve browserbase session");
        }
        if (!connectUrl) {
          return error(reply, "Browserbase session missing connectUrl");
        }
      } else {
        // Create a new Browserbase session. A projectId in the body's create
        // params takes precedence over the x-bb-project-id header.
        const resolvedProjectId =
          browserbaseSessionCreateParams?.projectId ?? bbProjectId;
        const createPayload = {
          ...(resolvedProjectId ? { projectId: resolvedProjectId } : {}),
          ...browserbaseSessionCreateParams,
          browserSettings: {
            ...(browserbaseSessionCreateParams?.browserSettings ?? {}),
            // Default viewport applied only when the caller supplied none.
            viewport: browserbaseSessionCreateParams?.browserSettings
              ?.viewport ?? {
              width: 1288,
              height: 711,
            },
          },
          userMetadata: {
            ...(browserbaseSessionCreateParams?.userMetadata ?? {}),
            // Always written last, so it overrides any caller-supplied value.
            stagehand: "true",
          },
        } satisfies Browserbase.Sessions.SessionCreateParams;

        const created = (await bb.sessions.create(
          createPayload,
        )) as SessionRetrieveResponse;

        browserbaseSessionId = created?.id;
        connectUrl = created?.connectUrl;
        if (!browserbaseSessionId) {
          return error(reply, "Failed to create browserbase session");
        }
        if (!connectUrl) {
          return error(reply, "Browserbase session missing connectUrl");
        }
      }
    }

    const sessionStore = getSessionStore();

    // For local browsers the connect URL is the caller-supplied browser.cdpUrl
    // (undefined when only launchOptions were provided).
    if (browserType === "local") {
      connectUrl = browser?.cdpUrl;
    }

    const session = await sessionStore.startSession({
      browserType,
      connectUrl,
      browserbaseSessionID:
        browserType === "browserbase"
          ? (browserbaseSessionId ?? browserbaseSessionID)
          : undefined,
      browserbaseApiKey: bbApiKey,
      browserbaseProjectId: bbProjectId,
      modelName,
      domSettleTimeoutMs,
      verbose,
      systemPrompt,
      browserbaseSessionCreateParams,
      selfHeal,
      waitForCaptchaSolves,
      clientLanguage,
      sdkVersion,
      experimental,
      // cdpUrl is listed first, so a cdpUrl key inside launchOptions would win.
      localBrowserLaunchOptions:
        browserType === "local" && (browser?.launchOptions || browser?.cdpUrl)
          ? {
              cdpUrl: browser?.cdpUrl,
              ...(browser?.launchOptions ?? {}),
            }
          : undefined,
    });

    // For local browsers with launchOptions (no explicit cdpUrl), eagerly
    // initialize the browser so we can return the actual CDP URL
    let finalCdpUrl = connectUrl ?? session.cdpUrl ?? "";
    if (browserType === "local" && browser?.launchOptions && !browser?.cdpUrl) {
      const modelApiKey = getModelApiKey(request);
      try {
        const stagehand = await sessionStore.getOrCreateStagehand(
          session.sessionId,
          { modelApiKey },
        );
        finalCdpUrl = stagehand.connectURL();
      } catch (err) {
        // Log a summary of the launch options (argument count and a
        // has-user-data-dir flag rather than their full values), then rethrow.
        request.log.error(
          {
            err,
            sessionId: session.sessionId,
            browserType,
            chromePathEnv: process.env.CHROME_PATH,
            launchOptions: {
              executablePath: browser.launchOptions.executablePath,
              argsCount: browser.launchOptions.args?.length ?? 0,
              headless: browser.launchOptions.headless,
              hasUserDataDir: Boolean(browser.launchOptions.userDataDir),
              port: browser.launchOptions.port,
              connectTimeoutMs: browser.launchOptions.connectTimeoutMs,
            },
          },
          "Failed to initialize local browser session in /v1/sessions/start",
        );
        throw err;
      }
    }

    return success(reply, {
      sessionId: session.sessionId,
      available: session.available,
      cdpUrl: finalCdpUrl,
    });
  },
);

/**
 * Header, body and 200-response schemas for the start endpoint. The body uses
 * the locally extended `startBodySchema` rather than the plain API schema.
 */
const startRouteSchema = {
  ...Api.Operations.SessionStart,
  headers: Api.SessionHeadersSchema,
  body: startBodySchema,
  response: {
    200: Api.SessionStartResponseSchema,
  },
} satisfies FastifyZodOpenApiSchema;

/** Route definition for `POST /sessions/start`. */
const startRoute: RouteOptions = {
  url: "/sessions/start",
  method: "POST",
  handler: startRouteHandler,
  schema: startRouteSchema,
};

export default startRoute;


================================================
FILE: packages/server-v3/src/sea-entry.ts
================================================
import { __internalMaybeRunShutdownSupervisorFromArgv } from "@browserbasehq/stagehand";

// Entry point for the SEA binary: when launched with --supervisor it runs only
// the shutdown supervisor; otherwise it loads the stagehand server.

// Drop the executable path. If what follows is not already a flag, treat it as
// a script path and drop that as well so the supervisor sees flags first.
const cliArgs = process.argv.slice(1);
const startsWithFlag = cliArgs[0]?.startsWith("--");
const supervisorArgs = startsWithFlag ? cliArgs : cliArgs.slice(1);

const ranSupervisor =
  __internalMaybeRunShutdownSupervisorFromArgv(supervisorArgs);

if (!ranSupervisor) {
  // Not a supervisor launch: start the server and exit non-zero if the module
  // fails to load.
  void import("./server.js").catch((err) => {
    console.error("Failed to start server:", err);
    process.exit(1);
  });
}


================================================
FILE: packages/server-v3/src/server.ts
================================================
import { randomUUID } from "crypto";

import cors from "@fastify/cors";
import fastify from "fastify";
import metricsPlugin from "fastify-metrics";
import fastifySwagger from "@fastify/swagger";
import fastifySwaggerUI from "@fastify/swagger-ui";
import {
  fastifyZodOpenApiPlugin,
  fastifyZodOpenApiTransformers,
  serializerCompiler,
  validatorCompiler,
  type FastifyZodOpenApiTypeProvider,
  RequestValidationError,
  ResponseSerializationError,
} from "fastify-zod-openapi";
import { StatusCodes } from "http-status-codes";

import { logging } from "./lib/logging/index.js";
import {
  destroySessionStore,
  initializeSessionStore,
} from "./lib/sessionStoreManager.js";
import healthcheckRoute from "./routes/healthcheck.js";
import readinessRoute, { setReady, setUnready } from "./routes/readiness.js";
import actRoute from "./routes/v1/sessions/_id/act.js";
import agentExecuteRoute from "./routes/v1/sessions/_id/agentExecute.js";
import endRoute from "./routes/v1/sessions/_id/end.js";
import extractRoute from "./routes/v1/sessions/_id/extract.js";
import navigateRoute from "./routes/v1/sessions/_id/navigate.js";
import observeRoute from "./routes/v1/sessions/_id/observe.js";
import replayRoute from "./routes/v1/sessions/_id/replay.js";
import startRoute from "./routes/v1/sessions/start.js";

// Timing for graceful shutdown, in milliseconds.
const MS_PER_SECOND = 1000;
// Delay between marking the server unready and starting to close it.
const READY_WAIT_PERIOD = 10 * MS_PER_SECOND;
// Upper bound on the close phase before the process is force-exited.
const GRACEFUL_SHUTDOWN_PERIOD = 30 * MS_PER_SECOND;

// Pretty-printed logs are for local development only, never in CI.
const isDevelopment = process.env.NODE_ENV === "development";
const usePrettyLogs = isDevelopment && !process.env.CI;

/**
 * The Fastify application instance.
 *
 * Built-in request logging is disabled, each request gets a random UUID as its
 * id, and the logger emits the level as its label. Log level is "info" in
 * production and "trace" otherwise; `pino-pretty` is used as transport only
 * when `usePrettyLogs` is set.
 */
const app = fastify({
  return503OnClosing: false,

  disableRequestLogging: true,

  genReqId: () => randomUUID(),

  logger: {
    level: process.env.NODE_ENV === "production" ? "info" : "trace",

    formatters: {
      level: (label: string) => ({ level: label }),
    },

    ...(usePrettyLogs
      ? {
          transport: {
            target: "pino-pretty",
            options: {
              colorize: true,
              ignore: "pid,hostname",
            },
          },
        }
      : {}),
  },
});

/** The application's logger, exported for use outside request handlers. */
export const logger = app.log;

// Some clients always send `Content-Type: application/json`, even on requests
// that carry no body (e.g. /end). Treat a zero-length JSON body as `{}` and
// hand everything else to Fastify's default JSON parser.
const defaultJsonParser = app.getDefaultJsonParser("error", "error");
app.addContentTypeParser<string>(
  "application/json",
  { parseAs: "string" },
  (request, body, done) => {
    const isEmptyBody =
      body === "" || (Buffer.isBuffer(body) && body.length === 0);

    if (!isEmptyBody) {
      void defaultJsonParser(request, body, done);
      return;
    }

    done(null, {});
  },
);

// Last-resort process-level handlers: log the failure through the app logger.
// Neither handler exits the process.
process.on("uncaughtException", (error) => {
  app.log.error(error, "Uncaught Exception:");
});

process.on("unhandledRejection", (reason) => {
  // The logger only uses arguments after the message for printf-style
  // placeholders, so extra console-style arguments are dropped. Anything that
  // should reach the log has to be in the leading object.
  if (reason instanceof Error) {
    app.log.error(reason, "Unhandled Rejection at:");
    return;
  }

  // Non-Error rejections (strings, plain objects, ...): keep the raw value as
  // a structured field, since String(reason) alone can collapse to
  // "[object Object]".
  app.log.error(
    { err: new Error(String(reason)), reason },
    "Unhandled Rejection at:",
  );
});

// Graceful shutdown handler

// Promise of the shutdown currently in progress, if any. Lets repeated signals
// (SIGTERM followed by SIGINT, or a second Ctrl+C) join the running shutdown
// instead of starting an overlapping one.
let shutdownInFlight: Promise<void> | undefined;

/**
 * Runs the shutdown sequence once:
 *  1. mark the server unready and wait READY_WAIT_PERIOD;
 *  2. arm a timer that force-exits with code 1 after GRACEFUL_SHUTDOWN_PERIOD;
 *  3. close the Fastify app, then destroy the session store;
 *  4. clear the timer and exit with code 0.
 */
const runShutdownSequence = async (): Promise<void> => {
  app.log.info("gracefulShutdown");

  setUnready();

  await new Promise((resolve) => setTimeout(resolve, READY_WAIT_PERIOD));

  const timeout = setTimeout(() => {
    app.log.warn("forcefully shutting down after 30 seconds");
    process.exit(1);
  }, GRACEFUL_SHUTDOWN_PERIOD);

  // The watchdog timer must not itself keep the event loop alive.
  timeout.unref();

  await app.close();
  await destroySessionStore();
  clearTimeout(timeout);

  app.log.info("gracefulShutdown complete");
  process.exit(0);
};

/**
 * Starts graceful shutdown, or returns the promise of the shutdown already in
 * progress so the sequence runs at most once per process.
 *
 * @returns a promise that rejects if closing the app or destroying the session
 *   store fails; on success the process exits before it settles.
 */
const gracefulShutdown = (): Promise<void> => {
  if (shutdownInFlight === undefined) {
    shutdownInFlight = runShutdownSequence();
  }
  return shutdownInFlight;
};

// Both termination signals trigger the same graceful shutdown; a failure of
// the shutdown itself is logged.
for (const signal of ["SIGTERM", "SIGINT"] as const) {
  process.on(signal, () => {
    gracefulShutdown().catch((err: unknown) => {
      app.log.error(err, "error gracefully shutting down");
    });
  });
}

/**
 * Configures and starts the HTTP server.
 *
 * In order: registers CORS (development only), installs the Zod/OpenAPI
 * validator and serializer compilers, registers the OpenAPI plugins (Swagger
 * UI in development only), installs the schema-error formatter and the global
 * error handler, registers metrics, initializes the session store, mounts the
 * session routes under `/v1` and the health/readiness routes at the root,
 * then listens on `0.0.0.0` at `PORT` (default 3000) and marks the server
 * ready. Any failure is printed and the process exits with code 1.
 */
const start = async () => {
  try {
    if (process.env.NODE_ENV === "development") {
      await app.register(cors, {
        origin: ["http://localhost:3000"],
        methods: ["GET", "POST", "PUT", "DELETE", "OPTIONS"],
        allowedHeaders: ["*"],
        credentials: true,
      });
    }

    app.setValidatorCompiler(validatorCompiler);
    app.setSerializerCompiler(serializerCompiler);

    await app.register(fastifyZodOpenApiPlugin);

    await app.register(fastifySwagger, {
      openapi: {
        info: {
          title: "Stagehand API",
          version: "3.0.5",
        },
        openapi: "3.1.0",
      },
      ...fastifyZodOpenApiTransformers,
    });

    // Only register Swagger UI in development - SEA binaries can't load static files
    if (process.env.NODE_ENV === "development") {
      await app.register(fastifySwaggerUI, {
        routePrefix: "/documentation",
      });
    }

    // Log the Zod issues behind a request-validation failure and replace them
    // with a generic "<part> validation failed" error.
    app.setSchemaErrorFormatter(function (errors, dataVar) {
      const zodIssues = errors
        .filter((err) => err instanceof RequestValidationError)
        .map((err) => err.params.issue);
      this.log.warn({ dataVar, zodIssues }, "request validation failed");
      return new Error(`${dataVar} validation failed`);
    });

    // Global error handler, checked in this order: request validation errors
    // (400 with the Zod issues), response serialization errors (500), then
    // everything else.
    app.setErrorHandler((error, request, reply) => {
      if ((error as { validation?: unknown }).validation) {
        const zodIssues = (error as { validation: unknown[] }).validation
          .filter((err) => err instanceof RequestValidationError)
          .map((err) => (err as RequestValidationError).params.issue);

        request.log.warn({ zodIssues }, "request validation failed");
        return reply.status(StatusCodes.BAD_REQUEST).send({
          error: "Request validation failed",
          issues: zodIssues,
        });
      }

      if (error instanceof ResponseSerializationError) {
        request.log.error({ err: error }, "response serialization failed");
        return reply
          .status(StatusCodes.INTERNAL_SERVER_ERROR)
          .send({ error: "Response validation failed" });
      }

      const errorMessage =
        error instanceof Error ? error.message : String(error);
      request.log.error(`Server error: ${errorMessage}`);

      // Use the error's own statusCode when it has one, else 500.
      const statusCode =
        (error as { statusCode?: number }).statusCode ??
        StatusCodes.INTERNAL_SERVER_ERROR;

      // For a 500 the real message is replaced with a generic one in the
      // response; it is still logged above.
      reply.status(statusCode).send({
        error:
          statusCode === Number(StatusCodes.INTERNAL_SERVER_ERROR)
            ? "Internal Server Error"
            : errorMessage,
        statusCode,
      });
    });

    await app.register(metricsPlugin, {
      defaultMetrics: {
        enabled: true,
        prefix: "stagehand_api_",
      },
      routeMetrics: {
        overrides: {
          histogram: {
            name: "stagehand_api_http_request_duration_seconds",
          },
          summary: {
            name: "stagehand_api_http_request_summary_seconds",
          },
        },
      },
    });

    initializeSessionStore();

    const appWithTypes = app.withTypeProvider<FastifyZodOpenApiTypeProvider>();

    // All session routes are mounted under the /v1 prefix.
    await appWithTypes.register(
      (instance, _opts, done) => {
        instance.route(actRoute);
        instance.route(endRoute);
        instance.route(extractRoute);
        instance.route(navigateRoute);
        instance.route(observeRoute);
        instance.route(replayRoute);
        instance.route(startRoute);
        instance.route(agentExecuteRoute);
        done();
      },
      { prefix: "/v1" },
    );

    // NOTE(review): logging(app) runs after the /v1 routes are registered;
    // confirm whatever it installs is meant to apply to those routes as well.
    logging(app);

    // Register health and readiness routes at the root level
    appWithTypes.route(healthcheckRoute);
    appWithTypes.route(readinessRoute);
    await app.ready();

    await app.listen({
      host: "0.0.0.0",
      port: parseInt(process.env.PORT ?? "3000", 10),
    });
    console.log("Routes registered:", app.printRoutes());

    // Mark the server as ready after it's started
    setReady();
  } catch (err) {
    console.error("Failed to start server:", err);
    process.exit(1);
  }
};

// Kick off startup; the extra catch covers any rejection that escapes start().
start().catch((err: unknown) => {
  console.error("Failed to start server:", err);
  process.exit(1);
});


================================================
FILE: packages/server-v3/src/types/error.ts
================================================
import { StatusCodes } from "http-status-codes";

import { AppError } from "../lib/errorHandler.js";

/** AppError with the message `Unknown model: <model>` and status 400 (BAD_REQUEST). */
export class UnknownModelError extends AppError {
  constructor(model: string) {
    const message = `Unknown model: ${model}`;
    super(message, StatusCodes.BAD_REQUEST);
  }
}
/** AppError with the message `Invalid provider: <provider>` and status 400 (BAD_REQUEST). */
export class InvalidProviderError extends AppError {
  constructor(provider: string) {
    const message = `Invalid provider: ${provider}`;
    super(message, StatusCodes.BAD_REQUEST);
  }
}

/** AppError with the message `Invalid model: <model>` and status 400 (BAD_REQUEST). */
export class InvalidModelError extends AppError {
  constructor(model: string) {
    const message = `Invalid model: ${model}`;
    super(message, StatusCodes.BAD_REQUEST);
  }
}

/** AppError with the fixed message "Unauthorized" and status 401 (UNAUTHORIZED). */
export class UnauthorizedError extends AppError {
  constructor() {
    const message = "Unauthorized";
    super(message, StatusCodes.UNAUTHORIZED);
  }
}

/** AppError with the message `Missing required header: <header>` and status 400 (BAD_REQUEST). */
export class MissingHeaderError extends AppError {
  constructor(header: string) {
    const message = `Missing required header: ${header}`;
    super(message, StatusCodes.BAD_REQUEST);
  }
}

/**
 * AppError with the message `Invalid API key for provider: <provider>`.
 * Note that it is reported as 400 (BAD_REQUEST), not 401.
 */
export class InvalidAPIKeyError extends AppError {
  constructor(provider: string) {
    const message = `Invalid API key for provider: ${provider}`;
    super(message, StatusCodes.BAD_REQUEST);
  }
}

/** AppError with a fixed "session is not currently active" message and status 409 (CONFLICT). */
export class AttemptedCloseOnNonActiveSessionError extends AppError {
  constructor() {
    const message = "Attempted to close session that is not currently active";
    super(message, StatusCodes.CONFLICT);
  }
}

/**
 * Loose structural view of an error value, listing every field that
 * `BrowserbaseSDKError` probes for a message or a status code.
 * All fields are optional because the value being inspected is `unknown`.
 */
interface BrowserbaseError {
  /** Status code candidate, checked first. */
  status?: number;
  /** Status code candidate, checked second. */
  statusCode?: number;
  /** Message candidate, checked first. */
  message?: string;
  /** Nested response object; supplies fallback status and message. */
  response?: {
    /** Status code candidate, checked last. */
    status?: number;
    data?: {
      /** Message candidate, used when the top-level `message` is empty. */
      message?: string;
    };
  };
}

/**
 * Wraps an arbitrary caught value as an `AppError`.
 *
 * Message resolution: `error.message`, then `error.response.data.message`,
 * then `defaultMessage`. Status resolution: `error.status`, then
 * `error.statusCode`, then `error.response.status`, then 400 (BAD_REQUEST).
 * Status codes of 500 and above are flagged as internal via the third
 * `AppError` argument.
 *
 * Note: when the resolved message contains "is not running", the constructor
 * throws `AttemptedCloseOnNonActiveSessionError` instead of completing.
 *
 * @param error - The caught value. May be anything, including `null`,
 *   `undefined`, or a primitive.
 * @param defaultMessage - Message used when `error` carries no usable one.
 * @throws AttemptedCloseOnNonActiveSessionError when the resolved message
 *   contains "is not running".
 */
export class BrowserbaseSDKError extends AppError {
  constructor(error: unknown, defaultMessage: string) {
    // Destructuring null/undefined throws a TypeError, which would hide the
    // failure being wrapped; fall back to an empty object instead.
    const browserbaseError = (error ?? {}) as BrowserbaseError;
    const {
      message: errMessage,
      status,
      statusCode: errStatusCode,
      response,
    } = browserbaseError;

    let message = defaultMessage;
    let finalStatusCode = StatusCodes.BAD_REQUEST;

    // Extract message from error. Only non-empty strings are accepted so the
    // `includes` check below can never run against a non-string value.
    const responseMessage = response?.data?.message;
    if (typeof errMessage === "string" && errMessage) {
      message = errMessage;
    } else if (typeof responseMessage === "string" && responseMessage) {
      message = responseMessage;
    }

    // Extract status code from error
    if (status && typeof status === "number") {
      finalStatusCode = status as StatusCodes;
    } else if (errStatusCode && typeof errStatusCode === "number") {
      finalStatusCode = errStatusCode as StatusCodes;
    } else if (response?.status && typeof response.status === "number") {
      finalStatusCode = response.status as StatusCodes;
    }

    // Check for specific session error
    if (message.includes("is not running")) {
      throw new AttemptedCloseOnNonActiveSessionError();
    }

    // Mark 5xx errors as internal to sanitize sensitive details
    const isInternal =
      Number(finalStatusCode) >= Number(StatusCodes.INTERNAL_SERVER_ERROR);

    super(message, finalStatusCode, isInternal);
  }
}


================================================
FILE: packages/server-v3/src/types/fastify.d.ts
================================================
import "fastify";

// Module augmentation: adds a `metrics` property to Fastify's request type.
declare module "fastify" {
  interface FastifyRequest {
    /** Per-request metrics data attached to the request object. */
    metrics: {
      // NOTE(review): presumably the request start timestamp; the unit and
      // the code that sets it are not visible from this declaration — confirm.
      startTime: number;
    };
  }
}


================================================
FILE: packages/server-v3/src/types/model.ts
================================================
/**
 * List of provider name strings. Declared `as const` so every entry keeps its
 * literal type and the array is readonly.
 * NOTE(review): presumably the providers reachable through the AI SDK —
 * confirm against the code that consumes this list.
 */
export const AISDK_PROVIDERS = [
  "openai",
  "anthropic",
  "google",
  "xai",
  "azure",
  "groq",
  "cerebras",
  "togetherai",
  "mistral",
  "deepseek",
  "perplexity",
  "ollama",
  "vertex",
  "bedrock",
] as const;
/** Union of the string literals listed in `AISDK_PROVIDERS`. */
export type AISDKProvider = (typeof AISDK_PROVIDERS)[number];

/**
 * String-literal union of the model names treated as "legacy".
 * NOTE(review): "legacy" presumably refers to bare model names without a
 * provider prefix — confirm against the model-resolution code.
 */
export type LegacyModel =
  | "gpt-4o"
  | "gpt-4o-mini"
  | "gpt-4o-2024-08-06"
  | "gpt-4o-2024-05-13"
  | "cerebras-llama-3.3-70b"
  | "cerebras-llama-3.1-8b"
  | "o1-mini"
  | "o1-preview"
  | "o3-mini"
  | "gpt-4.5-preview"
  | "groq-llama-3.3-70b-specdec"
  | "groq-llama-3.3-70b-versatile"
  | "gemini-1.5-flash"
  | "gemini-1.5-pro"
  | "gemini-1.5-flash-8b"
  | "gemini-2.0-flash-lite"
  | "gemini-2.0-flash"
  | "gemini-2.5-pro-preview-03-25"
  | "gemini-2.5-flash-preview-04-17";

/**
 * String-literal union of legacy provider names.
 * NOTE(review): `LegacyModel` also lists `cerebras-` and `groq-` prefixed
 * models, which have no matching entry here — confirm whether that is intended.
 */
export type LegacyProvider = "openai" | "anthropic" | "google";


================================================
FILE: packages/server-v3/src/types/rrweb.ts
================================================
/**
 * Recursive tree node: each node may carry child nodes of the same shape.
 * NOTE(review): presumably mirrors rrweb's serialized DOM node format —
 * confirm. The name shadows the global DOM `Node` type inside importing modules.
 */
export interface Node {
  /** Node kind, as a string. */
  type: string;
  /** Tag name, when present. */
  tagName?: string;
  /** Attribute name → value map, when present. */
  attributes?: Record<string, string>;
  /** Nested child nodes, when present. */
  childNodes?: Node[];
  /** Text content, when present. */
  textContent?: string;
  /** Numeric node identifier. */
  id: number;
}

/**
 * A recorded event carrying a node tree.
 * NOTE(review): presumably an rrweb recording event — confirm. The name
 * shadows the global DOM `Event` type inside importing modules.
 */
export interface Event {
  /** Numeric event type. */
  type: number;
  /*
  The data object is different for each event type
  but we're only accessing it when the data follows
  this structure, so we can just type this way.
  */
  data: { node: Node };
  /** Session identifier, when present. */
  sessionId?: string;
  /** Event timestamp. */
  timestamp: Date;
  /** Identifier of the associated action. */
  actionId: string;
}


================================================
FILE: packages/server-v3/test/integration/api-server-cache.test.ts
================================================
import assert from "node:assert/strict";
import { after, before, describe, it } from "node:test";

import {
  assertFetchOk,
  assertFetchStatus,
  createSession,
  endSession,
  fetchWithContext,
  getBaseUrl,
  getHeaders,
  HTTP_OK,
  navigateSession,
} from "./utils.js";

// One session is created up front and reused by every test in this file;
// extract is read-only, so sharing the session across tests is safe.
let sessionId: string;

before(async () => {
  const headers = getHeaders("3.0.0");
  sessionId = await createSession(headers);

  const navigation = await navigateSession(
    sessionId,
    "https://example.com",
    headers,
  );
  assert.equal(navigation.status, HTTP_OK, "Navigate should succeed");
});

after(async () => {
  const headers = getHeaders("3.0.0");
  await endSession(sessionId, headers);
});

// ---------------------------------------------------------------------------
// Helpers
// ---------------------------------------------------------------------------

/** Builds the extract endpoint URL for the shared session. */
function extractUrl() {
  const base = getBaseUrl();
  return base + "/v1/sessions/" + sessionId + "/extract";
}

/** Serializes an extract request body holding only the given instruction. */
function extractBody(instruction = "extract the page title") {
  const payload = { instruction };
  return JSON.stringify(payload);
}

// ---------------------------------------------------------------------------
// browserbase-cache-bypass request header
// ---------------------------------------------------------------------------

describe("browserbase-cache-bypass request header", () => {
  it("request with bypass header does not return cache HIT", async () => {
    // Regular request headers plus the explicit cache-bypass flag.
    const bypassHeaders = {
      ...getHeaders("3.0.0"),
      "browserbase-cache-bypass": "true",
    };

    const ctx = await fetchWithContext(extractUrl(), {
      method: "POST",
      headers: bypassHeaders,
      body: extractBody(),
    });

    assertFetchStatus(ctx, HTTP_OK, "Extract with bypass should succeed");
    assertFetchOk(ctx.body !== null, "Response should have body", ctx);

    // A missing header is acceptable here; only an explicit HIT is a failure.
    assert.notEqual(
      ctx.headers.get("browserbase-cache-status"),
      "HIT",
      "A bypassed request must not return a cache HIT",
    );
  });
});

// ---------------------------------------------------------------------------
// browserbase-cache-status response header
// ---------------------------------------------------------------------------

describe("browserbase-cache-status response header", () => {
  // Sends a plain (non-bypassed) extract request against the shared session.
  const postExtract = (body: string) =>
    fetchWithContext(extractUrl(), {
      method: "POST",
      headers: getHeaders("3.0.0"),
      body,
    });

  it("returns HIT or MISS when the header is present", async () => {
    const ctx = await postExtract(extractBody());
    assertFetchStatus(ctx, HTTP_OK, "Extract should succeed");

    // The header is optional; its value is only validated when it is sent.
    const cacheStatus = ctx.headers.get("browserbase-cache-status");
    if (cacheStatus === null) {
      return;
    }
    assert.ok(
      cacheStatus === "HIT" || cacheStatus === "MISS",
      `browserbase-cache-status must be HIT or MISS, got: ${cacheStatus}`,
    );
  });

  it("returns HIT on a repeated identical request when caching is active", async () => {
    const body = extractBody("count the number of links");

    // Warm the cache with a first request.
    const first = await postExtract(body);
    assertFetchStatus(first, HTTP_OK, "First extract should succeed");

    // Repeat the identical request; it should be served from the cache when
    // server-side caching is enabled.
    const second = await postExtract(body);
    assertFetchStatus(second, HTTP_OK, "Second extract should succeed");

    const cacheStatus = second.headers.get("browserbase-cache-status");
    if (cacheStatus === null) {
      return;
    }
    assert.equal(
      cacheStatus,
      "HIT",
      "Repeated identical request should be a cache HIT",
    );
  });
});


================================================
FILE: packages/server-v3/test/integration/utils.ts
================================================
import fs from "node:fs";
import path from "node:path";
import { chromium } from "playwright";

// =============================================================================
// HTTP Status Codes
// =============================================================================

// Numeric HTTP status codes exported as named constants so tests can compare
// against them by name.
export const HTTP_OK = 200;
export const HTTP_BAD_REQUEST = 400;
export const HTTP_NOT_FOUND = 404;
export const HTTP_GONE = 410;
export const HTTP_UNPROCESSABLE_ENTITY = 422;
export const HTTP_INTERNAL_SERVER_ERROR = 500;

// =============================================================================
// Timing Constants
// =============================================================================

// Wait duration in milliseconds.
// NOTE(review): presumably how long tests pause after closing a session;
// no usage is visible in this file — confirm with callers.
export const SESSION_CLOSE_WAIT_MS = 2000;

// =============================================================================
// Environment Variables
// =============================================================================

// Environment variables read once at module load; each is `string | undefined`.
// Use requireEnv() where a value is mandatory.
export const {
  STAGEHAND_API_URL,
  OPENAI_API_KEY,
  GEMINI_API_KEY,
  ANTHROPIC_API_KEY,
} = process.env;

// =============================================================================
// Utility Functions
// =============================================================================

/**
 * Returns `value` when it is a non-empty string.
 *
 * @param name - Variable name, used only in the error message.
 * @param value - The value read from the environment.
 * @throws Error when `value` is undefined or empty.
 */
export function requireEnv(name: string, value: string | undefined): string {
  if (value) {
    return value;
  }
  throw new Error(`Missing required environment variable: ${name}`);
}

/** Base URL of the API under test: STAGEHAND_API_URL when set, otherwise the local default. */
export function getBaseUrl(): string {
  const localDefault = "http://127.0.0.1:3107";
  return STAGEHAND_API_URL ?? localDefault;
}

// =============================================================================
// Header Generators
// =============================================================================

/**
 * Builds the request headers sent with every API call.
 *
 * @param sdkVersion - Value for the `x-sdk-version` header.
 * @param language - Value for the `x-language` header.
 * @throws Error when OPENAI_API_KEY is not set (via requireEnv).
 */
export function getHeaders(
  sdkVersion: string,
  language: string = "typescript",
): Record<string, string> {
  const modelApiKey = requireEnv("OPENAI_API_KEY", OPENAI_API_KEY);
  const headers: Record<string, string> = {
    "Content-Type": "application/json",
    "x-model-api-key": modelApiKey,
    "x-language": language,
    "x-sdk-version": sdkVersion,
  };
  return headers;
}

// =============================================================================
// Session Management
// =============================================================================

/** Expected JSON shape of the `/v1/sessions/start` response body. */
export interface StartSessionResponse {
  /** Whether the server reported success. */
  success: boolean;
  /** Optional message from the server. */
  message?: string;
  /** Session details; optional in the response shape. */
  data?: {
    /** Identifier of the created session. */
    sessionId: string;
    /** CDP endpoint URL for the session's browser. */
    cdpUrl: string;
    /** Availability flag; createSessionWithCdp rejects the session when falsy. */
    available: boolean;
  };
}

// Pause applied after a session has been created, before it is handed out.
const SESSION_READY_DELAY_MS = 250;

// Connect timeout for the local browser. A positive, finite
// STAGEHAND_TEST_LOCAL_CONNECT_TIMEOUT_MS overrides the 60 second default.
const LOCAL_CONNECT_TIMEOUT_MS = (() => {
  const fallbackMs = 60_000;
  const fromEnv = Number(process.env.STAGEHAND_TEST_LOCAL_CONNECT_TIMEOUT_MS);
  if (!Number.isFinite(fromEnv) || fromEnv <= 0) {
    return fallbackMs;
  }
  return fromEnv;
})();

/** Identifiers returned by createSessionWithCdp for a started session. */
export interface SessionInfo {
  /** Identifier of the created session. */
  sessionId: string;
  /** CDP endpoint URL for the session's browser. */
  cdpUrl: string;
}

/**
 * Builds the `browser` section of a session-start payload for a local,
 * headless browser.
 *
 * @throws Error when CHROME_PATH is set but missing on disk, or when no
 *   Chrome executable can be located at all.
 */
function createLocalBrowserBody() {
  // Lookup order: CHROME_PATH (must exist when set), then Playwright's Chromium.
  function resolveChromePath(): string {
    const fromEnv = process.env.CHROME_PATH;
    if (fromEnv) {
      if (!fs.existsSync(fromEnv)) {
        throw new Error(`CHROME_PATH does not exist: ${fromEnv}`);
      }
      return fromEnv;
    }

    const bundled = chromium.executablePath();
    if (!bundled || !fs.existsSync(bundled)) {
      throw new Error(
        "Unable to locate a Chrome executable. Set CHROME_PATH in the test environment.",
      );
    }
    return bundled;
  }

  const launchOptions = {
    headless: true,
    executablePath: resolveChromePath(),
    // The sandbox is disabled only when the CI environment variable is set.
    args: process.env.CI ? ["--no-sandbox"] : undefined,
    connectTimeoutMs: LOCAL_CONNECT_TIMEOUT_MS,
  };

  return {
    browser: {
      type: "local",
      launchOptions,
    },
  };
}

// Built once at module load; importing this module throws if no Chrome is found.
export const LOCAL_BROWSER_BODY = createLocalBrowserBody();

/**
 * Builds a multi-line diagnostics string describing the browser launch
 * environment, for inclusion in session-creation error messages.
 *
 * Reports the CHROME_PATH and CI environment variables, the user data dir
 * (plus the contents of `chrome-out.log` / `chrome-err.log` inside it when
 * they exist) and, when `launchOptions` is given, each launch option.
 *
 * Log reads are best-effort: a log that exists but cannot be read is reported
 * as `<unreadable: ...>` instead of throwing, so this helper never replaces
 * the error it is meant to explain.
 *
 * @param launchOptions - Launch options that were sent to the server, if any.
 * @returns The diagnostics lines joined with "\n".
 */
function readLaunchDiagnostics(launchOptions?: {
  executablePath?: string;
  args?: string[];
  headless?: boolean;
  userDataDir?: string;
  port?: number;
  connectTimeoutMs?: number;
}): string {
  const userDataDir = launchOptions?.userDataDir;
  const diagnostics: string[] = [
    "--- launch diagnostics ---",
    `CHROME_PATH env: ${process.env.CHROME_PATH ?? "<unset>"}`,
    `CI env: ${process.env.CI ?? "<unset>"}`,
    `userDataDir: ${userDataDir ?? "<auto>"}`,
  ];

  // Appends a log file's contents under the given heading, if the file exists.
  const appendLog = (heading: string, logPath: string): void => {
    if (!fs.existsSync(logPath)) {
      return;
    }
    try {
      const contents = fs.readFileSync(logPath, "utf8");
      diagnostics.push(`--- ${heading} ---\n${contents}`);
    } catch (err) {
      // The path may be a directory, unreadable, or removed since the check.
      const reason = err instanceof Error ? err.message : String(err);
      diagnostics.push(`--- ${heading} ---\n<unreadable: ${reason}>`);
    }
  };

  if (!userDataDir) {
    diagnostics.push(
      "chrome stdout/stderr logs unavailable (profile dir auto-managed by server launch)",
    );
  } else {
    const dirExists = fs.existsSync(userDataDir);
    diagnostics.push(`userDataDir exists: ${dirExists}`);
    if (dirExists) {
      appendLog("chrome stdout", path.join(userDataDir, "chrome-out.log"));
      appendLog("chrome stderr", path.join(userDataDir, "chrome-err.log"));
    }
  }

  if (launchOptions) {
    const { executablePath } = launchOptions;
    diagnostics.push(
      `launch.executablePath: ${executablePath ?? "<unset>"}`,
      `launch.executablePath exists: ${
        executablePath ? fs.existsSync(executablePath) : false
      }`,
      `launch.headless: ${String(launchOptions.headless)}`,
      `launch.args: ${JSON.stringify(launchOptions.args ?? [])}`,
      `launch.port: ${launchOptions.port ?? "<auto>"}`,
      `launch.connectTimeoutMs: ${launchOptions.connectTimeoutMs ?? "<default>"}`,
    );
  }
  return diagnostics.join("\n");
}

/** Starts a session and returns only its id; see createSessionWithCdp for the CDP URL. */
export async function createSession(
  headers: Record<string, string>,
): Promise<string> {
  const { sessionId } = await createSessionWithCdp(headers);
  return sessionId;
}

/**
 * Starts a local-browser session through `/v1/sessions/start` and returns its
 * session id and CDP URL.
 *
 * @param headers - Request headers to send.
 * @throws Error when the request fails, the response reports no success, the
 *   session is not available, or the id / CDP URL is missing. Start failures
 *   include launch diagnostics in the message.
 */
export async function createSessionWithCdp(
  headers: Record<string, string>,
): Promise<SessionInfo> {
  const url = getBaseUrl();
  const startPayload = {
    modelName: "gpt-4.1-nano",
    ...createLocalBrowserBody(),
  };

  const response = await fetch(`${url}/v1/sessions/start`, {
    method: "POST",
    headers,
    body: JSON.stringify(startPayload),
  });

  // Keep the raw text when the body is not JSON so it still shows up in errors.
  const responseText = await response.text();
  let parsedBody: unknown = null;
  if (responseText) {
    try {
      parsedBody = JSON.parse(responseText);
    } catch {
      parsedBody = responseText;
    }
  }
  const body = parsedBody as StartSessionResponse;

  const started = response.ok && Boolean(body?.success);
  if (!started) {
    const launchDiagnostics = readLaunchDiagnostics(
      startPayload.browser?.launchOptions,
    );
    const serialized = JSON.stringify(parsedBody);
    throw new Error(
      `Failed to create session (status=${response.status}): ${serialized}\n${launchDiagnostics}`,
    );
  }

  const data = body.data;
  if (!data?.available) {
    throw new Error(`Session not available`);
  }
  const { sessionId, cdpUrl } = data;
  if (!sessionId) {
    throw new Error("No sessionId returned");
  }
  if (!cdpUrl) {
    throw new Error("No cdpUrl returned");
  }

  // Give the session a moment to become fully ready before returning.
  await new Promise((resolve) => setTimeout(resolve, SESSION_READY_DELAY_MS));

  return { sessionId, cdpUrl };
}

/**
 * Posts an empty body to the session's `/end` endpoint.
 * The response is not inspected; only a rejected fetch surfaces as an error.
 */
export async function endSession(
  sessionId: string,
  headers: Record<string, string>,
): Promise<void> {
  const endpoint = `${getBaseUrl()}/v1/sessions/${sessionId}/end`;
  const init: RequestInit = {
    method: "POST",
    headers,
    body: JSON.stringify({}),
  };

  await fetch(endpoint, init);
}

// =============================================================================
// Navigation Helper
// =============================================================================

/**
 * Asks the server to navigate the session to `targetUrl`.
 * Sends an empty `frameId` and returns the raw fetch Response unchanged.
 */
export async function navigateSession(
  sessionId: string,
  targetUrl: string,
  headers: Record<string, string>,
): Promise<Response> {
  const endpoint = `${getBaseUrl()}/v1/sessions/${sessionId}/navigate`;
  const payload = { url: targetUrl, frameId: "" };

  return fetch(endpoint, {
    method: "POST",
    headers,
    body: JSON.stringify(payload),
  });
}

/**
 * Connects to the browser over CDP and returns the main frame id of the first
 * page in the first browser context.
 *
 * @throws Error when the browser has no contexts or the context has no pages.
 */
export async function getMainFrameId(cdpUrl: string): Promise<string> {
  const browser = await chromium.connectOverCDP(cdpUrl);
  try {
    const [firstContext] = browser.contexts();
    if (!firstContext) {
      throw new Error("No browser contexts found");
    }
    const [firstPage] = firstContext.pages();
    if (!firstPage) {
      throw new Error("No pages found");
    }

    // The root of the frame tree reported by CDP is the main frame.
    const cdpSession = await firstPage.context().newCDPSession(firstPage);
    const tree = await cdpSession.send("Page.getFrameTree");
    await cdpSession.detach();

    return tree.frameTree.frame.id;
  } finally {
    // Always close the CDP connection, even when a lookup above fails.
    await browser.close();
  }
}

// =============================================================================
// SSE Stream Reader
// =============================================================================

// Legacy, generic SSE event as produced by readSSEStream.
export interface SSEEvent {
  /** Value of the `event:` field, when the event has one. */
  event?: string;
  /** Value of the `data:` field, when the event has one. */
  data?: string;
  /** `data` parsed as JSON; left unset when `data` is not valid JSON. */
  parsed?: unknown;
}

/**
 * Reads a response body to the end and parses it as a Server-Sent Events stream.
 *
 * Events are separated by a blank line. Within an event, the `event:` field
 * and all `data:` fields are collected; multiple `data:` lines are joined with
 * "\n" and the joined value is parsed as JSON when possible. CRLF, LF and CR
 * line endings are all accepted. Events with neither data nor an event name
 * are dropped.
 *
 * @param response - The fetch response whose body is an SSE stream.
 * @returns The parsed events, in stream order.
 * @throws Error when the response has no readable body.
 */
export async function readSSEStream(response: Response): Promise<SSEEvent[]> {
  const reader = response.body?.getReader() as
    | ReadableStreamDefaultReader<Uint8Array>
    | undefined;
  if (!reader) {
    throw new Error("No response body reader available");
  }

  const decoder = new TextDecoder();
  let fullResponse = "";

  for (;;) {
    const result = await reader.read();
    if (result.done) break;
    fullResponse += decoder.decode(result.value, { stream: true });
  }
  // Flush whatever the streaming decoder is still buffering.
  fullResponse += decoder.decode();

  // Normalize CRLF / CR line endings so the splits below only deal with "\n".
  const normalized = fullResponse.replace(/\r\n?/g, "\n");

  // Parse SSE events
  const events: SSEEvent[] = [];
  for (const rawEvent of normalized.split("\n\n")) {
    if (!rawEvent.trim()) continue;

    const event: SSEEvent = {};
    const dataLines: string[] = [];

    for (const line of rawEvent.split("\n")) {
      if (line.startsWith("event:")) {
        event.event = line.slice(6).trim();
      } else if (line.startsWith("data:")) {
        dataLines.push(line.slice(5).trim());
      }
    }

    if (dataLines.length > 0) {
      // Join before parsing so `data` and `parsed` always describe the same payload.
      event.data = dataLines.join("\n");
      try {
        event.parsed = JSON.parse(event.data);
      } catch {
        // Keep as string if not valid JSON
      }
    }

    if (event.data || event.event) {
      events.push(event);
    }
  }

  return events;
}

// =============================================================================
// Typed SSE Event Helpers (for stagehand-api backend format)
// =============================================================================

// Actual SSE event format from backend (see stream.ts):
// { data: { status: "starting" | "connected" | "finished", result?: ... }, type: "system" | "log", id: "<uuid>" }
// TResult is the type of the optional `data.result` payload.
export interface TypedSSEEvent<TResult = unknown> {
  data: {
    /** Event status string; the helpers below also look for "error". */
    status: string;
    /** Result payload, when the event carries one. */
    result?: TResult;
    /** Optional message text. */
    message?: string;
    /** Error text; surfaced by the debug summary for "error" events. */
    error?: string;
  };
  /** Event category string. */
  type: string;
  /** Event identifier. */
  id: string;
}

/**
 * Reads the whole response body and returns it as a UTF-8 decoded string.
 *
 * The decoder is flushed after the last chunk, so a byte sequence truncated at
 * the end of the stream decodes to U+FFFD (as `response.text()` would) instead
 * of being silently dropped.
 *
 * @param response - The fetch response to read.
 * @returns The full decoded body text.
 * @throws Error when the response has no readable body.
 */
export async function readSSEStreamRaw(response: Response): Promise<string> {
  const reader = response.body?.getReader() as
    | ReadableStreamDefaultReader<Uint8Array>
    | undefined;
  if (!reader) throw new Error("No response body reader");

  const decoder = new TextDecoder();
  let fullResponse = "";

  for (;;) {
    const result = await reader.read();
    if (result.done) break;
    // stream: true keeps multi-byte characters split across chunks intact.
    fullResponse += decoder.decode(result.value, { stream: true });
  }
  // Final call without `stream` flushes any bytes still buffered.
  fullResponse += decoder.decode();

  return fullResponse;
}

/**
 * Splits a raw SSE body on blank lines and JSON-parses the first `data: `
 * line of each chunk.
 *
 * Chunks without a `data: ` line, and chunks whose payload parses to `null`,
 * are skipped.
 *
 * @param rawResponse - The full SSE body text.
 * @returns The parsed events, in stream order.
 * @throws SyntaxError when a `data: ` payload is not valid JSON.
 */
export function parseTypedSSEEvents<TResult = unknown>(
  rawResponse: string,
): TypedSSEEvent<TResult>[] {
  const parsedEvents: TypedSSEEvent<TResult>[] = [];

  for (const chunk of rawResponse.split("\n\n")) {
    if (!chunk.trim()) continue;

    const payload = chunk.match(/data: (.+)/)?.[1];
    if (!payload) continue;

    const event = JSON.parse(payload) as TypedSSEEvent<TResult> | null;
    if (event !== null) {
      parsedEvents.push(event);
    }
  }

  return parsedEvents;
}

/**
 * Result of reading an SSE stream with full context for debugging.
 * Produced by readTypedSSEStreamWithContext; TResult is the type of each
 * event's `data.result`.
 */
export interface SSEStreamResult<TResult = unknown> {
  /** HTTP status code */
  status: number;
  /** HTTP status text */
  statusText: string;
  /** Raw response body, exactly as read from the stream */
  raw: string;
  /** SSE events parsed from `raw` */
  events: TypedSSEEvent<TResult>[];
  /** Get debug summary for error messages (status line, event statuses, errors) */
  debugSummary(): string;
}

/**
 * Reads the response body and parses it into typed SSE events.
 * Legacy helper: returns only the events, without any debug context.
 */
export async function readTypedSSEStream<TResult = unknown>(
  response: Response,
): Promise<TypedSSEEvent<TResult>[]> {
  return parseTypedSSEEvents<TResult>(await readSSEStreamRaw(response));
}

/**
 * Reads an SSE response and returns its events together with the HTTP status,
 * the raw body and a `debugSummary()` for use in test failure messages.
 * Prefer this over readTypedSSEStream when failures need to be diagnosable.
 */
export async function readTypedSSEStreamWithContext<TResult = unknown>(
  response: Response,
): Promise<SSEStreamResult<TResult>> {
  const { status, statusText } = response;
  const raw = await readSSEStreamRaw(response);
  const events = parseTypedSSEEvents<TResult>(raw);

  const debugSummary = (): string => {
    const lines = [`HTTP ${status} ${statusText}`];

    // No events at all: show the start of the raw body instead.
    if (events.length === 0) {
      const preview = raw.slice(0, 500) + (raw.length > 500 ? "..." : "");
      lines.push("  No SSE events received", `  Raw response: ${preview}`);
      return lines.join("\n");
    }

    const statuses = events.map((e) => e.data.status).join(" → ");
    lines.push(`  Events (${events.length}): ${statuses}`);

    const errors = events
      .filter((e) => e.data.status === "error")
      .map((e) => e.data.error ?? "unknown error")
      .join(", ");
    if (errors) {
      lines.push(`  Errors: ${errors}`);
    }
    return lines.join("\n");
  };

  return { status, statusText, raw, events, debugSummary };
}

/**
 * Throws when `condition` is false, appending the SSE stream's debug summary
 * to `message`.
 */
export function assertWithContext(
  condition: boolean,
  message: string,
  context: SSEStreamResult<unknown>,
): asserts condition {
  if (condition) {
    return;
  }
  const details = context.debugSummary();
  throw new Error(`${message}\n\nDebug context:\n${details}`);
}

/**
 * Returns the first event whose `data.status` equals `status`.
 * Throws with the stream's debug summary when no such event exists.
 */
export function assertEventExists<TResult>(
  events: TypedSSEEvent<TResult>[],
  status: string,
  context: SSEStreamResult<TResult>,
): TypedSSEEvent<TResult> {
  const match = events.find(({ data }) => data.status === status);
  const failureMessage = `Should have a "${status}" event`;
  assertWithContext(match !== undefined, failureMessage, context);
  return match;
}

/**
 * Asserts that the stream's HTTP status equals `expectedStatus`.
 * Failures include the stream's debug summary; `message` overrides the default text.
 */
export function assertHttpStatus(
  context: SSEStreamResult<unknown>,
  expectedStatus: number,
  message?: string,
): void {
  const failureMessage =
    message ?? `Expected HTTP ${expectedStatus}, got ${context.status}`;
  const matches = context.status === expectedStatus;
  assertWithContext(matches, failureMessage, context);
}

// =============================================================================
// JSON Response Debug Utilities (for non-SSE tests)
// =============================================================================

/**
 * Result of a fetch request with full context for debugging.
 * Produced by fetchWithContext; T is the expected type of the JSON body.
 */
export interface FetchResult<T = unknown> {
  /** HTTP status code; 0 when fetch itself failed */
  status: number;
  /** HTTP status text; "FETCH_ERROR" when fetch itself failed */
  statusText: string;
  /** Parsed JSON body, or null when the body is not valid JSON */
  body: T | null;
  /** Raw response text; the error message when fetch itself failed */
  raw: string;
  /** Time in ms until fetch() settled (measured before the body is read) */
  durationMs: number;
  /** Response headers; empty when fetch itself failed */
  headers: Headers;
  /** Get debug summary for error messages */
  debugSummary(): string;
}

/**
 * Performs a fetch and returns status, headers, raw and parsed body, and
 * timing in one object, so test failures can print useful context.
 *
 * A rejected fetch does not throw: it is reported as status 0 with
 * statusText "FETCH_ERROR" and the error message as `raw`.
 */
export async function fetchWithContext<T = unknown>(
  url: string,
  options: RequestInit,
): Promise<FetchResult<T>> {
  const startedAt = Date.now();

  let response: Response;
  try {
    response = await fetch(url, options);
  } catch (err) {
    const durationMs = Date.now() - startedAt;
    const errorMsg = err instanceof Error ? err.message : String(err);
    return {
      status: 0,
      statusText: "FETCH_ERROR",
      body: null,
      raw: errorMsg,
      durationMs,
      headers: new Headers(),
      debugSummary: () => `Fetch failed after ${durationMs}ms: ${errorMsg}`,
    };
  }

  // Timing stops once fetch() resolves, i.e. before the body is read.
  const durationMs = Date.now() - startedAt;
  const { status, statusText, headers } = response;
  const raw = await response.text();

  // A body that is not valid JSON is reported as null.
  let body: T | null;
  try {
    body = JSON.parse(raw) as T;
  } catch {
    body = null;
  }

  const debugSummary = (): string => {
    const seconds = (durationMs / 1000).toFixed(1);
    const lines = [`HTTP ${status} ${statusText} (${seconds}s)`];

    if (body && typeof body === "object") {
      const fields = body as Record<string, unknown>;
      if (fields.success === false && typeof fields.message === "string") {
        lines.push(`  Error: ${fields.message}`);
      }
      if (typeof fields.error === "string") {
        lines.push(`  Error: ${fields.error}`);
      }
    }

    // Include the (truncated) raw body for error statuses and unparsed bodies.
    if (status >= 400 || !body) {
      const ellipsis = raw.length > 500 ? "..." : "";
      lines.push(`  Response: ${raw.slice(0, 500)}${ellipsis}`);
    }

    return lines.join("\n");
  };

  return { status, statusText, body, raw, durationMs, headers, debugSummary };
}

/**
 * Throws when `condition` is false, appending the fetch result's debug
 * summary to `message`.
 */
export function assertFetchOk<T>(
  condition: boolean,
  message: string,
  context: FetchResult<T>,
): asserts condition {
  if (condition) {
    return;
  }
  const details = context.debugSummary();
  throw new Error(`${message}\n\nDebug context:\n${details}`);
}

/**
 * Asserts that the fetch result's HTTP status equals `expectedStatus`.
 * Failures include the result's debug summary; `message` overrides the default text.
 */
export function assertFetchStatus<T>(
  context: FetchResult<T>,
  expectedStatus: number,
  message?: string,
): void {
  const failureMessage =
    message ?? `Expected HTTP ${expectedStatus}, got ${context.status}`;
  const matches = context.status === expectedStatus;
  assertFetchOk(matches, failureMessage, context);
}

// =============================================================================
// Test Context Manager
// =============================================================================

/**
 * Small stateful wrapper around the session helpers: remembers the session id
 * and the headers so tests can start, navigate and end a session.
 */
export class TestSession {
  /** Id of the active session, or null when none has been started (or it was ended). */
  public sessionId: string | null = null;
  private headers: Record<string, string>;

  constructor(headers: Record<string, string>) {
    this.headers = headers;
  }

  /** Creates a session, stores its id and returns it. */
  async start(): Promise<string> {
    const id = await createSession(this.headers);
    this.sessionId = id;
    return id;
  }

  /** Navigates the active session; rejects with "Session not started" when there is none. */
  async navigate(targetUrl: string): Promise<Response> {
    const id = this.sessionId;
    if (!id) {
      throw new Error("Session not started");
    }
    return navigateSession(id, targetUrl, this.headers);
  }

  /** Ends the active session, if any. Failures are deliberately ignored. */
  async end(): Promise<void> {
    if (!this.sessionId) {
      return;
    }
    try {
      await endSession(this.sessionId, this.headers);
    } catch {
      // Best-effort cleanup: ignore errors when ending the session.
    }
    this.sessionId = null;
  }

  /** Returns the active session id; throws "Session not started" when there is none. */
  getSessionId(): string {
    const id = this.sessionId;
    if (!id) {
      throw new Error("Session not started");
    }
    return id;
  }
}


================================================
FILE: packages/server-v3/test/integration/v3/act.test.ts
================================================
import assert from "node:assert/strict";
import { after, before, beforeEach, describe, it } from "node:test";

import { chromium } from "playwright";

import {
  assertEventExists,
  assertFetchOk,
  assertFetchStatus,
  assertWithContext,
  createSessionWithCdp,
  endSession,
  fetchWithContext,
  GEMINI_API_KEY,
  getBaseUrl,
  getHeaders,
  getMainFrameId,
  HTTP_OK,
  navigateSession,
  OPENAI_API_KEY,
  readTypedSSEStreamWithContext,
  requireEnv,
} from "../utils.js";

/** Expected JSON shape of the act endpoint's (non-streaming) response body. */
interface ActResponse {
  /** Whether the request as a whole succeeded. */
  success: boolean;
  data?: {
    /** Outcome of the action itself. */
    result: { success: boolean; message?: string };
    /** Identifier of the performed action, when returned. */
    actionId?: string;
  };
}

/** Result type for act SSE events (the `result` payload of a typed SSE event). */
interface ActResult {
  /** Whether the action succeeded. */
  success: boolean;
  /** Optional message text. */
  message?: string;
  /** Optional action text. */
  action?: string;
}

// Session state shared by every describe block in this file.
let sessionId: string;
let cdpUrl: string;

// Create the single session used by all tests.
before(async () => {
  const session = await createSessionWithCdp(getHeaders("3.0.0"));
  sessionId = session.sessionId;
  cdpUrl = session.cdpUrl;
});

// act() may navigate away, so return to example.com before each test.
beforeEach(async () => {
  const headers = getHeaders("3.0.0");
  const navResponse = await navigateSession(
    sessionId,
    "https://example.com",
    headers,
  );
  assert.equal(navResponse.status, HTTP_OK, "Navigate should succeed");
});

// Tear the shared session down once all tests have run.
after(async () => {
  const headers = getHeaders("3.0.0");
  await endSession(sessionId, headers);
});

// =============================================================================
// POST /v1/sessions/:id/act (V3 Format)
// =============================================================================

describe("POST /v1/sessions/:id/act (V3)", () => {
  // ===========================================================================
  // V3 Format Tests
  // ===========================================================================

  // Sends a natural-language instruction to the act endpoint, checks the
  // response envelope, then inspects the browser over CDP to confirm the click
  // actually navigated to the IANA example-domains page.
  it("should perform an action using string input format", async () => {
    const url = getBaseUrl();
    const frameId = await getMainFrameId(cdpUrl);

    const ctx = await fetchWithContext<ActResponse>(
      `${url}/v1/sessions/${sessionId}/act`,
      {
        method: "POST",
        headers: {
          ...getHeaders("3.0.0"),
        },
        body: JSON.stringify({
          input: "click the Learn more link",
          frameId,
        }),
      },
    );

    assertFetchStatus(ctx, HTTP_OK, "act should succeed");
    assertFetchOk(ctx.body !== null, "Response should have body", ctx);
    assertFetchOk(ctx.body.success, "Response should indicate success", ctx);
    assertFetchOk(!!ctx.body.data, "Response should have data", ctx);
    assertFetchOk(!!ctx.body.data.result, "Response should have result", ctx);
    assert.equal(
      typeof ctx.body.data.result.success,
      "boolean",
      "Result should have success boolean",
    );

    // Verify navigation via CDP. The connection is closed in `finally` so that
    // a failing assertion below does not leave the CDP client connected.
    const browser = await chromium.connectOverCDP(cdpUrl);
    try {
      const contexts = browser.contexts();
      assert.ok(
        contexts.length > 0,
        "Should have at least one browser context",
      );
      const pages = contexts[0]!.pages();
      assert.ok(pages.length > 0, "Should have at least one page");
      const pageUrl = pages[0]!.url();
      assert.ok(
        pageUrl.includes("iana.org/help/example-domains"),
        `Page URL should be iana.org/help/example-domains, got: ${pageUrl}`,
      );
    } finally {
      await browser.close();
    }
  });

  // Same endpoint, but the action is given as a structured
  // selector/description/method object instead of a free-form string.
  it("should perform an action using object input format", async () => {
    const endpoint = `${getBaseUrl()}/v1/sessions/${sessionId}/act`;
    const payload = {
      input: {
        selector: "a",
        description: "Click a link on the page",
        method: "click",
      },
    };

    const res = await fetchWithContext<ActResponse>(endpoint, {
      method: "POST",
      headers: { ...getHeaders("3.0.0") },
      body: JSON.stringify(payload),
    });

    assertFetchStatus(res, HTTP_OK, "act with object input should succeed");
    assertFetchOk(res.body !== null, "Response should have body", res);
    assertFetchOk(res.body.success, "Response should indicate success", res);
    assertFetchOk(!!res.body.data, "Response should have data", res);
    assertFetchOk(!!res.body.data.result, "Response should have result", res);

    const successType = typeof res.body.data.result.success;
    assert.equal(successType, "boolean", "Result should have success boolean");
  });

  // String instruction accompanied by an `options` object carrying a timeout.
  it("should accept options with string input", async () => {
    const endpoint = `${getBaseUrl()}/v1/sessions/${sessionId}/act`;
    const payload = {
      input: "click the Learn more link",
      options: { timeout: 30000 },
    };

    const res = await fetchWithContext<ActResponse>(endpoint, {
      method: "POST",
      headers: { ...getHeaders("3.0.0") },
      body: JSON.stringify(payload),
    });

    assertFetchStatus(res, HTTP_OK, "act with options should succeed");
    assertFetchOk(res.body !== null, "Response should have body", res);
    assertFetchOk(res.body.success, "Response should indicate success", res);
    assertFetchOk(!!res.body.data, "Response should have data", res);
    assertFetchOk(!!res.body.data.result, "Response should have result", res);

    const successType = typeof res.body.data.result.success;
    assert.equal(successType, "boolean", "Result should have success boolean");
  });

  // ===========================================================================
  // V3 Inline Model Configuration Tests
  // ===========================================================================

  // The model name and API key are supplied in the request body while the
  // x-model-api-key header is sent empty.
  it("should perform action with inline model config (modelName + apiKey)", async () => {
    const endpoint = `${getBaseUrl()}/v1/sessions/${sessionId}/act`;
    const openaiApiKey = requireEnv("OPENAI_API_KEY", OPENAI_API_KEY);
    const payload = {
      input: "click the Learn more link",
      options: {
        model: {
          modelName: "openai/gpt-4.1-nano",
          apiKey: openaiApiKey,
        },
      },
    };

    const res = await fetchWithContext<ActResponse>(endpoint, {
      method: "POST",
      headers: {
        ...getHeaders("3.0.0"),
        // Clear the header to ensure body config is used
        "x-model-api-key": "",
      },
      body: JSON.stringify(payload),
    });

    assertFetchStatus(
      res,
      HTTP_OK,
      "act with inline model config should succeed",
    );
    assertFetchOk(res.body !== null, "Response should have body", res);
    assertFetchOk(res.body.success, "Response should indicate success", res);
    assertFetchOk(!!res.body.data, "Response should have data", res);
    assertFetchOk(!!res.body.data.result, "Response should have result", res);

    const successType = typeof res.body.data.result.success;
    assert.equal(successType, "boolean", "Result should have success boolean");
  });

  // Inline model config combined with an additional `timeout` option.
  it("should perform action with inline model config and options", async () => {
    const endpoint = `${getBaseUrl()}/v1/sessions/${sessionId}/act`;
    const openaiApiKey = requireEnv("OPENAI_API_KEY", OPENAI_API_KEY);
    const payload = {
      input: "click the Learn more link",
      options: {
        model: {
          modelName: "openai/gpt-4.1-nano",
          apiKey: openaiApiKey,
        },
        timeout: 30000,
      },
    };

    const res = await fetchWithContext<ActResponse>(endpoint, {
      method: "POST",
      headers: {
        ...getHeaders("3.0.0"),
        // Clear the header to ensure body config is used
        "x-model-api-key": "",
      },
      body: JSON.stringify(payload),
    });

    assertFetchStatus(
      res,
      HTTP_OK,
      "act with inline model config and options should succeed",
    );
    assertFetchOk(res.body !== null, "Response should have body", res);
    assertFetchOk(res.body.success, "Response should indicate success", res);
    assertFetchOk(!!res.body.data, "Response should have data", res);
    assertFetchOk(!!res.body.data.result, "Response should have result", res);

    const successType = typeof res.body.data.result.success;
    assert.equal(successType, "boolean", "Result should have success boolean");
  });

  // Structured action input together with a body-level model config.
  it("should perform action with object input and inline model config", async () => {
    const endpoint = `${getBaseUrl()}/v1/sessions/${sessionId}/act`;
    const openaiApiKey = requireEnv("OPENAI_API_KEY", OPENAI_API_KEY);
    const payload = {
      input: {
        selector: "a",
        description: "Click a link on the page",
        method: "click",
      },
      options: {
        model: {
          modelName: "openai/gpt-4.1-nano",
          apiKey: openaiApiKey,
        },
      },
    };

    const res = await fetchWithContext<ActResponse>(endpoint, {
      method: "POST",
      headers: {
        ...getHeaders("3.0.0"),
        // Clear the header to ensure body config is used
        "x-model-api-key": "",
      },
      body: JSON.stringify(payload),
    });

    assertFetchStatus(
      res,
      HTTP_OK,
      "act with object input and inline model config should succeed",
    );
    assertFetchOk(res.body !== null, "Response should have body", res);
    assertFetchOk(res.body.success, "Response should indicate success", res);
    assertFetchOk(!!res.body.data, "Response should have data", res);
    assertFetchOk(!!res.body.data.result, "Response should have result", res);

    const successType = typeof res.body.data.result.success;
    assert.equal(successType, "boolean", "Result should have success boolean");
  });

  // Same inline-model flow, using a Google model and the Gemini API key.
  it("should perform action with google/gemini-2.5-flash-lite model", async () => {
    const endpoint = `${getBaseUrl()}/v1/sessions/${sessionId}/act`;
    const geminiApiKey = requireEnv("GEMINI_API_KEY", GEMINI_API_KEY);
    const payload = {
      input: "click the Learn more link",
      options: {
        model: {
          modelName: "google/gemini-2.5-flash-lite",
          apiKey: geminiApiKey,
        },
      },
    };

    const res = await fetchWithContext<ActResponse>(endpoint, {
      method: "POST",
      headers: {
        ...getHeaders("3.0.0"),
        // Clear the header to ensure body config is used
        "x-model-api-key": "",
      },
      body: JSON.stringify(payload),
    });

    assertFetchStatus(
      res,
      HTTP_OK,
      "act with google/gemini-2.5-flash-lite model should succeed",
    );
    assertFetchOk(res.body !== null, "Response should have body", res);
    assertFetchOk(res.body.success, "Response should indicate success", res);
    assertFetchOk(!!res.body.data, "Response should have data", res);
    assertFetchOk(!!res.body.data.result, "Response should have result", res);

    const successType = typeof res.body.data.result.success;
    assert.equal(successType, "boolean", "Result should have success boolean");
  });
});

// =============================================================================
// SSE Streaming Tests (V3)
// =============================================================================

describe("POST /v1/sessions/:id/act with SSE streaming (V3)", () => {
  // Requests a streamed response and checks that both a "starting" and a
  // "finished" system event arrive, the latter carrying a result.
  it("should stream valid SSE events with correct structure", async () => {
    const endpoint = `${getBaseUrl()}/v1/sessions/${sessionId}/act`;
    const payload = {
      input: "click the Learn more link",
      streamResponse: true,
    };

    const response = await fetch(endpoint, {
      method: "POST",
      headers: { ...getHeaders("3.0.0") },
      body: JSON.stringify(payload),
    });

    const sse = await readTypedSSEStreamWithContext<ActResult>(response);
    const events = sse.events;

    assertWithContext(
      events.length >= 2,
      "Should have at least starting and finished events",
      sse,
    );

    // The stream must contain a system-typed "starting" event
    const started = assertEventExists(events, "starting", sse);
    assert.equal(started.type, "system", "Starting event should be system type");

    // ...and a system-typed "finished" event that carries the result
    const finished = assertEventExists(events, "finished", sse);
    assert.equal(
      finished.type,
      "system",
      "Finished event should be system type",
    );
    assertWithContext(
      !!finished.data.result,
      "Finished event must have result",
      sse,
    );
    assert.equal(
      typeof finished.data.result.success,
      "boolean",
      "Result.success must be a boolean",
    );
  });

  // Streaming variant of the inline-model request: model config in the body,
  // x-model-api-key header sent empty.
  it("should stream SSE events with inline model config", async () => {
    const endpoint = `${getBaseUrl()}/v1/sessions/${sessionId}/act`;
    const openaiApiKey = requireEnv("OPENAI_API_KEY", OPENAI_API_KEY);
    const payload = {
      input: "click the Learn more link",
      options: {
        model: {
          modelName: "openai/gpt-4.1-nano",
          apiKey: openaiApiKey,
        },
      },
      streamResponse: true,
    };

    const response = await fetch(endpoint, {
      method: "POST",
      headers: {
        ...getHeaders("3.0.0"),
        // Clear the header to ensure body config is used
        "x-model-api-key": "",
      },
      body: JSON.stringify(payload),
    });

    const sse = await readTypedSSEStreamWithContext<ActResult>(response);
    const events = sse.events;

    assertWithContext(
      events.length >= 2,
      "Should have at least starting and finished events",
      sse,
    );

    // The stream must contain a system-typed "starting" event
    const started = assertEventExists(events, "starting", sse);
    assert.equal(started.type, "system", "Starting event should be system type");

    // ...and a system-typed "finished" event that carries the result
    const finished = assertEventExists(events, "finished", sse);
    assert.equal(
      finished.type,
      "system",
      "Finished event should be system type",
    );
    assertWithContext(
      !!finished.data.result,
      "Finished event must have result",
      sse,
    );
    assert.equal(
      typeof finished.data.result.success,
      "boolean",
      "Result.success must be a boolean",
    );
  });
});


================================================
FILE: packages/server-v3/test/integration/v3/agentExecute.test.ts
================================================
import assert from "node:assert/strict";
import { after, before, beforeEach, describe, it } from "node:test";

import {
  assertFetchOk,
  assertFetchStatus,
  assertWithContext,
  createSession,
  createSessionWithCdp,
  endSession,
  fetchWithContext,
  GEMINI_API_KEY,
  getBaseUrl,
  getHeaders,
  getMainFrameId,
  HTTP_BAD_REQUEST,
  HTTP_OK,
  HTTP_UNPROCESSABLE_ENTITY,
  navigateSession,
  OPENAI_API_KEY,
  readTypedSSEStreamWithContext,
  requireEnv,
} from "../utils.js";

// =============================================================================
// POST /v1/sessions/:id/agentExecute (V3 Format)
// =============================================================================

describe("POST /v1/sessions/:id/agentExecute (V3) - Basic Config", () => {
  // Session state shared by every test in this describe block.
  let sessionId: string;
  let cdpUrl: string;
  const headers = getHeaders("3.0.0");

  // Create one session and keep both its id and its CDP URL.
  before(async () => {
    const created = await createSessionWithCdp(headers);
    ({ sessionId, cdpUrl } = created);
  });

  // Each test, the first included, starts from example.com.
  beforeEach(async () => {
    const targetUrl = "https://example.com";
    const navResponse = await navigateSession(sessionId, targetUrl, headers);
    assert.equal(navResponse.status, HTTP_OK, "Navigate should succeed");
  });

  // End the session if one exists, then clear the stored id.
  after(async () => {
    if (!sessionId) {
      return;
    }
    await endSession(sessionId, headers);
    sessionId = "";
  });

  // Empty agentConfig plus an explicit frameId taken from the CDP connection.
  it("should execute agent with basic config (empty agentConfig)", async () => {
    // Response envelope this test expects from agentExecute
    type AgentExecuteBody = {
      success: boolean;
      data?: { result: unknown; actionId?: string };
    };

    const endpoint = `${getBaseUrl()}/v1/sessions/${sessionId}/agentExecute`;
    const frameId = await getMainFrameId(cdpUrl);
    const payload = {
      agentConfig: {},
      executeOptions: {
        instruction: "Describe the main heading on this page",
        frameId,
      },
    };

    const res = await fetchWithContext<AgentExecuteBody>(endpoint, {
      method: "POST",
      headers,
      body: JSON.stringify(payload),
    });

    assertFetchStatus(res, HTTP_OK, "V3 agent execute should succeed");
    assertFetchOk(res.body !== null, "Response body should be parseable", res);
    assertFetchOk(res.body.success, "Response should indicate success", res);
    assertFetchOk(res.body.data !== undefined, "Response should have data", res);
    assertFetchOk(
      res.body.data.result !== undefined,
      "Response should have result",
      res,
    );
  });

  // agentConfig.model given as a plain string.
  it("should execute agent with string agentConfig.model", async () => {
    // Response envelope this test expects from agentExecute
    type AgentExecuteBody = {
      success: boolean;
      data?: { result: unknown; actionId?: string };
    };

    const endpoint = `${getBaseUrl()}/v1/sessions/${sessionId}/agentExecute`;
    const payload = {
      agentConfig: {
        model: "gpt-4.1-nano",
      },
      executeOptions: {
        instruction: "What is the title of this page?",
      },
    };

    const res = await fetchWithContext<AgentExecuteBody>(endpoint, {
      method: "POST",
      headers,
      body: JSON.stringify(payload),
    });

    assertFetchStatus(
      res,
      HTTP_OK,
      "V3 agent execute with string model should succeed",
    );
    assertFetchOk(res.body !== null, "Response body should be parseable", res);
    assertFetchOk(res.body.success, "Response should indicate success", res);
    assertFetchOk(res.body.data !== undefined, "Response should have data", res);
    assertFetchOk(
      res.body.data.result !== undefined,
      "Response should have result",
      res,
    );
  });

  // agentConfig.model given as an object with separate provider and modelName.
  it("should execute agent with object model config (provider + modelName)", async () => {
    // Response envelope this test expects from agentExecute
    type AgentExecuteBody = {
      success: boolean;
      data?: { result: unknown; actionId?: string };
    };

    const endpoint = `${getBaseUrl()}/v1/sessions/${sessionId}/agentExecute`;
    const payload = {
      agentConfig: {
        model: {
          provider: "openai",
          modelName: "gpt-4.1-nano",
        },
      },
      executeOptions: {
        instruction: "Describe the page content",
      },
    };

    const res = await fetchWithContext<AgentExecuteBody>(endpoint, {
      method: "POST",
      headers,
      body: JSON.stringify(payload),
    });

    assertFetchStatus(
      res,
      HTTP_OK,
      "V3 agent execute with object model should succeed",
    );
    assertFetchOk(res.body !== null, "Response body should be parseable", res);
    assertFetchOk(res.body.success, "Response should indicate success", res);
    assertFetchOk(res.body.data !== undefined, "Response should have data", res);
    assertFetchOk(
      res.body.data.result !== undefined,
      "Response should have result",
      res,
    );
  });

  // systemPrompt on the agent config, maxSteps on the execute options.
  it("should execute agent with systemPrompt and maxSteps", async () => {
    // Response envelope this test expects from agentExecute
    type AgentExecuteBody = {
      success: boolean;
      data?: { result: unknown; actionId?: string };
    };

    const endpoint = `${getBaseUrl()}/v1/sessions/${sessionId}/agentExecute`;
    const payload = {
      agentConfig: {
        systemPrompt: "You are a helpful web browsing assistant.",
      },
      executeOptions: {
        instruction: "Find and describe the main content",
        maxSteps: 3,
      },
    };

    const res = await fetchWithContext<AgentExecuteBody>(endpoint, {
      method: "POST",
      headers,
      body: JSON.stringify(payload),
    });

    assertFetchStatus(
      res,
      HTTP_OK,
      "V3 agent execute with systemPrompt and maxSteps should succeed",
    );
    assertFetchOk(res.body !== null, "Response body should be parseable", res);
    assertFetchOk(res.body.success, "Response should indicate success", res);
    assertFetchOk(res.body.data !== undefined, "Response should have data", res);
    assertFetchOk(
      res.body.data.result !== undefined,
      "Response should have result",
      res,
    );
  });
});

// ===========================================================================
// V3 Format Tests with model: {modelName, apiKey} format - Google Gemini
// ===========================================================================

describe("POST /v1/sessions/:id/agentExecute (V3) - Google Gemini with API key", () => {
  // Session state shared by every test in this describe block.
  let sessionId: string;
  const headers = getHeaders("3.0.0");

  // Create one session for the whole block.
  before(async () => {
    const createdId = await createSession(headers);
    sessionId = createdId;
  });

  // Each test, the first included, starts from example.com.
  beforeEach(async () => {
    const targetUrl = "https://example.com";
    const navResponse = await navigateSession(sessionId, targetUrl, headers);
    assert.equal(navResponse.status, HTTP_OK, "Navigate should succeed");
  });

  // End the session if one exists, then clear the stored id.
  after(async () => {
    if (!sessionId) {
      return;
    }
    await endSession(sessionId, headers);
    sessionId = "";
  });

  // Google model supplied as { modelName, apiKey } inside agentConfig.
  it("should execute agent with Google model object containing modelName and apiKey", async () => {
    // Response envelope this test expects from agentExecute
    type AgentExecuteBody = {
      success: boolean;
      data?: { result: unknown; actionId?: string };
    };

    const endpoint = `${getBaseUrl()}/v1/sessions/${sessionId}/agentExecute`;
    const geminiApiKey = requireEnv("GEMINI_API_KEY", GEMINI_API_KEY);
    const payload = {
      agentConfig: {
        model: {
          modelName: "google/gemini-2.5-computer-use-preview-10-2025",
          apiKey: geminiApiKey,
        },
      },
      executeOptions: {
        instruction: "What is the title of this page?",
      },
    };

    const res = await fetchWithContext<AgentExecuteBody>(endpoint, {
      method: "POST",
      headers,
      body: JSON.stringify(payload),
    });

    assertFetchStatus(
      res,
      HTTP_OK,
      "V3 agent execute with Google model object should succeed",
    );
    assertFetchOk(res.body !== null, "Response body should be parseable", res);
    assertFetchOk(res.body.success, "Response should indicate success", res);
    assertFetchOk(res.body.data !== undefined, "Response should have data", res);
    assertFetchOk(
      res.body.data.result !== undefined,
      "Response should have result",
      res,
    );
  });

  // Google model object combined with a systemPrompt and a maxSteps limit.
  it("should execute agent with Google model object, systemPrompt, and maxSteps", async () => {
    // Response envelope this test expects from agentExecute
    type AgentExecuteBody = {
      success: boolean;
      data?: { result: unknown; actionId?: string };
    };

    const endpoint = `${getBaseUrl()}/v1/sessions/${sessionId}/agentExecute`;
    const geminiApiKey = requireEnv("GEMINI_API_KEY", GEMINI_API_KEY);
    const payload = {
      agentConfig: {
        model: {
          modelName: "google/gemini-2.5-computer-use-preview-10-2025",
          apiKey: geminiApiKey,
        },
        systemPrompt: "You are a helpful web browsing assistant.",
      },
      executeOptions: {
        instruction: "Find and read the main heading",
        maxSteps: 3,
      },
    };

    const res = await fetchWithContext<AgentExecuteBody>(endpoint, {
      method: "POST",
      headers,
      body: JSON.stringify(payload),
    });

    assertFetchStatus(
      res,
      HTTP_OK,
      "V3 agent execute with Google model, systemPrompt and maxSteps should succeed",
    );
    assertFetchOk(res.body !== null, "Response body should be parseable", res);
    assertFetchOk(res.body.success, "Response should indicate success", res);
    assertFetchOk(res.body.data !== undefined, "Response should have data", res);
    assertFetchOk(
      res.body.data.result !== undefined,
      "Response should have result",
      res,
    );
  });
});

// ===========================================================================
// V3 Format Tests with OpenAI model: {modelName, apiKey} format
// ===========================================================================

describe("POST /v1/sessions/:id/agentExecute (V3) - OpenAI with API key", () => {
  // Session state shared by every test in this describe block.
  let sessionId: string;
  const headers = getHeaders("3.0.0");

  // Create one session for the whole block.
  before(async () => {
    const createdId = await createSession(headers);
    sessionId = createdId;
  });

  // Each test, the first included, starts from example.com.
  beforeEach(async () => {
    const targetUrl = "https://example.com";
    const navResponse = await navigateSession(sessionId, targetUrl, headers);
    assert.equal(navResponse.status, HTTP_OK, "Navigate should succeed");
  });

  // End the session if one exists, then clear the stored id.
  after(async () => {
    if (!sessionId) {
      return;
    }
    await endSession(sessionId, headers);
    sessionId = "";
  });

  // OpenAI model supplied as { modelName, apiKey } inside agentConfig.
  it("should execute agent with OpenAI model object containing modelName and apiKey", async () => {
    // Response envelope this test expects from agentExecute
    type AgentExecuteBody = {
      success: boolean;
      data?: { result: unknown; actionId?: string };
    };

    const endpoint = `${getBaseUrl()}/v1/sessions/${sessionId}/agentExecute`;
    const openaiApiKey = requireEnv("OPENAI_API_KEY", OPENAI_API_KEY);
    const payload = {
      agentConfig: {
        model: {
          modelName: "openai/gpt-4.1-nano",
          apiKey: openaiApiKey,
        },
      },
      executeOptions: {
        instruction: "What is the title of this page?",
      },
    };

    const res = await fetchWithContext<AgentExecuteBody>(endpoint, {
      method: "POST",
      headers,
      body: JSON.stringify(payload),
    });

    assertFetchStatus(
      res,
      HTTP_OK,
      "V3 agent execute with OpenAI model object should succeed",
    );
    assertFetchOk(res.body !== null, "Response body should be parseable", res);
    assertFetchOk(res.body.success, "Response should indicate success", res);
    assertFetchOk(res.body.data !== undefined, "Response should have data", res);
    assertFetchOk(
      res.body.data.result !== undefined,
      "Response should have result",
      res,
    );
  });
});

// ===========================================================================
// V3 CUA Mode Tests - Testing explicit cua flag with model compatibility
// ===========================================================================

describe("POST /v1/sessions/:id/agentExecute (V3) - CUA flag compatibility", () => {
  // Session state shared by every test in this describe block.
  let sessionId: string;
  const headers = getHeaders("3.0.0");

  // Create one session for the whole block.
  before(async () => {
    const createdId = await createSession(headers);
    sessionId = createdId;
  });

  // Each test, the first included, starts from example.com.
  beforeEach(async () => {
    const targetUrl = "https://example.com";
    const navResponse = await navigateSession(sessionId, targetUrl, headers);
    assert.equal(navResponse.status, HTTP_OK, "Navigate should succeed");
  });

  // End the session if one exists, then clear the stored id.
  after(async () => {
    if (!sessionId) {
      return;
    }
    await endSession(sessionId, headers);
    sessionId = "";
  });

  // cua flag enabled together with a computer-use model: expected to succeed.
  it("should execute agent with cua: true and CUA model (valid combination)", async () => {
    // Response envelope this test expects from agentExecute
    type AgentExecuteBody = {
      success: boolean;
      data?: { result: unknown; actionId?: string };
    };

    const endpoint = `${getBaseUrl()}/v1/sessions/${sessionId}/agentExecute`;
    const geminiApiKey = requireEnv("GEMINI_API_KEY", GEMINI_API_KEY);
    const payload = {
      agentConfig: {
        cua: true,
        model: {
          modelName: "google/gemini-2.5-computer-use-preview-10-2025",
          apiKey: geminiApiKey,
        },
      },
      executeOptions: {
        instruction: "What is the title of this page?",
      },
    };

    const res = await fetchWithContext<AgentExecuteBody>(endpoint, {
      method: "POST",
      headers,
      body: JSON.stringify(payload),
    });

    assertFetchStatus(
      res,
      HTTP_OK,
      "V3 agent execute with cua: true and CUA model should succeed",
    );
    assertFetchOk(res.body !== null, "Response body should be parseable", res);
    assertFetchOk(res.body.success, "Response should indicate success", res);
    assertFetchOk(res.body.data !== undefined, "Response should have data", res);
    assertFetchOk(
      res.body.data.result !== undefined,
      "Response should have result",
      res,
    );
  });

  // cua flag disabled together with a regular model: expected to succeed.
  it("should execute agent with cua: false and non-CUA model (valid combination)", async () => {
    // Response envelope this test expects from agentExecute
    type AgentExecuteBody = {
      success: boolean;
      data?: { result: unknown; actionId?: string };
    };

    const endpoint = `${getBaseUrl()}/v1/sessions/${sessionId}/agentExecute`;
    const openaiApiKey = requireEnv("OPENAI_API_KEY", OPENAI_API_KEY);
    const payload = {
      agentConfig: {
        cua: false,
        model: {
          modelName: "openai/gpt-4.1-nano",
          apiKey: openaiApiKey,
        },
      },
      executeOptions: {
        instruction: "What is the title of this page?",
      },
    };

    const res = await fetchWithContext<AgentExecuteBody>(endpoint, {
      method: "POST",
      headers,
      body: JSON.stringify(payload),
    });

    assertFetchStatus(
      res,
      HTTP_OK,
      "V3 agent execute with cua: false and non-CUA model should succeed",
    );
    assertFetchOk(res.body !== null, "Response body should be parseable", res);
    assertFetchOk(res.body.success, "Response should indicate success", res);
    assertFetchOk(res.body.data !== undefined, "Response should have data", res);
    assertFetchOk(
      res.body.data.result !== undefined,
      "Response should have result",
      res,
    );
  });

  // A computer-use model requested with the cua flag disabled: expected to succeed.
  it("should execute agent with cua: false and CUA model (works in non-CUA mode)", async () => {
    // Response envelope this test expects from agentExecute
    type AgentExecuteBody = {
      success: boolean;
      message?: string;
      data?: { result: unknown; actionId?: string };
    };

    const endpoint = `${getBaseUrl()}/v1/sessions/${sessionId}/agentExecute`;
    const geminiApiKey = requireEnv("GEMINI_API_KEY", GEMINI_API_KEY);
    const payload = {
      agentConfig: {
        cua: false,
        model: {
          modelName: "google/gemini-2.5-computer-use-preview-10-2025",
          apiKey: geminiApiKey,
        },
      },
      executeOptions: {
        instruction: "What is the title of this page?",
      },
    };

    const res = await fetchWithContext<AgentExecuteBody>(endpoint, {
      method: "POST",
      headers,
      body: JSON.stringify(payload),
    });

    assertFetchStatus(
      res,
      HTTP_OK,
      "V3 agent execute with cua: false and Google CUA model should succeed",
    );
    assertFetchOk(res.body !== null, "Response body should be parseable", res);
    assertFetchOk(res.body.success, "Response should indicate success", res);
    assertFetchOk(res.body.data !== undefined, "Response should have data", res);
    assertFetchOk(
      res.body.data.result !== undefined,
      "Response should have result",
      res,
    );
  });

  // cua flag enabled with a model that is not a computer-use model: the test
  // expects a 422 status and a non-success body.
  it("should fail with cua: true and non-CUA model (invalid combination)", async () => {
    // Response envelope this test expects from agentExecute
    type AgentExecuteBody = {
      success: boolean;
      message?: string;
      data?: { result: unknown; actionId?: string };
    };

    const endpoint = `${getBaseUrl()}/v1/sessions/${sessionId}/agentExecute`;
    const geminiApiKey = requireEnv("GEMINI_API_KEY", GEMINI_API_KEY);
    const payload = {
      agentConfig: {
        cua: true,
        model: {
          modelName: "google/gemini-2.5-flash-lite",
          apiKey: geminiApiKey,
        },
      },
      executeOptions: {
        instruction: "What is the title of this page?",
      },
    };

    const res = await fetchWithContext<AgentExecuteBody>(endpoint, {
      method: "POST",
      headers,
      body: JSON.stringify(payload),
    });

    assertFetchStatus(
      res,
      HTTP_UNPROCESSABLE_ENTITY,
      "V3 agent execute with cua: true and non-CUA model should fail",
    );
    assertFetchOk(res.body !== null, "Response body should be parseable", res);
    assertFetchOk(!res.body.success, "Response should indicate failure", res);
  });

  // Sends both cua: true and mode: "dom" with a regular model; the request is
  // expected to succeed.
  it("should prefer mode over cua when both are provided", async () => {
    // Response envelope this test expects from agentExecute
    type AgentExecuteBody = {
      success: boolean;
      data?: { result: unknown; actionId?: string };
    };

    const endpoint = `${getBaseUrl()}/v1/sessions/${sessionId}/agentExecute`;
    const openaiApiKey = requireEnv("OPENAI_API_KEY", OPENAI_API_KEY);
    const payload = {
      agentConfig: {
        cua: true,
        mode: "dom",
        model: {
          modelName: "openai/gpt-4.1-nano",
          apiKey: openaiApiKey,
        },
      },
      executeOptions: {
        instruction: "What is the title of this page?",
      },
    };

    const res = await fetchWithContext<AgentExecuteBody>(endpoint, {
      method: "POST",
      headers,
      body: JSON.stringify(payload),
    });

    assertFetchStatus(
      res,
      HTTP_OK,
      "V3 agent execute with mode: dom and cua: true should succeed",
    );
    assertFetchOk(res.body !== null, "Response body should be parseable", res);
    assertFetchOk(res.body.success, "Response should indicate success", res);
    assertFetchOk(res.body.data !== undefined, "Response should have data", res);
    assertFetchOk(
      res.body.data.result !== undefined,
      "Response should have result",
      res,
    );
  });
});

// =============================================================================
// V3 executionModel Tests - Testing agentConfig.executionModel serialization
// =============================================================================

describe("POST /v1/sessions/:id/agentExecute (V3) - executionModel serialization", () => {
  let sessionId: string;
  const headers = getHeaders("3.0.0");

  /**
   * POSTs one agentExecute request against the shared session and asserts the
   * success contract every test in this suite expects: HTTP 200, a parseable
   * body, truthy `success`, and a defined `data.result`.
   *
   * @param agentConfig - Sent verbatim as the request's `agentConfig`.
   * @param instruction - Sent as `executeOptions.instruction`.
   * @param statusMessage - Failure message for the HTTP status assertion.
   */
  const expectAgentExecuteSuccess = async (
    agentConfig: Record<string, unknown>,
    instruction: string,
    statusMessage: string,
  ): Promise<void> => {
    const ctx = await fetchWithContext<{
      success: boolean;
      data?: { result: unknown; actionId?: string };
    }>(`${getBaseUrl()}/v1/sessions/${sessionId}/agentExecute`, {
      method: "POST",
      headers,
      body: JSON.stringify({
        agentConfig,
        executeOptions: { instruction },
      }),
    });

    assertFetchStatus(ctx, HTTP_OK, statusMessage);
    // Each check narrows the response type for the one that follows.
    assertFetchOk(ctx.body !== null, "Response body should be parseable", ctx);
    assertFetchOk(ctx.body.success, "Response should indicate success", ctx);
    assertFetchOk(
      ctx.body.data !== undefined,
      "Response should have data",
      ctx,
    );
    assertFetchOk(
      ctx.body.data.result !== undefined,
      "Response should have result",
      ctx,
    );
  };

  before(async () => {
    sessionId = await createSession(headers);
  });

  beforeEach(async () => {
    // Navigate to example.com before each test (including first)
    const navResponse = await navigateSession(
      sessionId,
      "https://example.com",
      headers,
    );
    assert.equal(navResponse.status, HTTP_OK, "Navigate should succeed");
  });

  after(async () => {
    // Skip teardown when `before` never produced a session id.
    if (sessionId) {
      await endSession(sessionId, headers);
      sessionId = "";
    }
  });

  it("should execute agent with string executionModel", async () => {
    await expectAgentExecuteSuccess(
      { executionModel: "gpt-4.1-nano" },
      "What is the title of this page?",
      "V3 agent execute with string executionModel should succeed",
    );
  });

  it("should execute agent with object executionModel (modelName and apiKey)", async () => {
    const openaiApiKey = requireEnv("OPENAI_API_KEY", OPENAI_API_KEY);

    await expectAgentExecuteSuccess(
      {
        executionModel: {
          modelName: "openai/gpt-4.1-nano",
          apiKey: openaiApiKey,
        },
      },
      "Describe the main content of this page",
      "V3 agent execute with object executionModel should succeed",
    );
  });

  it("should execute agent with both model and executionModel", async () => {
    const openaiApiKey = requireEnv("OPENAI_API_KEY", OPENAI_API_KEY);

    await expectAgentExecuteSuccess(
      {
        model: {
          modelName: "openai/gpt-4.1-nano",
          apiKey: openaiApiKey,
        },
        executionModel: {
          modelName: "openai/gpt-4.1-nano",
          apiKey: openaiApiKey,
        },
      },
      "What is the title of this page?",
      "V3 agent execute with both model and executionModel should succeed",
    );
  });
});

// =============================================================================
// V3 Mode Tests - Testing agentConfig.mode field (dom, hybrid, cua)
// =============================================================================

describe("POST /v1/sessions/:id/agentExecute - agentConfig.mode (V3)", () => {
  let sessionId: string;
  const headers = getHeaders("3.0.0");

  /**
   * POSTs one agentExecute request against the shared session and asserts the
   * success contract shared by every mode test: HTTP 200, a parseable body,
   * truthy `success`, and a defined `data.result`.
   *
   * @param agentConfig - Sent verbatim as the request's `agentConfig`.
   * @param instruction - Sent as `executeOptions.instruction`.
   * @param statusMessage - Failure message for the HTTP status assertion.
   */
  const expectAgentExecuteSuccess = async (
    agentConfig: Record<string, unknown>,
    instruction: string,
    statusMessage: string,
  ): Promise<void> => {
    const ctx = await fetchWithContext<{
      success: boolean;
      data?: { result: unknown; actionId?: string };
    }>(`${getBaseUrl()}/v1/sessions/${sessionId}/agentExecute`, {
      method: "POST",
      headers,
      body: JSON.stringify({
        agentConfig,
        executeOptions: { instruction },
      }),
    });

    assertFetchStatus(ctx, HTTP_OK, statusMessage);
    // Each check narrows the response type for the one that follows.
    assertFetchOk(ctx.body !== null, "Response body should be parseable", ctx);
    assertFetchOk(ctx.body.success, "Response should indicate success", ctx);
    assertFetchOk(
      ctx.body.data !== undefined,
      "Response should have data",
      ctx,
    );
    assertFetchOk(
      ctx.body.data.result !== undefined,
      "Response should have result",
      ctx,
    );
  };

  before(async () => {
    sessionId = await createSession(headers);
  });

  beforeEach(async () => {
    // Navigate to example.com before each test (including first)
    const navResponse = await navigateSession(
      sessionId,
      "https://example.com",
      headers,
    );
    assert.equal(navResponse.status, HTTP_OK, "Navigate should succeed");
  });

  after(async () => {
    // Skip teardown when `before` never produced a session id.
    if (sessionId) {
      await endSession(sessionId, headers);
      sessionId = "";
    }
  });

  it("should execute agent with mode: dom", async () => {
    await expectAgentExecuteSuccess(
      { mode: "dom" },
      "What is the title of this page?",
      "V3 agent execute with mode: dom should succeed",
    );
  });

  it("should execute agent with mode: hybrid", async () => {
    const geminiApiKey = requireEnv("GEMINI_API_KEY", GEMINI_API_KEY);

    await expectAgentExecuteSuccess(
      {
        mode: "hybrid",
        model: {
          provider: "google", // bonus: test split provider/modelName format
          modelName: "gemini-2.5-flash-preview-04-17",
          apiKey: geminiApiKey,
        },
      },
      "Describe the main heading on this page",
      "V3 agent execute with mode: hybrid should succeed",
    );
  });

  it("should execute agent with mode: cua and CUA model", async () => {
    const geminiApiKey = requireEnv("GEMINI_API_KEY", GEMINI_API_KEY);

    await expectAgentExecuteSuccess(
      {
        mode: "cua",
        model: {
          modelName: "google/gemini-2.5-computer-use-preview-10-2025",
          apiKey: geminiApiKey,
        },
      },
      "What is visible on this page?",
      "V3 agent execute with mode: cua and CUA model should succeed",
    );
  });
});

// =============================================================================
// SSE Streaming Tests (V3)
// =============================================================================

describe("POST /v1/sessions/:id/agentExecute with SSE streaming (V3)", () => {
  let sessionId: string;
  const headers = getHeaders("3.0.0");

  before(async () => {
    sessionId = await createSession(headers);
  });

  beforeEach(async () => {
    // Navigate to example.com before each test (including first)
    const navResponse = await navigateSession(
      sessionId,
      "https://example.com",
      headers,
    );
    assert.equal(navResponse.status, HTTP_OK, "Navigate should succeed");
  });

  after(async () => {
    // Skip teardown when `before` never produced a session id.
    if (sessionId) {
      await endSession(sessionId, headers);
      sessionId = "";
    }
  });

  // Requests a streamed agentExecute and checks three things about the SSE
  // events: starting -> connected -> finished ordering, that the starting and
  // finished events are "system" events (finished carrying a result), and
  // that every event id matches the UUID pattern.
  it("should stream SSE events with valid structure, sequence, and UUIDs", async () => {
    const url = getBaseUrl();

    const response = await fetch(
      `${url}/v1/sessions/${sessionId}/agentExecute`,
      {
        method: "POST",
        headers,
        body: JSON.stringify({
          agentConfig: {},
          executeOptions: {
            instruction: "Describe the main content on the page",
          },
          streamResponse: true,
        }),
      },
    );

    const ctx = await readTypedSSEStreamWithContext(response);

    // Verify event count. The sequence checks below require three distinct
    // events (starting < connected < finished), so fewer than three can
    // never pass; fail early with a message that says so.
    assertWithContext(
      ctx.events.length >= 3,
      "Should have at least starting, connected, and finished events",
      ctx,
    );

    // Verify event sequence
    const indexOfStatus = (status: string): number =>
      ctx.events.findIndex((e) => e.data.status === status);

    const startingIndex = indexOfStatus("starting");
    const connectedIndex = indexOfStatus("connected");
    const finishedIndex = indexOfStatus("finished");

    assertWithContext(
      startingIndex !== -1,
      "Should have a starting event",
      ctx,
    );
    assertWithContext(
      connectedIndex !== -1,
      "Should have a connected event",
      ctx,
    );
    assertWithContext(
      finishedIndex !== -1,
      "Should have a finished event",
      ctx,
    );
    assertWithContext(
      startingIndex < connectedIndex,
      "Starting event must come before connected event",
      ctx,
    );
    assertWithContext(
      connectedIndex < finishedIndex,
      "Connected event must come before finished event",
      ctx,
    );

    // Verify event types
    const startingEvent = ctx.events[startingIndex];
    const finishedEvent = ctx.events[finishedIndex];

    // Indexed access can be typed as possibly undefined; these checks narrow
    // both events before their fields are read.
    assertWithContext(
      startingEvent !== undefined,
      "Starting event should exist",
      ctx,
    );
    assertWithContext(
      finishedEvent !== undefined,
      "Finished event should exist",
      ctx,
    );
    assertWithContext(
      startingEvent.type === "system",
      "Starting event should be system type",
      ctx,
    );
    assertWithContext(
      finishedEvent.type === "system",
      "Finished event should be system type",
      ctx,
    );
    assertWithContext(
      finishedEvent.data.result !== undefined,
      "Finished event must have result",
      ctx,
    );

    // Verify UUID format
    const uuidRegex =
      /^[0-9a-f]{8}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{12}$/i;

    for (const event of ctx.events) {
      assertWithContext(
        uuidRegex.test(event.id),
        `Event id should be a valid UUID format, got: ${event.id}`,
        ctx,
      );
    }
  });
});

// =============================================================================
// Validation Error Tests (V3)
// =============================================================================

describe("POST /v1/sessions/:id/agentExecute - validation errors (V3)", () => {
  let sessionId: string;
  const headers = getHeaders("3.0.0");

  /**
   * POSTs `payload` to agentExecute for the shared session and asserts the
   * rejection contract shared by every test here: HTTP 400, and a body that
   * either lacks a truthy `success` or carries an `error` field.
   *
   * @param payload - Request body, serialized as-is with JSON.stringify.
   */
  const expectBadRequest = async (
    payload: Record<string, unknown>,
  ): Promise<void> => {
    const ctx = await fetchWithContext<{
      success?: boolean;
      error?: string;
      message?: string;
    }>(`${getBaseUrl()}/v1/sessions/${sessionId}/agentExecute`, {
      method: "POST",
      headers,
      body: JSON.stringify(payload),
    });

    assertFetchStatus(ctx, HTTP_BAD_REQUEST);
    assertFetchOk(
      !ctx.body?.success || ctx.body.error !== undefined,
      "Response should indicate failure",
      ctx,
    );
  };

  before(async () => {
    sessionId = await createSession(headers);
  });

  beforeEach(async () => {
    // Navigate to example.com before each test (including first)
    const navResponse = await navigateSession(
      sessionId,
      "https://example.com",
      headers,
    );
    assert.equal(navResponse.status, HTTP_OK, "Navigate should succeed");
  });

  after(async () => {
    // Skip teardown when `before` never produced a session id.
    if (sessionId) {
      await endSession(sessionId, headers);
      sessionId = "";
    }
  });

  it("should return 400 when agentConfig is missing", async () => {
    await expectBadRequest({
      executeOptions: {
        instruction: "Do something",
      },
    });
  });

  it("should return 400 when executeOptions is missing", async () => {
    await expectBadRequest({
      agentConfig: {
        model: {
          modelName: "google/gemini-2.5-computer-use-preview-10-2025",
        },
      },
    });
  });

  it("should return 400 when instruction is missing", async () => {
    await expectBadRequest({
      agentConfig: {
        model: {
          modelName: "google/gemini-2.5-computer-use-preview-10-2025",
        },
      },
      executeOptions: {
        maxSteps: 5,
      },
    });
  });

  it("should return 400 for invalid agentConfig.mode", async () => {
    await expectBadRequest({
      agentConfig: {
        mode: "invalid-mode",
      },
      executeOptions: {
        instruction: "Do something",
      },
    });
  });
});

// =============================================================================
// V3 Format Tests - executeOptions.useSearch and executeOptions.toolTimeout
// =============================================================================

describe("POST /v1/sessions/:id/agentExecute (V3) - useSearch & toolTimeout", () => {
  let sessionId: string;
  const headers = getHeaders("3.0.0");

  /**
   * POSTs an agentExecute request with an empty `agentConfig` and the given
   * `executeOptions`, then asserts HTTP 200, a parseable body, and truthy
   * `success`.
   *
   * @param executeOptions - Sent verbatim as the request's `executeOptions`.
   * @param statusMessage - Failure message for the HTTP status assertion.
   */
  const expectExecuteOptionsAccepted = async (
    executeOptions: Record<string, unknown>,
    statusMessage: string,
  ): Promise<void> => {
    const ctx = await fetchWithContext<{
      success: boolean;
      data?: { result: unknown; actionId?: string };
    }>(`${getBaseUrl()}/v1/sessions/${sessionId}/agentExecute`, {
      method: "POST",
      headers,
      body: JSON.stringify({
        agentConfig: {},
        executeOptions,
      }),
    });

    assertFetchStatus(ctx, HTTP_OK, statusMessage);
    assertFetchOk(ctx.body !== null, "Response body should be parseable", ctx);
    assertFetchOk(ctx.body.success, "Response should indicate success", ctx);
  };

  before(async () => {
    ({ sessionId } = await createSessionWithCdp(headers));
  });

  beforeEach(async () => {
    const navResponse = await navigateSession(
      sessionId,
      "https://example.com",
      headers,
    );
    assert.equal(navResponse.status, HTTP_OK, "Navigate should succeed");
  });

  after(async () => {
    // Skip teardown when `before` never produced a session id.
    if (sessionId) {
      await endSession(sessionId, headers);
      sessionId = "";
    }
  });

  it("should accept executeOptions.useSearch as boolean", async () => {
    await expectExecuteOptionsAccepted(
      {
        instruction: "Describe the main heading on this page",
        useSearch: true,
      },
      "Agent execute with useSearch should succeed",
    );
  });

  it("should accept executeOptions.toolTimeout as number", async () => {
    await expectExecuteOptionsAccepted(
      {
        instruction: "Describe the main heading on this page",
        toolTimeout: 30000,
      },
      "Agent execute with toolTimeout should succeed",
    );
  });

  it("should accept both useSearch and toolTimeout together", async () => {
    await expectExecuteOptionsAccepted(
      {
        instruction: "Describe the main heading on this page",
        useSearch: false,
        toolTimeout: 60000,
      },
      "Agent execute with both options should succeed",
    );
  });
});


================================================
FILE: packages/server-v3/test/integration/v3/end.test.ts
================================================
import { after, before, describe, it } from "node:test";

import assert from "node:assert/strict";

import {
  assertFetchOk,
  assertFetchStatus,
  createSession,
  endSession,
  fetchWithContext,
  getBaseUrl,
  getHeaders,
  HTTP_BAD_REQUEST,
  HTTP_NOT_FOUND,
  HTTP_INTERNAL_SERVER_ERROR,
  HTTP_OK,
} from "../utils.js";

// =============================================================================
// POST /v1/sessions/:id/end (V3 Format)
// =============================================================================

describe("POST /v1/sessions/:id/end (V3)", () => {
  const headers = getHeaders("3.0.0");
  let sessionId: string;

  /**
   * Best-effort teardown for a session. Errors are swallowed on purpose: the
   * session may already have been ended by the request under test, and a
   * cleanup failure must not mask the assertion failure that led here.
   */
  const endSessionQuietly = async (id: string): Promise<void> => {
    try {
      await endSession(id, headers);
    } catch {
      // Ignore - session may already be ended
    }
  };

  before(async () => {
    sessionId = await createSession(headers);
  });

  after(async () => {
    // Try to clean up in case test didn't end the session
    await endSessionQuietly(sessionId);
  });

  it("should return 200 if JSON content-type has an empty body", async () => {
    const url = getBaseUrl();
    // Create a fresh session for this test since we need to test error cases
    const testSessionId = await createSession(headers);

    try {
      const response = await fetch(`${url}/v1/sessions/${testSessionId}/end`, {
        method: "POST",
        headers: {
          ...headers,
          "Content-Type": "application/json",
        },
        body: "",
      });

      // Empty body should be accepted. The raw fetch Response is wrapped in
      // a minimal context object so assertFetchStatus can be reused.
      assertFetchStatus(
        {
          status: response.status,
          statusText: response.statusText,
          body: null,
          raw: "",
          durationMs: 0,
          headers: response.headers,
          debugSummary: () => `HTTP ${response.status}`,
        },
        HTTP_OK,
        "Should return 200 for empty body with JSON content-type",
      );
    } finally {
      // Clean up even when the assertion above fails, so the throwaway
      // session is not leaked.
      await endSessionQuietly(testSessionId);
    }
  });

  it("should return 400 if body contains extra keys", async () => {
    const url = getBaseUrl();
    const testSessionId = await createSession(headers);

    try {
      const ctx = await fetchWithContext<{
        success?: boolean;
        message?: string;
      }>(`${url}/v1/sessions/${testSessionId}/end`, {
        method: "POST",
        headers,
        body: JSON.stringify({ unexpected: true }),
      });

      assertFetchStatus(
        ctx,
        HTTP_BAD_REQUEST,
        "Should return 400 for extra keys",
      );
    } finally {
      // The rejected request is expected to leave the session open; end it
      // whether or not the assertion passed.
      await endSessionQuietly(testSessionId);
    }
  });

  it("should return 200 when body is {}", async () => {
    const url = getBaseUrl();
    const testSessionId = await createSession(headers);

    const ctx = await fetchWithContext<{ success: boolean }>(
      `${url}/v1/sessions/${testSessionId}/end`,
      {
        method: "POST",
        headers,
        body: JSON.stringify({}),
      },
    );

    assertFetchStatus(ctx, HTTP_OK, "Should return 200 for empty object body");
    assertFetchOk(ctx.body !== null, "Should have response body", ctx);
    assertFetchOk(ctx.body.success === true, "Should indicate success", ctx);
  });

  it("should return 200 when body is 0 bytes (no body)", async () => {
    const url = getBaseUrl();
    const testSessionId = await createSession(headers);

    // Send request with no body at all
    // NOTE(review): `headers` is spread unchanged, so any Content-Type that
    // getHeaders() sets is still sent - confirm this matches the intent of
    // the comment below.
    const response = await fetch(`${url}/v1/sessions/${testSessionId}/end`, {
      method: "POST",
      headers: {
        ...headers,
        // Don't set Content-Type to application/json when there's no body
      },
    });

    // Should succeed with 200 for no body
    assert.equal(
      response.status,
      HTTP_OK,
      `Should return 200 for 0-byte body, got ${response.status}`,
    );

    const body = await response.json();
    assert.equal(body.success, true, "Should indicate success");
  });

  // Ends the suite-level session created in `before`.
  it("should end session successfully", async () => {
    const url = getBaseUrl();

    const ctx = await fetchWithContext<{ success: boolean }>(
      `${url}/v1/sessions/${sessionId}/end`,
      {
        method: "POST",
        headers,
        body: JSON.stringify({}),
      },
    );

    assertFetchStatus(ctx, HTTP_OK, "End session should succeed");
    assertFetchOk(ctx.body !== null, "Should have response body", ctx);
    assertFetchOk(ctx.body.success === true, "Should indicate success", ctx);
  });

  it("should return error for non-existent session", async () => {
    const url = getBaseUrl();

    const ctx = await fetchWithContext<{ success?: boolean; message?: string }>(
      `${url}/v1/sessions/non-existent-session-id/end`,
      {
        method: "POST",
        headers,
        body: JSON.stringify({}),
      },
    );

    // Server returns 404 or 500 for non-existent sessions
    assert.ok(
      [HTTP_NOT_FOUND, HTTP_INTERNAL_SERVER_ERROR].includes(ctx.status),
      `Expected 404 or 500, got ${ctx.status}`,
    );

    // A 500 must carry only the generic message.
    if (ctx.status === HTTP_INTERNAL_SERVER_ERROR) {
      assertFetchOk(ctx.body !== null, "Response should have body", ctx);
      assertFetchOk(
        ctx.body.message === "An internal server error occurred",
        "500 responses should return a generic internal error message",
        ctx,
      );
    }
  });
});


================================================
FILE: packages/server-v3/test/integration/v3/extract.test.ts
================================================
import assert from "node:assert/strict";
import { after, before, describe, it } from "node:test";

import {
  assertEventExists,
  assertFetchOk,
  assertFetchStatus,
  assertWithContext,
  createSessionWithCdp,
  endSession,
  fetchWithContext,
  GEMINI_API_KEY,
  getBaseUrl,
  getHeaders,
  getMainFrameId,
  HTTP_OK,
  navigateSession,
  readTypedSSEStreamWithContext,
  requireEnv,
} from "../utils.js";

/**
 * Result type for extract SSE events; used as the type argument to
 * readTypedSSEStreamWithContext in the streaming tests.
 */
type ExtractResult = Record<string, unknown>;

// Shared session for all extract tests (extract is read-only, safe to share).
// Both values are assigned once by the top-level `before` hook.
let sessionId: string;
// CDP URL returned together with the session id; tests pass it to
// getMainFrameId() when they need a frameId for the request.
let cdpUrl: string;

// One-time setup for the whole file: create a session through
// createSessionWithCdp (which also yields its CDP URL), then navigate it to
// example.com so every extract test starts on the same page.
before(async () => {
  const v3Headers = getHeaders("3.0.0");

  const session = await createSessionWithCdp(v3Headers);
  sessionId = session.sessionId;
  cdpUrl = session.cdpUrl;

  const { status } = await navigateSession(
    sessionId,
    "https://example.com",
    v3Headers,
  );
  assert.equal(status, HTTP_OK, "Navigate should succeed");
});

// One-time teardown for the whole file: end the shared session.
after(async () => {
  // If `before` failed before assigning a session id there is nothing to end;
  // calling endSession with an unset id would only add a second error on top
  // of the setup failure.
  if (sessionId) {
    await endSession(sessionId, getHeaders("3.0.0"));
  }
});

// =============================================================================
// POST /v1/sessions/:id/extract - V3 Format Tests
// =============================================================================

describe("POST /v1/sessions/:id/extract (V3)", () => {
  /** Response envelope expected from the non-streaming extract endpoint. */
  interface ExtractResponse {
    success: boolean;
    data?: { result: Record<string, unknown>; actionId?: string };
  }

  /**
   * POSTs `payload` to the extract endpoint of the shared session and asserts
   * the success contract common to every test here: HTTP 200, a body, truthy
   * `success`, truthy `data` and `data.result`, and `typeof result === "object"`.
   *
   * @param payload - Request body, serialized as-is with JSON.stringify.
   * @param statusMessage - Failure message for the HTTP status assertion.
   * @returns The fetch context (for further context-aware assertions) and the
   *   extracted result object.
   */
  const expectExtractSuccess = async (
    payload: Record<string, unknown>,
    statusMessage: string,
  ) => {
    const ctx = await fetchWithContext<ExtractResponse>(
      `${getBaseUrl()}/v1/sessions/${sessionId}/extract`,
      {
        method: "POST",
        headers: getHeaders("3.0.0"),
        body: JSON.stringify(payload),
      },
    );

    assertFetchStatus(ctx, HTTP_OK, statusMessage);
    // Each check narrows the response type for the one that follows.
    assertFetchOk(ctx.body !== null, "Response should have body", ctx);
    assertFetchOk(ctx.body.success, "Response should indicate success", ctx);
    assertFetchOk(!!ctx.body.data, "Response should have data", ctx);
    assertFetchOk(!!ctx.body.data.result, "Response should have result", ctx);
    assert.equal(
      typeof ctx.body.data.result,
      "object",
      "Result should be an object",
    );

    return { ctx, result: ctx.body.data.result };
  };

  it("should extract data with instruction and schema", async () => {
    const frameId = await getMainFrameId(cdpUrl);

    const { ctx, result } = await expectExtractSuccess(
      {
        instruction: "extract the page title",
        schema: {
          type: "object",
          properties: {
            title: { type: "string" },
          },
          required: ["title"],
        },
        frameId,
      },
      "Extract should succeed",
    );

    assertFetchOk("title" in result, "Result should have title property", ctx);
  });

  it("should extract with instruction and options", async () => {
    await expectExtractSuccess(
      {
        instruction: "extract the page title",
        schema: {
          type: "object",
          properties: {
            title: { type: "string" },
          },
        },
        options: {
          timeout: 30000,
        },
      },
      "Extract with options should succeed",
    );
  });

  it("should extract with CSS selector in options", async () => {
    await expectExtractSuccess(
      {
        instruction: "extract the link information",
        schema: {
          type: "object",
          properties: {
            href: { type: "string" },
            text: { type: "string" },
          },
        },
        options: {
          selector: "a", // CSS selector
        },
      },
      "Extract with CSS selector should succeed",
    );
  });

  it("should extract with XPath selector in options", async () => {
    await expectExtractSuccess(
      {
        instruction: "extract the link information",
        schema: {
          type: "object",
          properties: {
            href: { type: "string" },
            text: { type: "string" },
          },
        },
        options: {
          selector: "//a", // XPath selector
        },
      },
      "Extract with XPath selector should succeed",
    );
  });

  it("should extract with instruction only (no schema)", async () => {
    await expectExtractSuccess(
      {
        instruction: "extract the main content from the page",
      },
      "Extract without schema should succeed",
    );
  });

  it("should extract without instruction (extract all)", async () => {
    await expectExtractSuccess(
      {
        options: {
          timeout: 30000,
        },
      },
      "Extract without instruction should succeed",
    );
  });

  it("should extract with google/gemini-2.5-flash-lite model", async () => {
    const geminiApiKey = requireEnv("GEMINI_API_KEY", GEMINI_API_KEY);

    const { ctx, result } = await expectExtractSuccess(
      {
        instruction: "extract the page title",
        schema: {
          type: "object",
          properties: {
            title: { type: "string" },
          },
          required: ["title"],
        },
        options: {
          model: {
            modelName: "google/gemini-2.5-flash-lite",
            apiKey: geminiApiKey,
          },
        },
      },
      "Extract with Gemini model should succeed",
    );

    assertFetchOk("title" in result, "Result should have title property", ctx);
  });
});

// =============================================================================
// SSE Streaming Tests - V3
// =============================================================================

describe("POST /v1/sessions/:id/extract with SSE streaming (V3)", () => {
  // Format every SSE event id is checked against (8-4-4-4-12 hex groups).
  const uuidPattern =
    /^[0-9a-f]{8}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{12}$/i;

  /**
   * Sends a streaming "extract the page title" request for the session
   * identified by `sessionId` and reads the SSE response.
   *
   * @param requireTitle - when true, the schema lists `title` as required.
   * @returns whatever `readTypedSSEStreamWithContext` produces for the response.
   */
  async function streamTitleExtraction(requireTitle: boolean) {
    const endpoint = `${getBaseUrl()}/v1/sessions/${sessionId}/extract`;
    const schema = {
      type: "object",
      properties: {
        title: { type: "string" },
      },
      // Spread keeps `required` out of the JSON entirely when not requested.
      ...(requireTitle ? { required: ["title"] } : {}),
    };

    const response = await fetch(endpoint, {
      method: "POST",
      headers: getHeaders("3.0.0"),
      body: JSON.stringify({
        instruction: "extract the page title",
        schema,
        streamResponse: true,
      }),
    });

    return readTypedSSEStreamWithContext<ExtractResult>(response);
  }

  it("should stream valid SSE events with correct structure", async () => {
    const ctx = await streamTitleExtraction(true);

    assertWithContext(
      ctx.events.length >= 2,
      "Should have at least starting and finished events",
      ctx,
    );

    // The "starting" event must be a system event.
    const starting = assertEventExists(ctx.events, "starting", ctx);
    assert.equal(
      starting.type,
      "system",
      "Starting event should be system type",
    );

    // The "finished" event must be a system event carrying the result object.
    const finished = assertEventExists(ctx.events, "finished", ctx);
    assert.equal(
      finished.type,
      "system",
      "Finished event should be system type",
    );
    assertWithContext(
      !!finished.data.result,
      "Finished event must have result",
      ctx,
    );
    assert.equal(
      typeof finished.data.result,
      "object",
      "Result must be an object",
    );
    assertWithContext(
      "title" in finished.data.result,
      "Result should have title property",
      ctx,
    );
  });

  it("should have correct event sequence: starting -> connected -> finished", async () => {
    const ctx = await streamTitleExtraction(false);
    const { events } = ctx;

    for (const status of ["starting", "connected", "finished"] as const) {
      assertEventExists(events, status, ctx);
    }

    // Position of the first event reporting the given status.
    const positionOf = (status: string): number =>
      events.findIndex((event) => event.data.status === status);

    const startingAt = positionOf("starting");
    const connectedAt = positionOf("connected");
    const finishedAt = positionOf("finished");

    assertWithContext(
      startingAt < connectedAt,
      "Starting event must come before connected event",
      ctx,
    );
    assertWithContext(
      connectedAt < finishedAt,
      "Connected event must come before finished event",
      ctx,
    );
  });

  it("should have valid UUID for each event id", async () => {
    const ctx = await streamTitleExtraction(false);

    for (const { id } of ctx.events) {
      assertWithContext(
        uuidPattern.test(id),
        `Event id should be a valid UUID format, got: ${id}`,
        ctx,
      );
    }
  });

  it("should extract data matching the provided schema", async () => {
    const ctx = await streamTitleExtraction(true);

    const finished = assertEventExists(ctx.events, "finished", ctx);
    assertWithContext(!!finished.data.result, "Should have result", ctx);

    // The schema asked for a string `title`; check the extracted value's type.
    assert.equal(
      typeof finished.data.result.title,
      "string",
      "Extracted title should be a string",
    );
  });
});


================================================
FILE: packages/server-v3/test/integration/v3/multiRegion.test.ts
================================================
import { describe, it } from "node:test";

import {
  assertFetchOk,
  assertFetchStatus,
  endSession,
  fetchWithContext,
  getBaseUrl,
  getHeaders,
  HTTP_OK,
  LOCAL_BROWSER_BODY,
} from "../utils.js";

// =============================================================================
// Response Type Definitions
// =============================================================================

/** Body returned by `/v1/sessions/start` when a session was created. */
interface StartSuccessResponse {
  success: true;
  data: {
    sessionId: string;
    cdpUrl: string;
    available: boolean;
  };
}

/** Body returned by `/v1/sessions/start` when the request failed. */
interface StartErrorResponse {
  success: false;
  message: string;
}

type StartResponse = StartSuccessResponse | StartErrorResponse;

/**
 * Type guard for a start response that actually carries a session.
 *
 * Returns true only when `success` is truthy and `data.sessionId` is a
 * string. A body with `success: true` but a missing `data` object, or a
 * `null`/absent `sessionId`, yields false instead of throwing or being
 * accepted.
 *
 * @param response - response body typed as a start response.
 * @returns whether `response` can be treated as `StartSuccessResponse`.
 */
function isSuccessResponse(
  response: StartResponse,
): response is StartSuccessResponse {
  if (!response.success) {
    return false;
  }
  // NOTE(review): the body presumably originates from a network payload, so
  // the declared type is not guaranteed at runtime; probe `data` defensively.
  const data: { sessionId?: unknown } | undefined = response.data;
  return typeof data?.sessionId === "string";
}

// =============================================================================
// Multi-Region Integration Tests
// =============================================================================
// These tests verify that the API client correctly handles multi-region
// configuration. Prior to the multi-region feature, non-us-west-2 regions
// would be rejected with { available: false }. Now all supported regions
// are accepted.
// =============================================================================

describe("POST /v1/sessions/start - Multi-region support", () => {
  const headers = getHeaders("3.0.0");
  const localBrowser = LOCAL_BROWSER_BODY;

  /**
   * Starts a session and verifies it came up.
   *
   * The request body is `modelName`, then `extraFields`, then the
   * local-browser fields (in that order). The response must be a 200 success
   * response reporting an available session with a session id. The session
   * is ended afterwards whether or not those last two assertions pass.
   *
   * @param extraFields - additional top-level request fields for this case.
   */
  async function expectAvailableSession(
    extraFields: Record<string, unknown>,
  ): Promise<void> {
    const ctx = await fetchWithContext<StartResponse>(
      `${getBaseUrl()}/v1/sessions/start`,
      {
        method: "POST",
        headers,
        body: JSON.stringify({
          modelName: "gpt-4.1-nano",
          ...extraFields,
          ...localBrowser,
        }),
      },
    );

    assertFetchStatus(ctx, HTTP_OK, "Request should succeed");
    assertFetchOk(ctx.body !== null, "Should have response body", ctx);
    assertFetchOk(
      isSuccessResponse(ctx.body),
      "Should be a success response",
      ctx,
    );

    const { data } = ctx.body;
    try {
      assertFetchOk(data.available, "Session should be available", ctx);
      assertFetchOk(!!data.sessionId, "Should have sessionId", ctx);
    } finally {
      await endSession(data.sessionId, headers);
    }
  }

  it("should start session with us-west-2 region (default)", async () => {
    await expectAvailableSession({
      browserbaseSessionCreateParams: { region: "us-west-2" },
    });
  });

  it("should start session with us-east-1 region", async () => {
    // This test verifies that non-us-west-2 regions are now accepted.
    // Previously, this would have returned { available: false }.
    await expectAvailableSession({
      browserbaseSessionCreateParams: { region: "us-east-1" },
    });
  });

  it("should start session with eu-central-1 region", async () => {
    await expectAvailableSession({
      browserbaseSessionCreateParams: { region: "eu-central-1" },
    });
  });

  it("should start session with ap-southeast-1 region", async () => {
    await expectAvailableSession({
      browserbaseSessionCreateParams: { region: "ap-southeast-1" },
    });
  });

  it("should start session without region (defaults to us-west-2)", async () => {
    await expectAvailableSession({ browserbaseSessionCreateParams: {} });
  });

  it("should start session without browserbaseSessionCreateParams", async () => {
    await expectAvailableSession({});
  });
});


================================================
FILE: packages/server-v3/test/integration/v3/navigate.test.ts
================================================
import assert from "node:assert/strict";
import { after, before, describe, it } from "node:test";

import { chromium } from "playwright";

import {
  assertFetchOk,
  assertFetchStatus,
  createSessionWithCdp,
  endSession,
  fetchWithContext,
  getBaseUrl,
  getHeaders,
  HTTP_BAD_REQUEST,
  HTTP_OK,
} from "../utils.js";

// =============================================================================
// POST /v1/sessions/:id/navigate (V3 Format)
// =============================================================================

describe("POST /v1/sessions/:id/navigate (V3)", () => {
  // Session created once in `before` and reused by every test in this suite.
  let sessionId: string;
  let cdpUrl: string;

  /** Response body inspected by the successful-navigation tests. */
  type NavigateResponse = {
    success: boolean;
    data?: { result: unknown; actionId?: string };
  };

  before(async () => {
    ({ sessionId, cdpUrl } = await createSessionWithCdp(getHeaders("3.0.0")));
  });

  after(async () => {
    await endSession(sessionId, getHeaders("3.0.0"));
  });

  it("should navigate to a URL successfully and verify via CDP", async () => {
    const url = getBaseUrl();

    const ctx = await fetchWithContext<NavigateResponse>(
      `${url}/v1/sessions/${sessionId}/navigate`,
      {
        method: "POST",
        headers: getHeaders("3.0.0"),
        body: JSON.stringify({ url: "https://example.com", frameId: "" }),
      },
    );

    assertFetchStatus(ctx, HTTP_OK, "Navigate should succeed");
    assertFetchOk(ctx.body !== null, "Response should have body", ctx);
    assertFetchOk(ctx.body.success, "Response should indicate success", ctx);
    assertFetchOk(
      ctx.body.data !== undefined,
      "Response should have data",
      ctx,
    );
    assertFetchOk(
      typeof ctx.body.data.actionId === "string",
      "Response should have actionId",
      ctx,
    );

    // Verify navigation via CDP
    const browser = await chromium.connectOverCDP(cdpUrl);
    try {
      const contexts = browser.contexts();
      assert.ok(
        contexts.length > 0,
        "Should have at least one browser context",
      );
      const pages = contexts[0]!.pages();
      assert.ok(pages.length > 0, "Should have at least one page");
      const page = pages[0]!;
      // Best-effort waits: a timeout here is ignored on purpose because the
      // URL assertion below is the actual check.
      await page
        .waitForLoadState("domcontentloaded", { timeout: 15_000 })
        .catch(() => {});
      await page
        .waitForURL("**example.com**", { timeout: 15_000 })
        .catch(() => {});
      const pageUrl = page.url();
      assert.ok(
        pageUrl.includes("example.com"),
        `Page URL should be example.com, got: ${pageUrl}`,
      );
    } finally {
      // Release the CDP connection even when an assertion above throws, so a
      // failing test does not leave the connection open.
      await browser.close();
    }
  });

  it("should navigate with options", async () => {
    const url = getBaseUrl();

    const ctx = await fetchWithContext<NavigateResponse>(
      `${url}/v1/sessions/${sessionId}/navigate`,
      {
        method: "POST",
        headers: getHeaders("3.0.0"),
        body: JSON.stringify({
          url: "https://example.com",
          frameId: "",
          options: {
            waitUntil: "networkidle",
            timeout: 30000,
          },
        }),
      },
    );

    assertFetchStatus(ctx, HTTP_OK, "Navigate with options should succeed");
    assertFetchOk(ctx.body !== null, "Response should have body", ctx);
    assertFetchOk(ctx.body.success, "Response should indicate success", ctx);
    assertFetchOk(
      ctx.body.data !== undefined,
      "Response should have data",
      ctx,
    );
    assertFetchOk(
      typeof ctx.body.data.actionId === "string",
      "Response should have actionId",
      ctx,
    );
  });

  // ===========================================================================
  // Validation Tests
  // ===========================================================================

  it("should return 400 when url is missing", async () => {
    const url = getBaseUrl();

    const ctx = await fetchWithContext<{
      success?: boolean;
      message?: string;
      error?: string;
    }>(`${url}/v1/sessions/${sessionId}/navigate`, {
      method: "POST",
      headers: getHeaders("3.0.0"),
      body: JSON.stringify({ frameId: "" }), // Missing url
    });

    assertFetchStatus(ctx, HTTP_BAD_REQUEST);
    assertFetchOk(ctx.body !== null, "Response should have body", ctx);
    // Fastify validation errors may have different format than our custom errors
    assertFetchOk(
      !ctx.body.success ||
        ctx.body.error !== undefined ||
        ctx.body.message !== undefined,
      "Response should indicate failure",
      ctx,
    );
  });
});


================================================
FILE: packages/server-v3/test/integration/v3/observe.test.ts
================================================
import assert from "node:assert/strict";
import { after, before, describe, it } from "node:test";

import {
  assertEventExists,
  assertFetchOk,
  assertFetchStatus,
  assertWithContext,
  createSessionWithCdp,
  endSession,
  fetchWithContext,
  GEMINI_API_KEY,
  getBaseUrl,
  getHeaders,
  getMainFrameId,
  HTTP_OK,
  navigateSession,
  readTypedSSEStreamWithContext,
  requireEnv,
} from "../utils.js";

/** Result type carried by observe SSE events. */
type ObserveResult = unknown[];

// A single session serves every observe test in this file (observe is
// read-only, so sharing it is safe).
let sessionId: string;
let cdpUrl: string;

before(async () => {
  const session = await createSessionWithCdp(getHeaders("3.0.0"));
  sessionId = session.sessionId;
  cdpUrl = session.cdpUrl;

  // Load a page up front so the tests have something to observe.
  const { status } = await navigateSession(
    sessionId,
    "https://example.com",
    getHeaders("3.0.0"),
  );
  assert.equal(status, HTTP_OK, "Navigate should succeed");
});

after(async () => {
  const headers = getHeaders("3.0.0");
  await endSession(sessionId, headers);
});

// =============================================================================
// POST /v1/sessions/:id/observe - V3 Format Tests
// =============================================================================

describe("POST /v1/sessions/:id/observe (V3)", () => {
  /** Body of a non-streaming observe response. */
  interface ObserveResponse {
    success: boolean;
    data?: { result: unknown[]; actionId?: string };
  }

  /**
   * POSTs `payload` to the observe endpoint of the session identified by
   * `sessionId` and asserts a 200 success response whose `data.result` is an
   * array.
   *
   * @param payload - JSON body of the observe request.
   * @param statusMessage - message used by the HTTP status assertion.
   * @param headers - request headers; defaults to `getHeaders("3.0.0")`.
   */
  async function expectObservedElements(
    payload: Record<string, unknown>,
    statusMessage: string,
    headers = getHeaders("3.0.0"),
  ): Promise<void> {
    const ctx = await fetchWithContext<ObserveResponse>(
      `${getBaseUrl()}/v1/sessions/${sessionId}/observe`,
      {
        method: "POST",
        headers,
        body: JSON.stringify(payload),
      },
    );

    assertFetchStatus(ctx, HTTP_OK, statusMessage);
    assertFetchOk(ctx.body !== null, "Response body should be parseable", ctx);
    assertFetchOk(ctx.body.success, "Response should indicate success", ctx);
    assertFetchOk(
      ctx.body.data !== undefined,
      "Response should have data",
      ctx,
    );
    assertFetchOk(
      Array.isArray(ctx.body.data.result),
      "Result should be an array of observed elements",
      ctx,
    );
  }

  it("should observe elements with instruction", async () => {
    const frameId = await getMainFrameId(cdpUrl);

    await expectObservedElements(
      { instruction: "Find any link on the page", frameId },
      "Observe should succeed",
    );
  });

  it("should observe with instruction and options", async () => {
    await expectObservedElements(
      {
        instruction: "Find any link on the page",
        options: {
          timeout: 30000,
        },
      },
      "Observe with options should succeed",
    );
  });

  it("should observe with selector option", async () => {
    await expectObservedElements(
      {
        instruction: "Find any link on the page",
        options: {
          selector: "a",
        },
      },
      "Observe with selector should succeed",
    );
  });

  it("should observe without instruction (observe all)", async () => {
    await expectObservedElements(
      {
        options: {
          timeout: 30000,
        },
      },
      "Observe without instruction should succeed",
    );
  });

  it("should observe with google/gemini-2.5-flash-lite model", async () => {
    const geminiApiKey = requireEnv("GEMINI_API_KEY", GEMINI_API_KEY);

    await expectObservedElements(
      {
        instruction: "Find any link on the page",
        options: {
          model: {
            modelName: "google/gemini-2.5-flash-lite",
            apiKey: geminiApiKey,
          },
        },
      },
      "Observe with google/gemini-2.5-flash-lite model should succeed",
      {
        ...getHeaders("3.0.0"),
        "x-model-api-key": "", // Clear the header to ensure body config is used
      },
    );
  });
});

// =============================================================================
// SSE Streaming Tests - V3
// =============================================================================

describe("POST /v1/sessions/:id/observe with SSE streaming (V3)", () => {
  // Format every SSE event id is checked against (8-4-4-4-12 hex groups).
  const uuidPattern =
    /^[0-9a-f]{8}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{12}$/i;

  /**
   * Sends the streaming observe request shared by all tests in this suite and
   * reads the SSE response.
   *
   * @returns whatever `readTypedSSEStreamWithContext` produces for the response.
   */
  async function streamObserve() {
    const endpoint = `${getBaseUrl()}/v1/sessions/${sessionId}/observe`;
    const response = await fetch(endpoint, {
      method: "POST",
      headers: getHeaders("3.0.0"),
      body: JSON.stringify({
        instruction: "Find any link on the page",
        streamResponse: true,
      }),
    });

    return readTypedSSEStreamWithContext<ObserveResult>(response);
  }

  it("should stream valid SSE events with correct structure", async () => {
    const ctx = await streamObserve();

    assertWithContext(
      ctx.events.length >= 2,
      "Should have at least starting and finished events",
      ctx,
    );

    // The "starting" event must be a system event.
    const starting = assertEventExists(ctx.events, "starting", ctx);
    assertWithContext(
      starting.type === "system",
      "Starting event should be system type",
      ctx,
    );

    // The "finished" event must be a system event carrying an array result.
    const finished = assertEventExists(ctx.events, "finished", ctx);
    assertWithContext(
      finished.type === "system",
      "Finished event should be system type",
      ctx,
    );
    assertWithContext(
      !!finished.data.result,
      "Finished event must have result",
      ctx,
    );
    assertWithContext(
      Array.isArray(finished.data.result),
      "Result must be an array of observed elements",
      ctx,
    );
  });

  it("should have correct event sequence: starting -> connected -> finished", async () => {
    const ctx = await streamObserve();
    const { events } = ctx;

    for (const status of ["starting", "connected", "finished"] as const) {
      assertEventExists(events, status, ctx);
    }

    // Position of the first event reporting the given status.
    const positionOf = (status: string): number =>
      events.findIndex((event) => event.data.status === status);

    const startingAt = positionOf("starting");
    const connectedAt = positionOf("connected");
    const finishedAt = positionOf("finished");

    assertWithContext(
      startingAt < connectedAt,
      "Starting event must come before connected event",
      ctx,
    );
    assertWithContext(
      connectedAt < finishedAt,
      "Connected event must come before finished event",
      ctx,
    );
  });

  it("should have valid UUID for each event id", async () => {
    const ctx = await streamObserve();

    for (const { id } of ctx.events) {
      assertWithContext(
        uuidPattern.test(id),
        `Event id should be a valid UUID format, got: ${id}`,
        ctx,
      );
    }
  });

  it("should return observed elements with expected properties", async () => {
    const ctx = await streamObserve();

    const finished = assertEventExists(ctx.events, "finished", ctx);
    assertWithContext(!!finished.data.result, "Should have result", ctx);
    assertWithContext(
      Array.isArray(finished.data.result),
      "Result should be an array",
      ctx,
    );

    // An empty result is acceptable; the shape is only checked when at least
    // one element was observed.
    if (finished.data.result.length === 0) {
      return;
    }

    const first = finished.data.result[0] as Record<string, unknown>;
    assertWithContext(
      typeof first === "object",
      "Each observed element should be an object",
      ctx,
    );
    // Observed elements typically have selector and description
    const hasKnownKey = "selector" in first || "description" in first;
    assertWithContext(
      hasKnownKey,
      "Observed element should have selector or description",
      ctx,
    );
  });
});


================================================
FILE: packages/server-v3/test/integration/v3/replay.test.ts
================================================
import { describe, it } from "node:test";
import { Api } from "@browserbasehq/stagehand";

import {
  assertFetchOk,
  assertFetchStatus,
  fetchWithContext,
  getBaseUrl,
  getHeaders,
  HTTP_OK,
} from "../utils.js";

describe("GET /v1/sessions/:id/replay (V3)", () => {
  it("should return an empty replay result for local server", async () => {
    const endpoint = `${getBaseUrl()}/v1/sessions/test-session-id/replay`;

    const ctx = await fetchWithContext<unknown>(endpoint, {
      method: "GET",
      headers: getHeaders("3.0.0"),
    });

    assertFetchStatus(ctx, HTTP_OK, "Replay should return 200");
    assertFetchOk(ctx.body !== null, "Response should have body", ctx);

    // Validate the untyped body against the published replay schema.
    const parsed = Api.ReplayResponseSchema.safeParse(ctx.body);
    assertFetchOk(parsed.success, "Replay response should match schema", ctx);
    if (!parsed.success) {
      // NOTE(review): presumably kept so the compiler narrows `parsed` to the
      // success variant below — confirm against assertFetchOk's signature.
      return;
    }

    const replay = parsed.data;
    assertFetchOk(replay.success, "Response should indicate success", ctx);
    assertFetchOk(
      replay.data !== undefined,
      "Response should include data",
      ctx,
    );
    assertFetchOk(
      Array.isArray(replay.data.pages),
      "Replay pages should be an array",
      ctx,
    );
    assertFetchOk(
      replay.data.pages.length === 0,
      "Replay pages should be empty on local server",
      ctx,
    );
  });
});


================================================
FILE: packages/server-v3/test/integration/v3/start.test.ts
================================================
import { spawn } from "node:child_process";
import { execFileSync } from "node:child_process";
import type { ChildProcessWithoutNullStreams } from "node:child_process";
import net from "node:net";
import { fileURLToPath } from "node:url";
import assert from "node:assert/strict";
import { afterEach, describe, it } from "node:test";
import Browserbase from "@browserbasehq/sdk";
import { chromium } from "playwright";

import {
  assertFetchOk,
  assertFetchStatus,
  endSession,
  fetchWithContext,
  getBaseUrl,
  getHeaders,
  LOCAL_BROWSER_BODY,
  HTTP_BAD_REQUEST,
  HTTP_OK,
} from "../utils.js";
import type { BrowserbaseRegion } from "@browserbasehq/stagehand";

// =============================================================================
// Response Type Definitions
// =============================================================================

interface StartSuccessResponse {
  success: true;
  data: {
    sessionId: string;
    cdpUrl: string;
    available: boolean;
  };
}

interface StartUnavailableResponse {
  success: true;
  data: {
    sessionId: null;
    available: false;
  };
}

/** Start-response body for a failed request: `success: false` plus a `message`. */
interface StartErrorResponse {
  success: false;
  message: string;
}

/** Union of every body shape these tests type the start endpoint's response as. */
type StartResponse =
  | StartSuccessResponse
  | StartUnavailableResponse
  | StartErrorResponse;

/**
 * Type guard that narrows a start response to the variant carrying a session.
 *
 * @param response - Parsed body of a start request.
 * @returns `true` only when `success` is set and `data.sessionId` is not `null`.
 */
function isSuccessResponse(
  response: StartResponse,
): response is StartSuccessResponse {
  if (!response.success) {
    return false;
  }
  const { sessionId } = response.data;
  return sessionId !== null;
}

/**
 * Handle for one SEA server process spawned by a test.
 * - `proc`: the spawned child process.
 * - `baseUrl`: HTTP origin the server was told to listen on.
 * - `logs`: trimmed stdout/stderr chunks collected while the process runs.
 */
type SeaHandle = {
  proc: ChildProcessWithoutNullStreams;
  baseUrl: string;
  logs: string[];
};

/**
 * A supervisor process discovered in the process table.
 * - `pid`: PID of the supervisor itself.
 * - `args`: its full command line as reported by `ps`.
 * - `chromePid`: the `pid` field of its `--supervisor-config` JSON, when that is a finite number.
 */
type SupervisorInfo = {
  pid: number;
  args: string;
  chromePid?: number;
};

// Repository root, derived from this file's own location: everything that
// precedes the "/packages/server-v3/" segment (backslashes normalised to "/").
const repoRoot = (() => {
  const marker = "/packages/server-v3/";
  const thisFile = fileURLToPath(import.meta.url).replaceAll("\\", "/");
  const markerAt = thisFile.indexOf(marker);
  if (markerAt === -1) {
    throw new Error(`Unable to determine repo root from ${thisFile}`);
  }
  return thisFile.slice(0, markerAt);
})();

// File name of the SEA binary for the current platform/arch (".exe" on Windows).
const defaultSeaBinaryName =
  ["stagehand-server-v3", process.platform, process.arch].join("-") +
  (process.platform === "win32" ? ".exe" : "");
// Path of the binary under test; SEA_BINARY_NAME overrides the default file name.
const seaBinaryPath = [
  repoRoot,
  "packages/server-v3/dist/sea",
  process.env.SEA_BINARY_NAME ?? defaultSeaBinaryName,
].join("/");
// Browserbase credentials read from the environment (either may be undefined).
const { BROWSERBASE_API_KEY: bbApiKey, BROWSERBASE_PROJECT_ID: bbProjectId } =
  process.env;
// SEA servers started by the running test; drained by the afterEach hook.
const activeSea = new Set<SeaHandle>();

// After every test: stop each SEA server that is still registered (in parallel)
// and drop its handle from the registry once it has been stopped.
afterEach(async () => {
  const stopAndForget = async (handle: SeaHandle): Promise<void> => {
    await stopSeaServer(handle);
    activeSea.delete(handle);
  };
  const pending = Array.from(activeSea, (handle) => stopAndForget(handle));
  await Promise.all(pending);
});

/**
 * Promise-based delay.
 *
 * @param ms - Delay in milliseconds, passed straight to `setTimeout`.
 * @returns A promise that resolves (with no value) once the timer fires.
 */
function sleep(ms: number): Promise<void> {
  return new Promise<void>((done) => {
    setTimeout(done, ms);
  });
}

/**
 * Asks the OS for an unused TCP port on 127.0.0.1 by binding a throwaway
 * server to port 0, reading the assigned port and closing the server again.
 *
 * @returns The port number that was assigned to the temporary server.
 * @throws If the server errors, reports no usable address, or fails to close.
 */
async function getFreePort(): Promise<number> {
  return await new Promise<number>((resolve, reject) => {
    const probe = net.createServer();
    probe.on("error", reject);
    probe.listen(0, "127.0.0.1", () => {
      const address = probe.address();
      if (address !== null && typeof address !== "string") {
        const freePort = address.port;
        // Only hand the port out once the probe has released it.
        probe.close((closeError) => {
          if (closeError) {
            reject(closeError);
          } else {
            resolve(freePort);
          }
        });
        return;
      }
      reject(new Error("Failed to allocate an ephemeral port"));
    });
  });
}

/**
 * Snapshots the process table by running `ps -axo pid=,args=`.
 *
 * @returns One `{ pid, args }` entry per non-empty output line whose leading
 *   token parses to a finite, positive PID; `args` is the rest of the line
 *   after the first space ("" when the line holds only a PID).
 */
function listProcesses(): Array<{ pid: number; args: string }> {
  const raw = execFileSync("ps", ["-axo", "pid=,args="], {
    encoding: "utf8",
  });
  const processes: Array<{ pid: number; args: string }> = [];
  for (const rawLine of raw.split("\n")) {
    const line = rawLine.trim();
    if (line === "") continue;

    // The first space separates the PID column from the command line.
    const gap = line.indexOf(" ");
    const pid = Number(gap === -1 ? line : line.slice(0, gap));
    if (!Number.isFinite(pid) || pid <= 0) continue;

    processes.push({ pid, args: gap === -1 ? "" : line.slice(gap + 1) });
  }
  return processes;
}

/**
 * Extracts the JSON payload of a `--supervisor-config=` argument from a
 * process command line.
 *
 * Everything after the prefix (trimmed) is parsed as JSON. The result is only
 * returned when it is a plain JSON object; primitives, arrays and `null` are
 * rejected so callers never receive a non-object typed as a config. The types
 * of individual fields are not validated here.
 *
 * @param args - Full command line of a process.
 * @returns The parsed config object, or `null` when the argument is absent,
 *   empty, not valid JSON, or not a JSON object.
 */
function parseSupervisorConfigArg(args: string): {
  kind?: string;
  pid?: number;
  parentPid?: number;
} | null {
  const prefix = "--supervisor-config=";
  const index = args.indexOf(prefix);
  if (index === -1) return null;
  const raw = args.slice(index + prefix.length).trim();
  if (!raw) return null;

  let parsed: unknown;
  try {
    parsed = JSON.parse(raw);
  } catch {
    return null;
  }

  // JSON.parse happily returns numbers, strings, arrays and null; none of
  // those is a supervisor config.
  if (typeof parsed !== "object" || parsed === null || Array.isArray(parsed)) {
    return null;
  }
  return parsed as {
    kind?: string;
    pid?: number;
    parentPid?: number;
  };
}

/**
 * Scans the process table for a supervisor whose `--supervisor-config` JSON
 * has `kind === "LOCAL"` and the given `parentPid`.
 *
 * @param parentPid - PID the supervisor's config must name as its parent.
 * @returns The matching process with the highest PID, or `null` when there is
 *   none. `chromePid` is the config's `pid` field when it is a finite number.
 */
function findLocalSupervisorByParentPid(
  parentPid: number,
): SupervisorInfo | null {
  let newest: { pid: number; args: string; configPid: unknown } | null = null;

  for (const proc of listProcesses()) {
    const config = parseSupervisorConfigArg(proc.args);
    if (config?.kind !== "LOCAL" || config.parentPid !== parentPid) continue;
    // Keep only the candidate with the largest PID.
    if (newest === null || proc.pid > newest.pid) {
      newest = { pid: proc.pid, args: proc.args, configPid: config.pid };
    }
  }

  if (newest === null) return null;

  const { pid, args, configPid } = newest;
  const hasChromePid =
    typeof configPid === "number" && Number.isFinite(configPid);
  return {
    pid,
    args,
    chromePid: hasChromePid ? (configPid as number) : undefined,
  };
}

/**
 * Probes a PID with signal 0, which checks for existence without delivering
 * a signal.
 *
 * @param pid - Process ID to probe.
 * @returns `false` only when the probe fails with `ESRCH`; any other outcome
 *   (success or a different error code) is reported as alive.
 */
function isPidAlive(pid: number): boolean {
  try {
    process.kill(pid, 0);
  } catch (error) {
    const { code } = error as NodeJS.ErrnoException;
    return code !== "ESRCH";
  }
  return true;
}

/**
 * Polls `read` until it yields something other than `null`.
 *
 * @param read - Synchronous probe; `null` means "not available yet".
 * @param timeoutMs - Polling budget in milliseconds.
 * @param intervalMs - Pause between probes (default 200 ms).
 * @returns The first non-`null` value produced by `read`.
 * @throws If the budget elapses before a value appears.
 */
async function waitForValue<T>(
  read: () => T | null,
  timeoutMs: number,
  intervalMs = 200,
): Promise<T> {
  const begin = Date.now();
  const withinBudget = (): boolean => Date.now() - begin < timeoutMs;

  while (withinBudget()) {
    const candidate = read();
    if (candidate === null) {
      await sleep(intervalMs);
      continue;
    }
    return candidate;
  }
  throw new Error(`Timed out after ${timeoutMs}ms`);
}

/**
 * Polls every 200 ms until a PID reaches the requested liveness state.
 *
 * @param pid - Process ID to watch.
 * @param shouldBeAlive - `true` to wait for the process to exist, `false` to wait for it to be gone.
 * @param timeoutMs - Polling budget in milliseconds.
 * @throws If the state is not reached in time; the message includes the
 *   process's command line when it is still listed by `ps`.
 */
async function waitForPidState(
  pid: number,
  shouldBeAlive: boolean,
  timeoutMs: number,
): Promise<void> {
  const begin = Date.now();
  while (Date.now() - begin < timeoutMs) {
    const alive = isPidAlive(pid);
    if (alive === shouldBeAlive) return;
    await sleep(200);
  }

  // Timed out: look the process up once more to enrich the error message.
  const match = listProcesses().find(
    ({ pid: candidatePid }) => candidatePid === pid,
  );
  const details = match === undefined ? "" : ` args=${match.args}`;
  throw new Error(
    `PID ${pid} did not become ${shouldBeAlive ? "alive" : "dead"} within ${timeoutMs}ms${details}`,
  );
}

/**
 * Polls `GET {baseUrl}/healthz` every 500 ms until it answers with an OK status.
 *
 * @param baseUrl - Origin of the server to probe.
 * @param timeoutMs - Polling budget in milliseconds (default 30 s).
 * @throws If no OK response is seen within the budget. Failed requests and
 *   non-OK responses are simply retried.
 */
async function waitForServerReady(baseUrl: string, timeoutMs = 30_000) {
  const healthUrl = `${baseUrl}/healthz`;
  const isHealthy = async (): Promise<boolean> => {
    try {
      return (await fetch(healthUrl)).ok;
    } catch {
      // Connection refused etc.: the server is not up yet.
      return false;
    }
  };

  const begin = Date.now();
  while (Date.now() - begin < timeoutMs) {
    if (await isHealthy()) return;
    await sleep(500);
  }
  throw new Error(
    `Server did not become ready at ${baseUrl} within ${timeoutMs}ms`,
  );
}

/**
 * Waits for a child process to exit, up to a time limit.
 *
 * A child that was terminated by a signal keeps `exitCode === null` and
 * reports `signalCode` instead, so both fields are checked; otherwise an
 * already-dead, signal-killed process would be waited on for the full timeout
 * (its "exit" event has already fired and will not fire again).
 *
 * @param proc - Child process to watch.
 * @param timeoutMs - Maximum time to wait in milliseconds.
 * @returns `true` if the process has exited (before or during the wait),
 *   `false` if the timeout elapsed first.
 */
async function waitForProcessExit(
  proc: ChildProcessWithoutNullStreams,
  timeoutMs: number,
): Promise<boolean> {
  if (proc.exitCode !== null || proc.signalCode !== null) {
    return true;
  }
  return await new Promise<boolean>((resolve) => {
    const onExit = (): void => {
      clearTimeout(timer);
      resolve(true);
    };
    const timer = setTimeout(() => {
      // Do not leave a stale listener behind when giving up.
      proc.off("exit", onExit);
      resolve(false);
    }, timeoutMs);
    proc.once("exit", onExit);
  });
}

/**
 * Spawns the SEA server binary on a free local port and waits until its
 * health endpoint responds.
 *
 * The child runs with `NODE_ENV=production`, the chosen `PORT`, and a
 * `STAGEHAND_SEA_CACHE_DIR` (inherited from the environment or defaulting to
 * `<repoRoot>/.stagehand-sea`); these three always win over `envOverrides`.
 * The handle is registered in `activeSea`.
 *
 * @param envOverrides - Extra environment variables layered over `process.env`.
 * @returns Handle with the child process, its base URL and its captured output.
 * @throws If the child has no PID, or if the server never becomes ready (the
 *   server is stopped first and the last 30 log entries are appended to the message).
 */
async function startSeaServer(
  envOverrides: Record<string, string> = {},
): Promise<SeaHandle> {
  const port = await getFreePort();
  const baseUrl = `http://127.0.0.1:${port}`;
  const logs: string[] = [];

  // Shared sink for stdout and stderr: keep non-empty, trimmed chunks.
  const record = (chunk: Buffer): void => {
    const text = chunk.toString().trim();
    if (text) logs.push(text);
  };

  const env = {
    ...process.env,
    ...envOverrides,
    NODE_ENV: "production",
    PORT: String(port),
    STAGEHAND_SEA_CACHE_DIR:
      process.env.STAGEHAND_SEA_CACHE_DIR ?? `${repoRoot}/.stagehand-sea`,
  };
  const proc = spawn(
    seaBinaryPath,
    ["--node-options=--no-lazy --enable-source-maps"],
    {
      env,
      stdio: ["ignore", "pipe", "pipe"],
    },
  );
  proc.stdout.on("data", record);
  proc.stderr.on("data", record);

  if (!proc.pid) {
    throw new Error("SEA process did not provide a PID");
  }

  const handle: SeaHandle = { proc, baseUrl, logs };
  activeSea.add(handle);

  try {
    await waitForServerReady(baseUrl);
  } catch (error) {
    await stopSeaServer(handle);
    const reason = (error as Error).message;
    const tail = logs.slice(-30).join("\n");
    throw new Error(
      `Failed to start SEA server at ${baseUrl}: ${reason}\n${tail}`,
      {
        cause: error,
      },
    );
  }
  return handle;
}

/**
 * Stops a SEA server gracefully: SIGTERM first, then SIGKILL if the process
 * has not exited after 5 s (followed by another wait of up to 5 s).
 *
 * Returns immediately when the process is already gone. Both `exitCode` and
 * `signalCode` are consulted because a signal-killed child keeps
 * `exitCode === null`; checking `exitCode` alone would re-signal a dead
 * process and then wait out both timeouts.
 *
 * @param handle - Handle of the server to stop.
 */
async function stopSeaServer(handle: SeaHandle): Promise<void> {
  const { proc } = handle;
  if (proc.exitCode !== null || proc.signalCode !== null) return;
  try {
    proc.kill("SIGTERM");
  } catch {
    // ignore: best-effort signal delivery
  }
  const exited = await waitForProcessExit(proc, 5_000);
  if (!exited) {
    try {
      proc.kill("SIGKILL");
    } catch {
      // ignore: best-effort signal delivery
    }
    await waitForProcessExit(proc, 5_000);
  }
}

/**
 * Kills a SEA server abruptly with SIGKILL and waits up to 5 s for it to exit.
 *
 * Returns immediately when the process is already gone. Both `exitCode` and
 * `signalCode` are consulted because a signal-killed child keeps
 * `exitCode === null`.
 *
 * @param handle - Handle of the server to kill.
 */
async function forceKillSeaServer(handle: SeaHandle): Promise<void> {
  const { proc } = handle;
  if (proc.exitCode !== null || proc.signalCode !== null) return;
  try {
    proc.kill("SIGKILL");
  } catch {
    // ignore: best-effort signal delivery
  }
  await waitForProcessExit(proc, 5_000);
}

/**
 * Starts a local-browser session with `keepAlive: false` on the given server
 * and asserts that the start succeeded.
 *
 * @param baseUrl - Origin of the server to call.
 * @returns The new session's ID and CDP URL.
 */
async function startKeepAliveFalseLocalSession(baseUrl: string): Promise<{
  sessionId: string;
  cdpUrl: string;
}> {
  const requestHeaders = getHeaders("3.0.0");
  const payload = {
    modelName: "gpt-4.1-nano",
    keepAlive: false,
    ...LOCAL_BROWSER_BODY,
  };
  const res = await fetchWithContext<StartResponse>(
    `${baseUrl}/v1/sessions/start`,
    {
      method: "POST",
      headers: requestHeaders,
      body: JSON.stringify(payload),
    },
  );

  assert.equal(
    res.status,
    HTTP_OK,
    `Expected local /start to succeed, got ${res.status}\n${res.debugSummary()}`,
  );
  assertFetchOk(res.body !== null, "Should have response body", res);
  assertFetchOk(
    isSuccessResponse(res.body),
    "Should return a successful start response",
    res,
  );

  const { sessionId, cdpUrl } = res.body.data;
  return { sessionId, cdpUrl };
}

/**
 * Starts a Browserbase session with `keepAlive: false` on the given server,
 * then issues one navigation so the session is actually initialised.
 *
 * Requires `BROWSERBASE_API_KEY` and `BROWSERBASE_PROJECT_ID`; both are
 * asserted before any request is made.
 *
 * @param baseUrl - Origin of the server to call.
 * @returns The ID of the started session.
 */
async function startKeepAliveFalseBrowserbaseSession(
  baseUrl: string,
): Promise<string> {
  assert.ok(bbApiKey, "BROWSERBASE_API_KEY must be set");
  assert.ok(bbProjectId, "BROWSERBASE_PROJECT_ID must be set");

  const bbHeaders = {
    ...getHeaders("3.0.0"),
    "x-bb-api-key": bbApiKey,
    "x-bb-project-id": bbProjectId,
  };
  const startPayload = {
    modelName: "gpt-4.1-nano",
    keepAlive: false,
    experimental: true,
    browser: { type: "browserbase" },
  };
  const startRes = await fetchWithContext<StartResponse>(
    `${baseUrl}/v1/sessions/start`,
    {
      method: "POST",
      headers: bbHeaders,
      body: JSON.stringify(startPayload),
    },
  );

  assert.equal(
    startRes.status,
    HTTP_OK,
    `Expected browserbase /start to succeed, got ${startRes.status}\n${startRes.debugSummary()}`,
  );
  assertFetchOk(startRes.body !== null, "Should have response body", startRes);
  assertFetchOk(
    isSuccessResponse(startRes.body),
    "Should return a successful start response",
    startRes,
  );
  const { sessionId } = startRes.body.data;

  // Browserbase Stagehand init is lazy, so one navigation is needed before
  // the supervisor can be expected to be running.
  const navigateRes = await fetchWithContext<{ success?: boolean }>(
    `${baseUrl}/v1/sessions/${sessionId}/navigate`,
    {
      method: "POST",
      headers: bbHeaders,
      body: JSON.stringify({ url: "https://example.com", frameId: "" }),
    },
  );
  assert.equal(
    navigateRes.status,
    HTTP_OK,
    `Expected browserbase /navigate to succeed, got ${navigateRes.status}\n${navigateRes.debugSummary()}`,
  );

  return sessionId;
}

/**
 * Connects to a browser over CDP and asks it to shut down by sending
 * `Browser.close` through a CDP session on its first page (a page is created
 * when the first context has none). Does nothing when the browser exposes no
 * context. The Playwright connection is always closed afterwards, ignoring
 * any error from that close.
 *
 * @param cdpUrl - CDP endpoint of the browser to close.
 */
async function closeLocalBrowserViaCdp(cdpUrl: string): Promise<void> {
  const browser = await chromium.connectOverCDP(cdpUrl);
  try {
    const [context] = browser.contexts();
    if (context) {
      const [firstPage] = context.pages();
      const page = firstPage ?? (await context.newPage());
      const session = await context.newCDPSession(page);
      await session.send("Browser.close");
    }
  } finally {
    try {
      await browser.close();
    } catch {
      // best-effort close of Playwright transport
    }
  }
}

/**
 * Polls the Browserbase API once per second until the session's status is
 * anything other than "RUNNING".
 *
 * @param sessionId - Browserbase session to watch.
 * @param timeoutMs - Polling budget in milliseconds.
 * @returns The first non-"RUNNING" status seen ("UNKNOWN" when the snapshot
 *   has no status), or "RETRIEVE_FAILED" as soon as a retrieval throws.
 * @throws If the session is still "RUNNING" when the budget elapses.
 */
async function waitForBrowserbaseNotRunning(
  sessionId: string,
  timeoutMs: number,
): Promise<string> {
  assert.ok(bbApiKey, "BROWSERBASE_API_KEY must be set");
  const client = new Browserbase({ apiKey: bbApiKey });

  const begin = Date.now();
  let lastStatus = "UNKNOWN";
  while (Date.now() - begin < timeoutMs) {
    let status: string;
    try {
      const snapshot = (await client.sessions.retrieve(sessionId)) as {
        status?: string;
      };
      status = snapshot.status ?? "UNKNOWN";
    } catch {
      return "RETRIEVE_FAILED";
    }

    lastStatus = status;
    if (status !== "RUNNING") {
      return status;
    }
    await sleep(1000);
  }
  throw new Error(
    `Browserbase session ${sessionId} stayed RUNNING for ${timeoutMs}ms (last status=${lastStatus})`,
  );
}

/**
 * Cleanup helper: asks Browserbase to release a session by updating its
 * status to "REQUEST_RELEASE". Does nothing when either credential is
 * missing, and swallows any error from the update call.
 *
 * @param sessionId - Browserbase session to release.
 */
async function requestBrowserbaseReleaseBestEffort(sessionId: string) {
  const apiKey = bbApiKey;
  const projectId = bbProjectId;
  if (!apiKey || !projectId) return;

  const client = new Browserbase({ apiKey });
  try {
    await client.sessions.update(sessionId, {
      status: "REQUEST_RELEASE",
      projectId,
    });
  } catch {
    // best-effort cleanup
  }
}

// =============================================================================
// V3 Format Tests (x-sdk-version: 3.x.x header)
// =============================================================================

describe("POST /v1/sessions/start - V3 format", () => {
  const headers = getHeaders("3.0.0");
  const localBrowser = LOCAL_BROWSER_BODY;

  it("should start session with modelName string and V3 header", async () => {
    // Minimal V3 start request: a model name plus the local-browser body.
    const baseUrl = getBaseUrl();
    const payload = { modelName: "gpt-4.1-nano", ...localBrowser };

    const res = await fetchWithContext<StartResponse>(
      `${baseUrl}/v1/sessions/start`,
      { method: "POST", headers, body: JSON.stringify(payload) },
    );

    assertFetchStatus(res, HTTP_OK, "Request should succeed");
    assertFetchOk(res.body !== null, "Should have response body", res);
    assertFetchOk(
      isSuccessResponse(res.body),
      "Should be a success response",
      res,
    );

    const session = res.body.data;
    assertFetchOk(session.available, "Session should be available", res);
    assertFetchOk(!!session.sessionId, "Should have sessionId", res);
    assertFetchOk(!!session.cdpUrl, "Should have cdpUrl", res);

    // Release the session started for this test.
    await endSession(session.sessionId, headers);
  });

  it("should start session with experimental flag", async () => {
    // Same as the basic start request, with the experimental flag switched on.
    const baseUrl = getBaseUrl();
    const payload = {
      modelName: "gpt-4.1-nano",
      experimental: true,
      ...localBrowser,
    };

    const res = await fetchWithContext<StartResponse>(
      `${baseUrl}/v1/sessions/start`,
      { method: "POST", headers, body: JSON.stringify(payload) },
    );

    assertFetchStatus(res, HTTP_OK, "Request should succeed");
    assertFetchOk(res.body !== null, "Should have response body", res);
    assertFetchOk(
      isSuccessResponse(res.body),
      "Should be a success response",
      res,
    );

    // Release the session started for this test.
    const { sessionId } = res.body.data;
    await endSession(sessionId, headers);
  });

  it("should accept x-language header for python V3", async () => {
    // Headers built for SDK version 1.0.0 with the "python" language argument.
    const baseUrl = getBaseUrl();
    const pythonHeaders = getHeaders("1.0.0", "python");
    const payload = { modelName: "gpt-4.1-nano", ...localBrowser };

    const res = await fetchWithContext<StartResponse>(
      `${baseUrl}/v1/sessions/start`,
      { method: "POST", headers: pythonHeaders, body: JSON.stringify(payload) },
    );

    assertFetchStatus(res, HTTP_OK, "Request should succeed");
    assertFetchOk(res.body !== null, "Should have response body", res);
    assertFetchOk(
      isSuccessResponse(res.body),
      "Should be a success response",
      res,
    );

    // End the session with the same headers it was started with.
    const { sessionId } = res.body.data;
    await endSession(sessionId, pythonHeaders);
  });

  it("should start session with extended options (timeouts, verbose)", async () => {
    // Start request carrying the optional timeout and verbosity settings.
    const baseUrl = getBaseUrl();
    const payload = {
      modelName: "gpt-4.1-nano",
      actTimeoutMs: 30000,
      domSettleTimeoutMs: 5000,
      verbose: "2",
      ...localBrowser,
    };

    const res = await fetchWithContext<StartResponse>(
      `${baseUrl}/v1/sessions/start`,
      { method: "POST", headers, body: JSON.stringify(payload) },
    );

    assertFetchStatus(res, HTTP_OK, "Request should succeed");
    assertFetchOk(res.body !== null, "Should have response body", res);
    assertFetchOk(
      isSuccessResponse(res.body),
      "Should be a success response",
      res,
    );

    const session = res.body.data;
    assertFetchOk(session.available, "Session should be available", res);
    assertFetchOk(!!session.sessionId, "Should have sessionId", res);

    // Release the session started for this test.
    await endSession(session.sessionId, headers);
  });

  it("should return cdpUrl as a valid WebSocket URL for local browser", async () => {
    const baseUrl = getBaseUrl();
    const payload = { modelName: "gpt-4.1-nano", ...localBrowser };

    const res = await fetchWithContext<StartResponse>(
      `${baseUrl}/v1/sessions/start`,
      { method: "POST", headers, body: JSON.stringify(payload) },
    );

    assertFetchStatus(res, HTTP_OK, "Request should succeed");
    assertFetchOk(res.body !== null, "Should have response body", res);
    assertFetchOk(
      isSuccessResponse(res.body),
      "Should be a success response",
      res,
    );

    const { cdpUrl, sessionId } = res.body.data;
    // The browser is launched eagerly, so a CDP URL must already be present...
    assertFetchOk(cdpUrl !== "", "cdpUrl should not be empty", res);
    // ...and it must use the WebSocket scheme.
    assertFetchOk(
      cdpUrl.startsWith("ws://"),
      "cdpUrl should be a WebSocket URL",
      res,
    );

    // Release the session started for this test.
    await endSession(sessionId, headers);
  });

  it("should return provided cdpUrl when explicit cdpUrl is passed", async () => {
    // A caller-supplied CDP URL should be echoed back unchanged.
    const providedCdpUrl = "ws://localhost:9222/devtools/browser/test";
    const baseUrl = getBaseUrl();
    const payload = {
      modelName: "gpt-4.1-nano",
      browser: { type: "local", cdpUrl: providedCdpUrl },
    };

    const res = await fetchWithContext<StartResponse>(
      `${baseUrl}/v1/sessions/start`,
      { method: "POST", headers, body: JSON.stringify(payload) },
    );

    assertFetchStatus(res, HTTP_OK, "Request should succeed");
    assertFetchOk(res.body !== null, "Should have response body", res);
    assertFetchOk(
      isSuccessResponse(res.body),
      "Should be a success response",
      res,
    );

    const { cdpUrl, sessionId } = res.body.data;
    assertFetchOk(
      cdpUrl === providedCdpUrl,
      "cdpUrl should match provided value",
      res,
    );

    // Release the session started for this test.
    await endSession(sessionId, headers);
  });

  it("should return error for browserbase requests without API key", async () => {
    // Browserbase sessions require an x-bb-api-key header; this request is
    // sent with the plain V3 headers only and is expected to be rejected.
    const baseUrl = getBaseUrl();
    const payload = {
      modelName: "gpt-4.1-nano",
      browser: { type: "browserbase" },
    };

    const res = await fetchWithContext<StartResponse>(
      `${baseUrl}/v1/sessions/start`,
      { method: "POST", headers, body: JSON.stringify(payload) },
    );

    assertFetchStatus(res, HTTP_BAD_REQUEST, "Request should fail with 400");
  });

  it(
    "should start browserbase session with API key but no project ID",
    // Without credentials this case cannot run; report it as skipped instead
    // of letting an early return count as a pass.
    { skip: bbApiKey ? false : "BROWSERBASE_API_KEY is not set" },
    async () => {
      // Also narrows bbApiKey to a string for the header object below.
      assert.ok(bbApiKey, "BROWSERBASE_API_KEY must be set");

      const url = getBaseUrl();
      const bbHeaders = {
        ...getHeaders("3.0.0"),
        "x-bb-api-key": bbApiKey,
        // intentionally omitting x-bb-project-id
      };

      const ctx = await fetchWithContext<StartResponse>(
        `${url}/v1/sessions/start`,
        {
          method: "POST",
          headers: bbHeaders,
          body: JSON.stringify({
            modelName: "gpt-4.1-nano",
            browser: { type: "browserbase" },
          }),
        },
      );

      assertFetchStatus(
        ctx,
        HTTP_OK,
        "Request should succeed without project ID",
      );
      assertFetchOk(ctx.body !== null, "Should have response body", ctx);
      assertFetchOk(
        isSuccessResponse(ctx.body),
        "Should return a successful start response",
        ctx,
      );

      // Release the Browserbase session started for this test.
      await endSession(ctx.body.data.sessionId, bbHeaders);
    },
  );

  // =============================================================================
  // Multi-Region Support Tests
  // =============================================================================

  it("should accept non-default region in browserbaseSessionCreateParams", async () => {
    // Local browser sessions do not actually use the region, but the server
    // must still accept the parameter instead of answering
    // { available: false }. This case uses us-east-1.
    const baseUrl = getBaseUrl();
    const payload = {
      modelName: "gpt-4.1-nano",
      browserbaseSessionCreateParams: {
        region: "us-east-1" as BrowserbaseRegion,
      },
      ...localBrowser,
    };

    const res = await fetchWithContext<StartResponse>(
      `${baseUrl}/v1/sessions/start`,
      { method: "POST", headers, body: JSON.stringify(payload) },
    );

    assertFetchStatus(res, HTTP_OK, "Request should succeed");
    assertFetchOk(res.body !== null, "Should have response body", res);
    assertFetchOk(
      isSuccessResponse(res.body),
      "Should be a success response",
      res,
    );

    const session = res.body.data;
    // Key assertion: a non-default region must not make the session unavailable.
    assertFetchOk(
      session.available === true,
      "Session should be available for non-default regions",
      res,
    );
    assertFetchOk(!!session.sessionId, "Should have sessionId", res);

    // Release the session started for this test.
    await endSession(session.sessionId, headers);
  });

  it("should accept eu-central-1 region in browserbaseSessionCreateParams", async () => {
    // Same check as the other region cases, for eu-central-1.
    const baseUrl = getBaseUrl();
    const payload = {
      modelName: "gpt-4.1-nano",
      browserbaseSessionCreateParams: {
        region: "eu-central-1" as BrowserbaseRegion,
      },
      ...localBrowser,
    };

    const res = await fetchWithContext<StartResponse>(
      `${baseUrl}/v1/sessions/start`,
      { method: "POST", headers, body: JSON.stringify(payload) },
    );

    assertFetchStatus(res, HTTP_OK, "Request should succeed");
    assertFetchOk(res.body !== null, "Should have response body", res);
    assertFetchOk(
      isSuccessResponse(res.body),
      "Should be a success response",
      res,
    );

    const session = res.body.data;
    assertFetchOk(
      session.available === true,
      "Session should be available for eu-central-1 region",
      res,
    );
    assertFetchOk(!!session.sessionId, "Should have sessionId", res);

    // Release the session started for this test.
    await endSession(session.sessionId, headers);
  });

  it("should accept ap-southeast-1 region in browserbaseSessionCreateParams", async () => {
    // Same check as the other region cases, for ap-southeast-1.
    const baseUrl = getBaseUrl();
    const payload = {
      modelName: "gpt-4.1-nano",
      browserbaseSessionCreateParams: {
        region: "ap-southeast-1" as BrowserbaseRegion,
      },
      ...localBrowser,
    };

    const res = await fetchWithContext<StartResponse>(
      `${baseUrl}/v1/sessions/start`,
      { method: "POST", headers, body: JSON.stringify(payload) },
    );

    assertFetchStatus(res, HTTP_OK, "Request should succeed");
    assertFetchOk(res.body !== null, "Should have response body", res);
    assertFetchOk(
      isSuccessResponse(res.body),
      "Should be a success response",
      res,
    );

    const session = res.body.data;
    assertFetchOk(
      session.available === true,
      "Session should be available for ap-southeast-1 region",
      res,
    );
    assertFetchOk(!!session.sessionId, "Should have sessionId", res);

    // Release the session started for this test.
    await endSession(session.sessionId, headers);
  });
});

describe("POST /v1/sessions/start - keepAlive=false supervision in SEA", () => {
  it("spawns a supervisor and exits it when chrome dies", async () => {
    const sea = await startSeaServer();
    const seaPid = sea.proc.pid;
    assert.ok(seaPid, "SEA server must have a PID");

    // Starting a keepAlive=false local session should bring up a supervisor
    // whose config names the SEA process as its parent.
    const session = await startKeepAliveFalseLocalSession(sea.baseUrl);
    const supervisor = await waitForValue(
      () => findLocalSupervisorByParentPid(seaPid),
      10_000,
    );
    const { pid: supervisorPid, chromePid, args: supervisorArgs } = supervisor;

    assert.ok(
      chromePid,
      `Expected local supervisor to include --chrome-pid. args=${supervisorArgs}`,
    );
    assert.ok(
      isPidAlive(supervisorPid),
      `Supervisor PID ${supervisorPid} should be alive`,
    );
    assert.ok(isPidAlive(chromePid), `Chrome PID ${chromePid} should be alive`);

    // Close the browser from the outside, then expect chrome and the
    // supervisor to disappear while the SEA server keeps running.
    await closeLocalBrowserViaCdp(session.cdpUrl);

    await waitForPidState(chromePid, false, 10_000);
    await waitForPidState(supervisorPid, false, 10_000);
    assert.ok(
      isPidAlive(seaPid),
      "SEA process should stay alive after chrome dies",
    );
  });

  it("force-killing SEA kills local chrome and exits supervisor within 10s", async () => {
    const sea = await startSeaServer();
    const seaPid = sea.proc.pid;
    assert.ok(seaPid, "SEA server must have a PID");

    await startKeepAliveFalseLocalSession(sea.baseUrl);
    const supervisor = await waitForValue(
      () => findLocalSupervisorByParentPid(seaPid),
      10_000,
    );
    const { pid: supervisorPid, chromePid, args: supervisorArgs } = supervisor;

    assert.ok(
      chromePid,
      `Expected local supervisor to include --chrome-pid. args=${supervisorArgs}`,
    );
    assert.ok(
      isPidAlive(supervisorPid),
      `Supervisor PID ${supervisorPid} should be alive`,
    );
    assert.ok(isPidAlive(chromePid), `Chrome PID ${chromePid} should be alive`);

    // Kill the server abruptly; the supervisor and chrome must both go away
    // on their own.
    await forceKillSeaServer(sea);

    await waitForPidState(supervisorPid, false, 10_000);
    await waitForPidState(chromePid, false, 10_000);
  });

  it("force-killing SEA ends Browserbase session when keepAlive=false", async () => {
    const sea = await startSeaServer({ BB_ENV: "prod" });
    const sessionId = await startKeepAliveFalseBrowserbaseSession(sea.baseUrl);

    try {
      // Kill the server abruptly and wait for Browserbase to report the
      // session as no longer running.
      await forceKillSeaServer(sea);
      const statusAfterKill = await waitForBrowserbaseNotRunning(
        sessionId,
        30_000,
      );
      assert.notEqual(
        statusAfterKill,
        "RUNNING",
        "Browserbase session should not remain RUNNING after SEA kill",
      );
    } finally {
      // Whatever happened above, ask Browserbase to release the session.
      await requestBrowserbaseReleaseBestEffort(sessionId);
    }
  });
});


================================================
FILE: packages/server-v3/tsconfig.json
================================================
{
  "extends": "../../tsconfig.base.json",
  "compilerOptions": {
    "outDir": "dist",
    "rootDir": "src",
    "module": "ESNext",
    "moduleResolution": "bundler",
    "verbatimModuleSyntax": false
  },
  "include": ["src/**/*"],
  "exclude": ["node_modules", "dist"]
}


================================================
FILE: packages/server-v3/tsconfig.tests.json
================================================
{
  "extends": "../../tsconfig.base.json",
  "compilerOptions": {
    "rootDir": "test",
    "outDir": "dist/tests",
    "declaration": false,
    "noEmit": false
  },
  "include": ["test/**/*.ts"],
  "exclude": ["node_modules", "dist"]
}


================================================
FILE: packages/server-v3/vitest.config.ts
================================================
import { defineConfig } from "vitest/config";

// Vitest configuration for this package's test suite.
export default defineConfig({
  test: {
    // Expose Vitest's test APIs (describe/it/expect) as globals so test files
    // do not need to import them explicitly.
    globals: true,
    // Run tests in a plain Node.js environment (no DOM emulation).
    environment: "node",
    // Only files matching this glob are collected as test files.
    include: ["test/**/*.test.ts"],
  },
});


================================================
FILE: packages/server-v4/CHANGELOG.md
================================================
# @browserbasehq/stagehand-server-v4

## 3.6.1

### Patch Changes

- Updated dependencies [[`505e8c6`](https://github.com/browserbase/stagehand/commit/505e8c6736f3706328dbc8df670c49a018058388), [`2f43ffa`](https://github.com/browserbase/stagehand/commit/2f43ffac11778152d17e4c44405770cc32c3ec8c), [`63ee247`](https://github.com/browserbase/stagehand/commit/63ee247ac6bf2992046d4f6b2759f46b15643e36), [`7dc35f5`](https://github.com/browserbase/stagehand/commit/7dc35f5e25689e6518d68b25ef71536d2781c8aa), [`335cf47`](https://github.com/browserbase/stagehand/commit/335cf4730e73bce33e92331d04bda4b0fd42685d), [`6ba0a1d`](https://github.com/browserbase/stagehand/commit/6ba0a1db7fc2d5d5a2f8927b1417d8f1d15eda10), [`4ff3bb8`](https://github.com/browserbase/stagehand/commit/4ff3bb831a6ef6e2d57148e7afb68ea8d23e395d), [`c27054b`](https://github.com/browserbase/stagehand/commit/c27054bbd0508431ade91d655f89efc87bbf5867), [`2abf5b9`](https://github.com/browserbase/stagehand/commit/2abf5b90f1e2bb1442509ef3a686b6128c9cdcf6), [`7817fcc`](https://github.com/browserbase/stagehand/commit/7817fcc315eee4455ce04567cf56c9ec801caf0b), [`7390508`](https://github.com/browserbase/stagehand/commit/73905088c5ed5923d276da9cce2efd0a0a3a46eb), [`611f43a`](https://github.com/browserbase/stagehand/commit/611f43ac8d4c580216d55d2b217c14a9a9c11013), [`521a10e`](https://github.com/browserbase/stagehand/commit/521a10e3698fc5631e219947bc90dad0f8bddaa8), [`2402a3c`](https://github.com/browserbase/stagehand/commit/2402a3c4d50270391b3e6440f4385cdcf5e1eb64)]:
  - @browserbasehq/stagehand@3.2.0


================================================
FILE: packages/server-v4/README.md
================================================
# Stagehand API

The Stagehand API is a powerful service that provides a RESTful interface for browser automation and session management using the Browserbase platform. It enables recording, playback, and manipulation of browser sessions with a focus on reliability and performance.

## 📋 Prerequisites

To run the Stagehand API locally, ensure you have the following installed:

- Node.js
- pnpm

## 🛠 Installation

1. Clone the repository:

```bash
git clone https://github.com/browserbase/stagehand/
cd stagehand/packages/server-v4
```

2. Install dependencies:

```bash
pnpm install
```

3. Set up environment variables:

```bash
cp .env.example .env
```

4. Configure your `.env` file with the environment variables required by `src/lib/env.ts` (BB environment, API base URLs, etc.).

5. Start the development server:

```bash
pnpm dev
```


================================================
FILE: packages/server-v4/openapi.v4.yaml
================================================
openapi: "3.1.0"
info:
  title: Stagehand API v4
  version: "4.0.0"
  description: >-
    Stagehand SDK for AI browser automation [ALPHA]. This API allows clients to

    execute browser automation tasks remotely on the Browserbase cloud.

    Create a browser session with /browsersession, then use that id with page
    routes.

    Responses are streamed using Server-Sent Events (SSE) when the

    `x-stream-response: true` header is provided.


    This SDK is currently ALPHA software and is not production ready!

    Please try it and give us your feedback, stay tuned for upcoming release
    announcements!
  contact:
    name: Browserbase
    url: https://browserbase.com
components:
  securitySchemes:
    BrowserbaseApiKey:
      type: apiKey
      in: header
      name: x-bb-api-key
      description: Browserbase API key for authentication
    BrowserbaseProjectId:
      type: apiKey
      in: header
      name: x-bb-project-id
      description: Browserbase project ID
    ModelApiKey:
      type: apiKey
      in: header
      name: x-model-api-key
      description: API key for the AI model provider (OpenAI, Anthropic, etc.)
  links:
    SessionAct:
      operationId: SessionAct
      parameters:
        id: $response.body#/data/sessionId
      description: Perform an action on the session
    SessionExtract:
      operationId: SessionExtract
      parameters:
        id: $response.body#/data/sessionId
      description: Extract data from the session
    SessionObserve:
      operationId: SessionObserve
      parameters:
        id: $response.body#/data/sessionId
      description: Observe available actions on the session
    SessionNavigate:
      operationId: SessionNavigate
      parameters:
        id: $response.body#/data/sessionId
      description: Navigate to a URL in the session
    SessionAgentExecute:
      operationId: SessionAgentExecute
      parameters:
        id: $response.body#/data/sessionId
      description: Execute an agent on the session
    SessionReplay:
      operationId: SessionReplay
      parameters:
        id: $response.body#/data/sessionId
      description: Replay session metrics
    SessionEnd:
      operationId: SessionEnd
      parameters:
        id: $response.body#/data/sessionId
      description: End the session and release resources
  schemas:
    BrowserSessionLocalCreateRequest:
      type: object
      properties:
        modelName:
          description: Model name to use for AI operations
          example: openai/gpt-4.1-nano
          type: string
        domSettleTimeoutMs:
          type: number
        verbose:
          anyOf:
            - type: number
              const: 0
            - type: number
              const: 1
            - type: number
              const: 2
        systemPrompt:
          type: string
        selfHeal:
          type: boolean
        waitForCaptchaSolves:
          type: boolean
        experimental:
          type: boolean
        actTimeoutMs:
          type: number
        env:
          type: string
          const: LOCAL
        cdpUrl:
          type: string
        localBrowserLaunchOptions:
          $ref: "#/components/schemas/LocalBrowserLaunchOptions"
      required:
        - modelName
        - env
      additionalProperties: false
    BrowserSessionBrowserbaseCreateRequest:
      type: object
      properties:
        modelName:
          description: Model name to use for AI operations
          example: openai/gpt-4.1-nano
          type: string
        domSettleTimeoutMs:
          type: number
        verbose:
          anyOf:
            - type: number
              const: 0
            - type: number
              const: 1
            - type: number
              const: 2
        systemPrompt:
          type: string
        selfHeal:
          type: boolean
        waitForCaptchaSolves:
          type: boolean
        experimental:
          type: boolean
        actTimeoutMs:
          type: number
        env:
          type: string
          const: BROWSERBASE
        browserbaseSessionId:
          type: string
        browserbaseSessionCreateParams:
          $ref: "#/components/schemas/BrowserbaseSessionCreateParams"
      required:
        - modelName
        - env
      additionalProperties: false
    BrowserbaseBrowserSettings:
      type: object
      properties:
        advancedStealth:
          type: boolean
        blockAds:
          type: boolean
        context:
          $ref: "#/components/schemas/BrowserbaseContext"
        extensionId:
          type: string
        fingerprint:
          $ref: "#/components/schemas/BrowserbaseFingerprint"
        logSession:
          type: boolean
        recordSession:
          type: boolean
        solveCaptchas:
          type: boolean
        viewport:
          $ref: "#/components/schemas/BrowserbaseViewport"
    BrowserbaseContext:
      type: object
      properties:
        id:
          type: string
        persist:
          type: boolean
      required:
        - id
    BrowserbaseFingerprint:
      type: object
      properties:
        browsers:
          type: array
          items:
            type: string
            enum:
              - chrome
              - edge
              - firefox
              - safari
        devices:
          type: array
          items:
            type: string
            enum:
              - desktop
              - mobile
        httpVersion:
          type: string
          enum:
            - "1"
            - "2"
        locales:
          type: array
          items:
            type: string
        operatingSystems:
          type: array
          items:
            type: string
            enum:
              - android
              - ios
              - linux
              - macos
              - windows
        screen:
          $ref: "#/components/schemas/BrowserbaseFingerprintScreen"
    BrowserbaseFingerprintScreen:
      type: object
      properties:
        maxHeight:
          type: number
        maxWidth:
          type: number
        minHeight:
          type: number
        minWidth:
          type: number
    BrowserbaseViewport:
      type: object
      properties:
        width:
          type: number
        height:
          type: number
    ProxyConfig:
      oneOf:
        - $ref: "#/components/schemas/BrowserbaseProxyConfig"
        - $ref: "#/components/schemas/ExternalProxyConfig"
      type: object
      discriminator:
        propertyName: type
        mapping:
          browserbase: "#/components/schemas/BrowserbaseProxyConfig"
          external: "#/components/schemas/ExternalProxyConfig"
    BrowserbaseProxyConfig:
      type: object
      properties:
        type:
          type: string
          const: browserbase
        domainPattern:
          type: string
        geolocation:
          $ref: "#/components/schemas/BrowserbaseProxyGeolocation"
      required:
        - type
    BrowserbaseProxyGeolocation:
      type: object
      properties:
        country:
          type: string
        city:
          type: string
        state:
          type: string
      required:
        - country
    ExternalProxyConfig:
      type: object
      properties:
        type:
          type: string
          const: external
        server:
          type: string
        domainPattern:
          type: string
        username:
          type: string
        password:
          type: string
      required:
        - type
        - server
    BrowserbaseRegion:
      type: string
      enum:
        - us-west-2
        - us-east-1
        - eu-central-1
        - ap-southeast-1
    SessionHeaders:
      type: object
      properties:
        x-stream-response:
          description: Whether to stream the response via SSE
          example: "true"
          type: string
          enum:
            - "true"
            - "false"
    BrowserSessionAddInitScriptResult:
      type: object
      properties:
        added:
          type: boolean
      required:
        - added
      additionalProperties: false
    BrowserSessionSetExtraHTTPHeadersResult:
      type: object
      properties:
        headers:
          $ref: "#/components/schemas/PageHeaders"
      required:
        - headers
      additionalProperties: false
    BrowserSessionPagesResult:
      type: object
      properties:
        pages:
          type: array
          items:
            $ref: "#/components/schemas/BrowserSessionPage"
      required:
        - pages
      additionalProperties: false
    BrowserSessionOptionalPageResult:
      type: object
      properties:
        page:
          anyOf:
            - $ref: "#/components/schemas/BrowserSessionPage"
            - type: "null"
      required:
        - page
      additionalProperties: false
    BrowserSessionPageResult:
      type: object
      properties:
        page:
          $ref: "#/components/schemas/BrowserSessionPage"
      required:
        - page
      additionalProperties: false
    BrowserSessionFrameTreeResult:
      type: object
      properties:
        frameTree: {}
      required:
        - frameTree
      additionalProperties: false
    BrowserSessionCookiesResult:
      type: object
      properties:
        cookies:
          type: array
          items:
            $ref: "#/components/schemas/BrowserSessionCookie"
      required:
        - cookies
      additionalProperties: false
    BrowserSessionAddCookiesResult:
      type: object
      properties:
        added:
          type: integer
          minimum: 0
          maximum: 9007199254740991
      required:
        - added
      additionalProperties: false
    BrowserSessionClearCookiesResult:
      type: object
      properties:
        cleared:
          type: boolean
      required:
        - cleared
      additionalProperties: false
    BrowserSessionConnectURLResult:
      type: object
      properties:
        connectURL:
          type: string
      required:
        - connectURL
      additionalProperties: false
    BrowserSessionConfiguredViewportResult:
      $ref: "#/components/schemas/BrowserSessionViewport"
    BrowserSessionBrowserbaseSessionIDResult:
      type: object
      properties:
        browserbaseSessionID:
          anyOf:
            - type: string
            - type: "null"
      required:
        - browserbaseSessionID
      additionalProperties: false
    BrowserSessionBrowserbaseSessionURLResult:
      type: object
      properties:
        browserbaseSessionURL:
          anyOf:
            - type: string
            - type: "null"
      required:
        - browserbaseSessionURL
      additionalProperties: false
    BrowserSessionBrowserbaseDebugURLResult:
      type: object
      properties:
        browserbaseDebugURL:
          anyOf:
            - type: string
            - type: "null"
      required:
        - browserbaseDebugURL
      additionalProperties: false
    BrowserSessionIsBrowserbaseResult:
      type: object
      properties:
        isBrowserbase:
          type: boolean
      required:
        - isBrowserbase
      additionalProperties: false
    BrowserSessionIsAdvancedStealthResult:
      type: object
      properties:
        isAdvancedStealth:
          type: boolean
      required:
        - isAdvancedStealth
      additionalProperties: false
    BrowserSessionSetViewportSizeResult:
      $ref: "#/components/schemas/BrowserSessionViewport"
    BrowserSessionCloseResult:
      type: object
      properties:
        closed:
          type: boolean
      required:
        - closed
      additionalProperties: false
    PageXPathResult:
      type: object
      properties:
        xpath:
          type: string
      additionalProperties: false
    PageDragAndDropResult:
      type: object
      properties:
        fromXpath:
          type: string
        toXpath:
          type: string
      additionalProperties: false
    PageTypeResult:
      type: object
      properties:
        text:
          type: string
      required:
        - text
      additionalProperties: false
    PageKeyPressResult:
      type: object
      properties:
        key:
          type: string
      required:
        - key
      additionalProperties: false
    PageEnableCursorOverlayResult:
      type: object
      properties:
        enabled:
          type: boolean
      required:
        - enabled
      additionalProperties: false
    PageAddInitScriptResult:
      type: object
      properties:
        added:
          type: boolean
      required:
        - added
      additionalProperties: false
    PageNavigationResult:
      type: object
      properties:
        url:
          type: string
        response:
          anyOf:
            - type: object
              properties:
                url:
                  type: string
                status:
                  type: integer
                  minimum: -9007199254740991
                  maximum: 9007199254740991
                statusText:
                  type: string
                ok:
                  type: boolean
                headers:
                  $ref: "#/components/schemas/PageHeaders"
              required:
                - url
                - status
                - statusText
                - ok
                - headers
              additionalProperties: false
            - type: "null"
      required:
        - url
        - response
      additionalProperties: false
    PageTargetIdResult:
      type: object
      properties:
        targetId:
          $ref: "#/components/schemas/PageId"
      required:
        - targetId
      additionalProperties: false
    PageMainFrameIdResult:
      type: object
      properties:
        mainFrameId:
          $ref: "#/components/schemas/FrameId"
      required:
        - mainFrameId
      additionalProperties: false
    PageMainFrameResult:
      type: object
      properties:
        frame:
          $ref: "#/components/schemas/PageFrame"
      required:
        - frame
      additionalProperties: false
    PageFrame:
      type: object
      properties:
        frameId:
          $ref: "#/components/schemas/FrameId"
        pageId:
          $ref: "#/components/schemas/PageId"
        sessionId:
          anyOf:
            - $ref: "#/components/schemas/CDPSessionId"
            - type: "null"
        isBrowserRemote:
          type: boolean
      required:
        - frameId
        - pageId
        - sessionId
        - isBrowserRemote
      additionalProperties: false
    PageFrameTreeResult:
      type: object
      properties:
        frameTree: {}
      required:
        - frameTree
      additionalProperties: false
    PageListAllFrameIdsResult:
      type: object
      properties:
        frameIds:
          type: array
          items:
            $ref: "#/components/schemas/FrameId"
      required:
        - frameIds
      additionalProperties: false
    PageGetOrdinalResult:
      type: object
      properties:
        frameId:
          $ref: "#/components/schemas/FrameId"
        ordinal:
          type: integer
          minimum: 0
          maximum: 9007199254740991
      required:
        - frameId
        - ordinal
      additionalProperties: false
    PageTitleResult:
      type: object
      properties:
        title:
          type: string
      required:
        - title
      additionalProperties: false
    PageUrlResult:
      type: object
      properties:
        url:
          type: string
      required:
        - url
      additionalProperties: false
    PageScreenshotResult:
      type: object
      properties:
        base64:
          type: string
        mimeType:
          $ref: "#/components/schemas/ScreenshotMimeType"
      required:
        - base64
        - mimeType
      additionalProperties: false
    PageSnapshotResult:
      type: object
      properties:
        formattedTree:
          type: string
        xpathMap:
          type: object
          properties: {}
          additionalProperties:
            type: string
        urlMap:
          type: object
          properties: {}
          additionalProperties:
            type: string
      required:
        - formattedTree
        - xpathMap
        - urlMap
      additionalProperties: false
    PageFramesResult:
      type: object
      properties:
        frames:
          type: array
          items:
            $ref: "#/components/schemas/PageFrame"
      required:
        - frames
      additionalProperties: false
    PageSetViewportSizeResult:
      type: object
      properties:
        width:
          type: number
          exclusiveMinimum: 0
        height:
          type: number
          exclusiveMinimum: 0
        deviceScaleFactor:
          type: number
          exclusiveMinimum: 0
      required:
        - width
        - height
      additionalProperties: false
    PageSetExtraHTTPHeadersResult:
      type: object
      properties:
        headers:
          $ref: "#/components/schemas/PageHeaders"
      required:
        - headers
      additionalProperties: false
    PageWaitForLoadStateResult:
      type: object
      properties:
        state:
          $ref: "#/components/schemas/LoadState"
      required:
        - state
      additionalProperties: false
    PageWaitForSelectorResult:
      type: object
      properties:
        selector:
          $ref: "#/components/schemas/ElementSelector"
        matched:
          type: boolean
      required:
        - selector
        - matched
      additionalProperties: false
    PageWaitForTimeoutResult:
      type: object
      properties:
        ms:
          type: integer
          minimum: 0
          maximum: 9007199254740991
      required:
        - ms
      additionalProperties: false
    PageEvaluateResult:
      type: object
      properties:
        value: {}
      required:
        - value
      additionalProperties: false
    PageSendCDPResult:
      type: object
      properties:
        value: {}
      required:
        - value
      additionalProperties: false
    PageCloseResult:
      type: object
      properties:
        closed:
          type: boolean
      required:
        - closed
      additionalProperties: false
    LocalBrowserLaunchOptions:
      type: object
      properties:
        args:
          type: array
          items:
            type: string
        executablePath:
          type: string
        port:
          type: number
        userDataDir:
          type: string
        preserveUserDataDir:
          type: boolean
        headless:
          type: boolean
        devtools:
          type: boolean
        chromiumSandbox:
          type: boolean
        ignoreDefaultArgs:
          anyOf:
            - type: boolean
            - type: array
              items:
                type: string
        proxy:
          type: object
          properties:
            server:
              type: string
            bypass:
              type: string
            username:
              type: string
            password:
              type: string
          required:
            - server
        locale:
          type: string
        viewport:
          type: object
          properties:
            width:
              type: number
            height:
              type: number
          required:
            - width
            - height
        deviceScaleFactor:
          type: number
        hasTouch:
          type: boolean
        ignoreHTTPSErrors:
          type: boolean
        cdpUrl:
          type: string
        cdpHeaders:
          type: object
          propertyNames:
            type: string
          additionalProperties:
            type: string
        connectTimeoutMs:
          type: number
        downloadsPath:
          type: string
        acceptDownloads:
          type: boolean
      additionalProperties: false
    BrowserbaseSessionCreateParams:
      type: object
      properties:
        projectId:
          type: string
        browserSettings:
          $ref: "#/components/schemas/BrowserbaseBrowserSettings"
        extensionId:
          type: string
        keepAlive:
          type: boolean
        proxies:
          anyOf:
            - type: boolean
            - type: array
              items:
                $ref: "#/components/schemas/ProxyConfig"
        region:
          $ref: "#/components/schemas/BrowserbaseRegion"
        timeout:
          type: number
        userMetadata:
          type: object
          propertyNames:
            type: string
          additionalProperties: {}
    BrowserSessionId:
      example: session_01JXAMPLE
      type: string
      minLength: 1
    BrowserSessionEnv:
      type: string
      enum:
        - LOCAL
        - BROWSERBASE
    BrowserSessionStatus:
      type: string
      enum:
        - running
        - ended
    BrowserSessionCreateRequest:
      oneOf:
        - $ref: "#/components/schemas/BrowserSessionLocalCreateRequest"
        - $ref: "#/components/schemas/BrowserSessionBrowserbaseCreateRequest"
      type: object
      discriminator:
        propertyName: env
        mapping:
          LOCAL: "#/components/schemas/BrowserSessionLocalCreateRequest"
          BROWSERBASE: "#/components/schemas/BrowserSessionBrowserbaseCreateRequest"
    BrowserSessionEndRequest:
      type: object
      properties: {}
      additionalProperties: false
    BrowserSession:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/BrowserSessionId"
        env:
          $ref: "#/components/schemas/BrowserSessionEnv"
        status:
          $ref: "#/components/schemas/BrowserSessionStatus"
        modelName:
          type: string
        cdpUrl:
          anyOf:
            - type: string
            - type: "null"
        available:
          type: boolean
        browserbaseSessionId:
          type: string
        browserbaseSessionCreateParams:
          $ref: "#/components/schemas/BrowserbaseSessionCreateParams"
        localBrowserLaunchOptions:
          $ref: "#/components/schemas/LocalBrowserLaunchOptions"
        domSettleTimeoutMs:
          type: number
        verbose:
          anyOf:
            - type: number
              const: 0
            - type: number
              const: 1
            - type: number
              const: 2
        systemPrompt:
          type: string
        selfHeal:
          type: boolean
        waitForCaptchaSolves:
          type: boolean
        experimental:
          type: boolean
        actTimeoutMs:
          type: number
      required:
        - id
        - env
        - status
        - modelName
        - available
      additionalProperties: false
    BrowserSessionResult:
      type: object
      properties:
        browserSession:
          $ref: "#/components/schemas/BrowserSession"
      required:
        - browserSession
      additionalProperties: false
    BrowserSessionActionMethod:
      type: string
      enum:
        - addInitScript
        - setExtraHTTPHeaders
        - pages
        - activePage
        - awaitActivePage
        - resolvePageByMainFrameId
        - getFullFrameTreeByMainFrameId
        - newPage
        - cookies
        - addCookies
        - clearCookies
        - connectURL
        - configuredViewport
        - browserbaseSessionID
        - browserbaseSessionURL
        - browserbaseDebugURL
        - isBrowserbase
        - isAdvancedStealth
        - setViewportSize
        - close
    BrowserSessionActionStatus:
      type: string
      enum:
        - queued
        - running
        - completed
        - failed
        - canceled
    BrowserSessionPage:
      type: object
      properties:
        pageId:
          $ref: "#/components/schemas/PageId"
        targetId:
          $ref: "#/components/schemas/PageId"
        mainFrameId:
          $ref: "#/components/schemas/FrameId"
        url:
          type: string
      required:
        - pageId
        - targetId
        - mainFrameId
        - url
      additionalProperties: false
    BrowserSessionCookie:
      type: object
      properties:
        name:
          type: string
        value:
          type: string
        domain:
          type: string
        path:
          type: string
        expires:
          type: number
        httpOnly:
          type: boolean
        secure:
          type: boolean
        sameSite:
          type: string
          enum:
            - Strict
            - Lax
            - None
      required:
        - name
        - value
        - domain
        - path
        - expires
        - httpOnly
        - secure
        - sameSite
      additionalProperties: false
    BrowserSessionCookieParam:
      type: object
      properties:
        name:
          type: string
        value:
          type: string
        url:
          type: string
        domain:
          type: string
        path:
          type: string
        expires:
          type: number
        httpOnly:
          type: boolean
        secure:
          type: boolean
        sameSite:
          type: string
          enum:
            - Strict
            - Lax
            - None
      required:
        - name
        - value
      additionalProperties: false
    BrowserSessionRegex:
      type: object
      properties:
        source:
          type: string
        flags:
          type: string
      required:
        - source
      additionalProperties: false
    BrowserSessionStringPattern:
      anyOf:
        - type: string
        - $ref: "#/components/schemas/BrowserSessionRegex"
    BrowserSessionClearCookiesOptions:
      type: object
      properties:
        name:
          $ref: "#/components/schemas/BrowserSessionStringPattern"
        domain:
          $ref: "#/components/schemas/BrowserSessionStringPattern"
        path:
          $ref: "#/components/schemas/BrowserSessionStringPattern"
      additionalProperties: false
    BrowserSessionViewport:
      type: object
      properties:
        width:
          type: number
          exclusiveMinimum: 0
        height:
          type: number
          exclusiveMinimum: 0
        deviceScaleFactor:
          type: number
          exclusiveMinimum: 0
      required:
        - width
        - height
      additionalProperties: false
    BrowserSessionAddInitScriptParams:
      type: object
      properties:
        script:
          $ref: "#/components/schemas/PageInitScript"
      required:
        - script
      additionalProperties: false
    BrowserSessionSetExtraHTTPHeadersParams:
      type: object
      properties:
        headers:
          $ref: "#/components/schemas/PageHeaders"
      required:
        - headers
      additionalProperties: false
    BrowserSessionPagesParams:
      type: object
      properties: {}
      additionalProperties: false
    BrowserSessionActivePageParams:
      type: object
      properties: {}
      additionalProperties: false
    BrowserSessionAwaitActivePageParams:
      type: object
      properties:
        timeoutMs:
          type: integer
          minimum: 0
          maximum: 9007199254740991
      additionalProperties: false
    BrowserSessionResolvePageByMainFrameIdParams:
      type: object
      properties:
        mainFrameId:
          $ref: "#/components/schemas/FrameId"
      required:
        - mainFrameId
      additionalProperties: false
    BrowserSessionGetFullFrameTreeByMainFrameIdParams:
      type: object
      properties:
        mainFrameId:
          $ref: "#/components/schemas/FrameId"
      required:
        - mainFrameId
      additionalProperties: false
    BrowserSessionNewPageParams:
      type: object
      properties:
        url:
          type: string
      additionalProperties: false
    BrowserSessionCookiesParams:
      type: object
      properties:
        urls:
          anyOf:
            - type: string
            - type: array
              items:
                type: string
      additionalProperties: false
    BrowserSessionAddCookiesParams:
      type: object
      properties:
        cookies:
          type: array
          items:
            $ref: "#/components/schemas/BrowserSessionCookieParam"
      required:
        - cookies
      additionalProperties: false
    BrowserSessionClearCookiesParams:
      $ref: "#/components/schemas/BrowserSessionClearCookiesOptions"
    BrowserSessionConnectURLParams:
      type: object
      properties: {}
      additionalProperties: false
    BrowserSessionConfiguredViewportParams:
      type: object
      properties: {}
      additionalProperties: false
    BrowserSessionBrowserbaseSessionIDParams:
      type: object
      properties: {}
      additionalProperties: false
    BrowserSessionBrowserbaseSessionURLParams:
      type: object
      properties: {}
      additionalProperties: false
    BrowserSessionBrowserbaseDebugURLParams:
      type: object
      properties: {}
      additionalProperties: false
    # Takes no parameters: only the empty object `{}` validates.
    BrowserSessionIsBrowserbaseParams:
      type: object
      properties: {}
      additionalProperties: false
    # Takes no parameters: only the empty object `{}` validates.
    BrowserSessionIsAdvancedStealthParams:
      type: object
      properties: {}
      additionalProperties: false
    # Pure alias: the params shape is exactly BrowserSessionViewport.
    BrowserSessionSetViewportSizeParams:
      $ref: "#/components/schemas/BrowserSessionViewport"
    # Takes no parameters: only the empty object `{}` validates.
    BrowserSessionCloseParams:
      type: object
      properties: {}
      additionalProperties: false
    # Request envelope carrying BrowserSessionAddInitScriptParams.
    # `sessionId` and `params` are required; the request `id` is optional.
    BrowserSessionAddInitScriptRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/BrowserSessionId"
        params:
          $ref: "#/components/schemas/BrowserSessionAddInitScriptParams"
      required:
        - sessionId
        - params
      additionalProperties: false
    # Request envelope carrying BrowserSessionSetExtraHTTPHeadersParams.
    # `sessionId` and `params` are required; the request `id` is optional.
    BrowserSessionSetExtraHTTPHeadersRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/BrowserSessionId"
        params:
          $ref: "#/components/schemas/BrowserSessionSetExtraHTTPHeadersParams"
      required:
        - sessionId
        - params
      additionalProperties: false
    # Request envelope carrying BrowserSessionPagesParams.
    # `sessionId` and `params` are required; the request `id` is optional.
    BrowserSessionPagesRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/BrowserSessionId"
        params:
          $ref: "#/components/schemas/BrowserSessionPagesParams"
      required:
        - sessionId
        - params
      additionalProperties: false
    # Request envelope carrying BrowserSessionActivePageParams.
    # `sessionId` and `params` are required; the request `id` is optional.
    BrowserSessionActivePageRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/BrowserSessionId"
        params:
          $ref: "#/components/schemas/BrowserSessionActivePageParams"
      required:
        - sessionId
        - params
      additionalProperties: false
    # Request envelope carrying BrowserSessionAwaitActivePageParams.
    # `sessionId` and `params` are required; the request `id` is optional.
    BrowserSessionAwaitActivePageRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/BrowserSessionId"
        params:
          $ref: "#/components/schemas/BrowserSessionAwaitActivePageParams"
      required:
        - sessionId
        - params
      additionalProperties: false
    # Request envelope carrying BrowserSessionResolvePageByMainFrameIdParams.
    # `sessionId` and `params` are required; the request `id` is optional.
    BrowserSessionResolvePageByMainFrameIdRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/BrowserSessionId"
        params:
          $ref: "#/components/schemas/BrowserSessionResolvePageByMainFrameIdParams"
      required:
        - sessionId
        - params
      additionalProperties: false
    # Request envelope carrying BrowserSessionGetFullFrameTreeByMainFrameIdParams.
    # `sessionId` and `params` are required; the request `id` is optional.
    BrowserSessionGetFullFrameTreeByMainFrameIdRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/BrowserSessionId"
        params:
          $ref: "#/components/schemas/BrowserSessionGetFullFrameTreeByMainFrameIdParams"
      required:
        - sessionId
        - params
      additionalProperties: false
    # Request envelope carrying BrowserSessionNewPageParams.
    # `sessionId` and `params` are required; the request `id` is optional.
    BrowserSessionNewPageRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/BrowserSessionId"
        params:
          $ref: "#/components/schemas/BrowserSessionNewPageParams"
      required:
        - sessionId
        - params
      additionalProperties: false
    # Request envelope carrying BrowserSessionCookiesParams.
    # `sessionId` and `params` are required; the request `id` is optional.
    BrowserSessionCookiesRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/BrowserSessionId"
        params:
          $ref: "#/components/schemas/BrowserSessionCookiesParams"
      required:
        - sessionId
        - params
      additionalProperties: false
    # Request envelope carrying BrowserSessionAddCookiesParams.
    # `sessionId` and `params` are required; the request `id` is optional.
    BrowserSessionAddCookiesRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/BrowserSessionId"
        params:
          $ref: "#/components/schemas/BrowserSessionAddCookiesParams"
      required:
        - sessionId
        - params
      additionalProperties: false
    # Request envelope carrying BrowserSessionClearCookiesParams.
    # `sessionId` and `params` are required; the request `id` is optional.
    BrowserSessionClearCookiesRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/BrowserSessionId"
        params:
          $ref: "#/components/schemas/BrowserSessionClearCookiesParams"
      required:
        - sessionId
        - params
      additionalProperties: false
    # Request envelope carrying BrowserSessionConnectURLParams.
    # `sessionId` and `params` are required; the request `id` is optional.
    BrowserSessionConnectURLRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/BrowserSessionId"
        params:
          $ref: "#/components/schemas/BrowserSessionConnectURLParams"
      required:
        - sessionId
        - params
      additionalProperties: false
    # Request envelope carrying BrowserSessionConfiguredViewportParams.
    # `sessionId` and `params` are required; the request `id` is optional.
    BrowserSessionConfiguredViewportRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/BrowserSessionId"
        params:
          $ref: "#/components/schemas/BrowserSessionConfiguredViewportParams"
      required:
        - sessionId
        - params
      additionalProperties: false
    # Request envelope carrying BrowserSessionBrowserbaseSessionIDParams.
    # `sessionId` and `params` are required; the request `id` is optional.
    BrowserSessionBrowserbaseSessionIDRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/BrowserSessionId"
        params:
          $ref: "#/components/schemas/BrowserSessionBrowserbaseSessionIDParams"
      required:
        - sessionId
        - params
      additionalProperties: false
    # Request envelope carrying BrowserSessionBrowserbaseSessionURLParams.
    # `sessionId` and `params` are required; the request `id` is optional.
    BrowserSessionBrowserbaseSessionURLRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/BrowserSessionId"
        params:
          $ref: "#/components/schemas/BrowserSessionBrowserbaseSessionURLParams"
      required:
        - sessionId
        - params
      additionalProperties: false
    # Request envelope carrying BrowserSessionBrowserbaseDebugURLParams.
    # `sessionId` and `params` are required; the request `id` is optional.
    # NOTE(review): the run of *Request schemas ends here, yet Params and Action schemas
    # exist for isBrowserbase, isAdvancedStealth, setViewportSize and close. Confirm their
    # Request envelopes are defined elsewhere or intentionally omitted.
    BrowserSessionBrowserbaseDebugURLRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/BrowserSessionId"
        params:
          $ref: "#/components/schemas/BrowserSessionBrowserbaseDebugURLParams"
      required:
        - sessionId
        - params
      additionalProperties: false
    # Action record whose `method` is pinned to `addInitScript`.
    # `pageId` and `completedAt` are optional; `error` and `result` must be present but may be null.
    BrowserSessionAddInitScriptAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: addInitScript
        status:
          $ref: "#/components/schemas/BrowserSessionActionStatus"
        sessionId:
          $ref: "#/components/schemas/BrowserSessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - type: string
            - type: "null"
        params:
          $ref: "#/components/schemas/BrowserSessionAddInitScriptParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/BrowserSessionAddInitScriptResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Action record whose `method` is pinned to `setExtraHTTPHeaders`.
    # `pageId` and `completedAt` are optional; `error` and `result` must be present but may be null.
    BrowserSessionSetExtraHTTPHeadersAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: setExtraHTTPHeaders
        status:
          $ref: "#/components/schemas/BrowserSessionActionStatus"
        sessionId:
          $ref: "#/components/schemas/BrowserSessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - type: string
            - type: "null"
        params:
          $ref: "#/components/schemas/BrowserSessionSetExtraHTTPHeadersParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/BrowserSessionSetExtraHTTPHeadersResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Action record whose `method` is pinned to `pages`.
    # `pageId` and `completedAt` are optional; `error` and `result` must be present but may be null.
    BrowserSessionPagesAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: pages
        status:
          $ref: "#/components/schemas/BrowserSessionActionStatus"
        sessionId:
          $ref: "#/components/schemas/BrowserSessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - type: string
            - type: "null"
        params:
          $ref: "#/components/schemas/BrowserSessionPagesParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/BrowserSessionPagesResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Action record whose `method` is pinned to `activePage`.
    # `pageId` and `completedAt` are optional; `error` and `result` must be present but may be null.
    # The non-null result shape is the shared BrowserSessionOptionalPageResult, not a per-method schema.
    BrowserSessionActivePageAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: activePage
        status:
          $ref: "#/components/schemas/BrowserSessionActionStatus"
        sessionId:
          $ref: "#/components/schemas/BrowserSessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - type: string
            - type: "null"
        params:
          $ref: "#/components/schemas/BrowserSessionActivePageParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/BrowserSessionOptionalPageResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Action record whose `method` is pinned to `awaitActivePage`.
    # `pageId` and `completedAt` are optional; `error` and `result` must be present but may be null.
    # The non-null result shape is the shared BrowserSessionPageResult, not a per-method schema.
    BrowserSessionAwaitActivePageAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: awaitActivePage
        status:
          $ref: "#/components/schemas/BrowserSessionActionStatus"
        sessionId:
          $ref: "#/components/schemas/BrowserSessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - type: string
            - type: "null"
        params:
          $ref: "#/components/schemas/BrowserSessionAwaitActivePageParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/BrowserSessionPageResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Action record whose `method` is pinned to `resolvePageByMainFrameId`.
    # `pageId` and `completedAt` are optional; `error` and `result` must be present but may be null.
    # The non-null result shape is the shared BrowserSessionOptionalPageResult, not a per-method schema.
    BrowserSessionResolvePageByMainFrameIdAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: resolvePageByMainFrameId
        status:
          $ref: "#/components/schemas/BrowserSessionActionStatus"
        sessionId:
          $ref: "#/components/schemas/BrowserSessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - type: string
            - type: "null"
        params:
          $ref: "#/components/schemas/BrowserSessionResolvePageByMainFrameIdParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/BrowserSessionOptionalPageResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Action record whose `method` is pinned to `getFullFrameTreeByMainFrameId`.
    # `pageId` and `completedAt` are optional; `error` and `result` must be present but may be null.
    # The non-null result shape is BrowserSessionFrameTreeResult.
    BrowserSessionGetFullFrameTreeByMainFrameIdAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: getFullFrameTreeByMainFrameId
        status:
          $ref: "#/components/schemas/BrowserSessionActionStatus"
        sessionId:
          $ref: "#/components/schemas/BrowserSessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - type: string
            - type: "null"
        params:
          $ref: "#/components/schemas/BrowserSessionGetFullFrameTreeByMainFrameIdParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/BrowserSessionFrameTreeResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Action record whose `method` is pinned to `newPage`.
    # `pageId` and `completedAt` are optional; `error` and `result` must be present but may be null.
    # The non-null result shape is the shared BrowserSessionPageResult, not a per-method schema.
    BrowserSessionNewPageAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: newPage
        status:
          $ref: "#/components/schemas/BrowserSessionActionStatus"
        sessionId:
          $ref: "#/components/schemas/BrowserSessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - type: string
            - type: "null"
        params:
          $ref: "#/components/schemas/BrowserSessionNewPageParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/BrowserSessionPageResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Action record whose `method` is pinned to `cookies`.
    # `pageId` and `completedAt` are optional; `error` and `result` must be present but may be null.
    BrowserSessionCookiesAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: cookies
        status:
          $ref: "#/components/schemas/BrowserSessionActionStatus"
        sessionId:
          $ref: "#/components/schemas/BrowserSessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - type: string
            - type: "null"
        params:
          $ref: "#/components/schemas/BrowserSessionCookiesParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/BrowserSessionCookiesResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Action record whose `method` is pinned to `addCookies`.
    # `pageId` and `completedAt` are optional; `error` and `result` must be present but may be null.
    BrowserSessionAddCookiesAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: addCookies
        status:
          $ref: "#/components/schemas/BrowserSessionActionStatus"
        sessionId:
          $ref: "#/components/schemas/BrowserSessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - type: string
            - type: "null"
        params:
          $ref: "#/components/schemas/BrowserSessionAddCookiesParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/BrowserSessionAddCookiesResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Action record whose `method` is pinned to `clearCookies`.
    # `pageId` and `completedAt` are optional; `error` and `result` must be present but may be null.
    BrowserSessionClearCookiesAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: clearCookies
        status:
          $ref: "#/components/schemas/BrowserSessionActionStatus"
        sessionId:
          $ref: "#/components/schemas/BrowserSessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - type: string
            - type: "null"
        params:
          $ref: "#/components/schemas/BrowserSessionClearCookiesParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/BrowserSessionClearCookiesResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Action record whose `method` is pinned to `connectURL`.
    # `pageId` and `completedAt` are optional; `error` and `result` must be present but may be null.
    BrowserSessionConnectURLAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: connectURL
        status:
          $ref: "#/components/schemas/BrowserSessionActionStatus"
        sessionId:
          $ref: "#/components/schemas/BrowserSessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - type: string
            - type: "null"
        params:
          $ref: "#/components/schemas/BrowserSessionConnectURLParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/BrowserSessionConnectURLResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Action record whose `method` is pinned to `configuredViewport`.
    # `pageId` and `completedAt` are optional; `error` and `result` must be present but may be null.
    BrowserSessionConfiguredViewportAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: configuredViewport
        status:
          $ref: "#/components/schemas/BrowserSessionActionStatus"
        sessionId:
          $ref: "#/components/schemas/BrowserSessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - type: string
            - type: "null"
        params:
          $ref: "#/components/schemas/BrowserSessionConfiguredViewportParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/BrowserSessionConfiguredViewportResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Action record whose `method` is pinned to `browserbaseSessionID`.
    # `pageId` and `completedAt` are optional; `error` and `result` must be present but may be null.
    BrowserSessionBrowserbaseSessionIDAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: browserbaseSessionID
        status:
          $ref: "#/components/schemas/BrowserSessionActionStatus"
        sessionId:
          $ref: "#/components/schemas/BrowserSessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - type: string
            - type: "null"
        params:
          $ref: "#/components/schemas/BrowserSessionBrowserbaseSessionIDParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/BrowserSessionBrowserbaseSessionIDResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Action record whose `method` is pinned to `browserbaseSessionURL`.
    # `pageId` and `completedAt` are optional; `error` and `result` must be present but may be null.
    BrowserSessionBrowserbaseSessionURLAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: browserbaseSessionURL
        status:
          $ref: "#/components/schemas/BrowserSessionActionStatus"
        sessionId:
          $ref: "#/components/schemas/BrowserSessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - type: string
            - type: "null"
        params:
          $ref: "#/components/schemas/BrowserSessionBrowserbaseSessionURLParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/BrowserSessionBrowserbaseSessionURLResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Action record whose `method` is pinned to `browserbaseDebugURL`.
    # `pageId` and `completedAt` are optional; `error` and `result` must be present but may be null.
    BrowserSessionBrowserbaseDebugURLAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: browserbaseDebugURL
        status:
          $ref: "#/components/schemas/BrowserSessionActionStatus"
        sessionId:
          $ref: "#/components/schemas/BrowserSessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - type: string
            - type: "null"
        params:
          $ref: "#/components/schemas/BrowserSessionBrowserbaseDebugURLParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/BrowserSessionBrowserbaseDebugURLResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Action record whose `method` is pinned to `isBrowserbase`.
    # `pageId` and `completedAt` are optional; `error` and `result` must be present but may be null.
    BrowserSessionIsBrowserbaseAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: isBrowserbase
        status:
          $ref: "#/components/schemas/BrowserSessionActionStatus"
        sessionId:
          $ref: "#/components/schemas/BrowserSessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - type: string
            - type: "null"
        params:
          $ref: "#/components/schemas/BrowserSessionIsBrowserbaseParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/BrowserSessionIsBrowserbaseResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Action record whose `method` is pinned to `isAdvancedStealth`.
    # `pageId` and `completedAt` are optional; `error` and `result` must be present but may be null.
    BrowserSessionIsAdvancedStealthAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: isAdvancedStealth
        status:
          $ref: "#/components/schemas/BrowserSessionActionStatus"
        sessionId:
          $ref: "#/components/schemas/BrowserSessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - type: string
            - type: "null"
        params:
          $ref: "#/components/schemas/BrowserSessionIsAdvancedStealthParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/BrowserSessionIsAdvancedStealthResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Action record whose `method` is pinned to `setViewportSize`.
    # `pageId` and `completedAt` are optional; `error` and `result` must be present but may be null.
    BrowserSessionSetViewportSizeAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: setViewportSize
        status:
          $ref: "#/components/schemas/BrowserSessionActionStatus"
        sessionId:
          $ref: "#/components/schemas/BrowserSessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - type: string
            - type: "null"
        params:
          $ref: "#/components/schemas/BrowserSessionSetViewportSizeParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/BrowserSessionSetViewportSizeResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Action record whose `method` is pinned to `close`.
    # `pageId` and `completedAt` are optional; `error` and `result` must be present but may be null.
    BrowserSessionCloseAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: close
        status:
          $ref: "#/components/schemas/BrowserSessionActionStatus"
        sessionId:
          $ref: "#/components/schemas/BrowserSessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - type: string
            - type: "null"
        params:
          $ref: "#/components/schemas/BrowserSessionCloseParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/BrowserSessionCloseResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Union of the twenty per-method browser-session action schemas.
    # Every member requires `method` and pins it to a different `const`, so a valid
    # instance can match at most one member even though this is declared with `anyOf`.
    BrowserSessionAction:
      anyOf:
        - $ref: "#/components/schemas/BrowserSessionAddInitScriptAction"
        - $ref: "#/components/schemas/BrowserSessionSetExtraHTTPHeadersAction"
        - $ref: "#/components/schemas/BrowserSessionPagesAction"
        - $ref: "#/components/schemas/BrowserSessionActivePageAction"
        - $ref: "#/components/schemas/BrowserSessionAwaitActivePageAction"
        - $ref: "#/components/schemas/BrowserSessionResolvePageByMainFrameIdAction"
        - $ref: "#/components/schemas/BrowserSessionGetFullFrameTreeByMainFrameIdAction"
        - $ref: "#/components/schemas/BrowserSessionNewPageAction"
        - $ref: "#/components/schemas/BrowserSessionCookiesAction"
        - $ref: "#/components/schemas/BrowserSessionAddCookiesAction"
        - $ref: "#/components/schemas/BrowserSessionClearCookiesAction"
        - $ref: "#/components/schemas/BrowserSessionConnectURLAction"
        - $ref: "#/components/schemas/BrowserSessionConfiguredViewportAction"
        - $ref: "#/components/schemas/BrowserSessionBrowserbaseSessionIDAction"
        - $ref: "#/components/schemas/BrowserSessionBrowserbaseSessionURLAction"
        - $ref: "#/components/schemas/BrowserSessionBrowserbaseDebugURLAction"
        - $ref: "#/components/schemas/BrowserSessionIsBrowserbaseAction"
        - $ref: "#/components/schemas/BrowserSessionIsAdvancedStealthAction"
        - $ref: "#/components/schemas/BrowserSessionSetViewportSizeAction"
        - $ref: "#/components/schemas/BrowserSessionCloseAction"
    # Non-empty string identifier. No pattern is declared, so the `req_` prefix in the
    # example is illustrative rather than enforced.
    RequestId:
      example: req_01JXAMPLE
      type: string
      minLength: 1
    # Non-empty string identifier. No pattern is declared, so the `session_` prefix in the
    # example is illustrative rather than enforced.
    SessionId:
      example: session_01JXAMPLE
      type: string
      minLength: 1
    # Non-empty string identifier. No pattern is declared, so the `target_` prefix in the
    # example is illustrative rather than enforced.
    PageId:
      example: target_01JXAMPLE
      type: string
      minLength: 1
    # Non-empty string identifier. No pattern is declared, so the `frame_` prefix in the
    # example is illustrative rather than enforced.
    FrameId:
      example: frame_01JXAMPLE
      type: string
      minLength: 1
    # Non-empty string identifier. No pattern is declared, so the `action_` prefix in the
    # example is illustrative rather than enforced.
    ActionId:
      example: action_01JXAMPLE
      type: string
      minLength: 1
    # Non-empty string identifier. No pattern is declared, so the `cdp-session_` prefix in
    # the example is illustrative rather than enforced.
    CDPSessionId:
      example: cdp-session_01JXAMPLE
      type: string
      minLength: 1
    # UTC date-time string. The pattern is stricter than `format: date-time` alone:
    #   - the date must be a real calendar date (Feb 29 only in leap years),
    #   - the time is HH:MM with optional :SS and optional fractional seconds,
    #   - the zone designator must be a literal `Z` (numeric offsets are rejected).
    Timestamp:
      # Quoted on purpose: as a plain scalar this value matches the YAML 1.1 timestamp
      # type, so loaders that implement it (e.g. PyYAML, js-yaml's default schema) would
      # produce a native date object instead of a string, contradicting `type: string`.
      example: "2026-02-03T12:00:00.000Z"
      type: string
      format: date-time
      pattern: ^(?:(?:\d\d[2468][048]|\d\d[13579][26]|\d\d0[48]|[02468][048]00|[13579][26]00)-02-29|\d{4}-(?:(?:0[13578]|1[02])-(?:0[1-9]|[12]\d|3[01])|(?:0[469]|11)-(?:0[1-9]|[12]\d|30)|(?:02)-(?:0[1-9]|1\d|2[0-8])))T(?:(?:[01]\d|2[0-3]):[0-5]\d(?::[0-5]\d(?:\.\d+)?)?(?:Z))$
    # String enum of mouse buttons; referenced by `button` in PageClickParams and PageDragAndDropParams.
    MouseButton:
      type: string
      enum:
        - left
        - right
        - middle
    # String enum referenced by `waitUntil` (goto/reload/goBack/goForward params)
    # and by `state` (waitForLoadState / waitForMainLoadState params).
    LoadState:
      type: string
      enum:
        - load
        - domcontentloaded
        - networkidle
    # String enum referenced by the optional `state` of PageWaitForSelectorParams.
    WaitForSelectorState:
      type: string
      enum:
        - attached
        - detached
        - visible
        - hidden
    # String enum referenced by the optional `type` of PageScreenshotParams.
    ScreenshotType:
      type: string
      enum:
        - png
        - jpeg
    # String enum of MIME types matching the two ScreenshotType values.
    # Presumably used by the screenshot result schema — confirm where it is referenced.
    ScreenshotMimeType:
      type: string
      enum:
        - image/png
        - image/jpeg
    # String enum referenced by the optional `scale` of PageScreenshotParams.
    ScreenshotScale:
      type: string
      enum:
        - css
        - device
    # String enum referenced by the optional `animations` of PageScreenshotParams.
    ScreenshotAnimations:
      type: string
      enum:
        - allow
        - disabled
    # String enum referenced by the optional `caret` of PageScreenshotParams.
    ScreenshotCaret:
      type: string
      enum:
        - hide
        - initial
    # String enum of page action method names. The `const` values used for `method`
    # on the Page*Action records (e.g. click, hover, scroll, goto, reload) appear in this list.
    PageActionMethod:
      type: string
      enum:
        - click
        - hover
        - scroll
        - dragAndDrop
        - type
        - keyPress
        - enableCursorOverlay
        - addInitScript
        - goto
        - reload
        - goBack
        - goForward
        - targetId
        - mainFrameId
        - mainFrame
        - getFullFrameTree
        - asProtocolFrameTree
        - listAllFrameIds
        - getOrdinal
        - title
        - url
        - screenshot
        - snapshot
        - frames
        - setViewportSize
        - setExtraHTTPHeaders
        - waitForLoadState
        - waitForMainLoadState
        - waitForSelector
        - waitForTimeout
        - evaluate
        - sendCDP
        - close
    # String enum referenced by the required `status` of the Page*Action records.
    PageActionStatus:
      type: string
      enum:
        - queued
        - running
        - completed
        - failed
        - canceled
    # Selector variant keyed by `xpath` (required, non-empty). `idx` is an optional
    # non-negative integer; no other properties are allowed.
    XPathSelector:
      type: object
      properties:
        xpath:
          example: //button[text()='Submit']
          type: string
          minLength: 1
        idx:
          example: 0
          type: integer
          minimum: 0
          # 2^53 - 1, the largest integer exactly representable as a JavaScript number.
          maximum: 9007199254740991
      required:
        - xpath
      additionalProperties: false
    # Selector variant keyed by `css` (required, non-empty). `idx` is an optional
    # non-negative integer; no other properties are allowed.
    CssSelector:
      type: object
      properties:
        css:
          example: .btn-submit
          type: string
          minLength: 1
        idx:
          example: 0
          type: integer
          minimum: 0
          maximum: 9007199254740991
      required:
        - css
      additionalProperties: false
    # Selector variant keyed by `text` (required, non-empty). `idx` is an optional
    # non-negative integer; no other properties are allowed.
    TextSelector:
      type: object
      properties:
        text:
          example: Submit
          type: string
          minLength: 1
        idx:
          example: 0
          type: integer
          minimum: 0
          maximum: 9007199254740991
      required:
        - text
      additionalProperties: false
    # Selector variant made of two required numbers, `x` and `y`; no bounds are
    # declared and no other properties are allowed.
    CoordinateSelector:
      type: object
      properties:
        x:
          type: number
        y:
          type: number
      required:
        - x
        - y
      additionalProperties: false
    # Union of all four selector variants, including coordinates.
    # Used by click, hover and drag-and-drop params.
    Selector:
      anyOf:
        - $ref: "#/components/schemas/XPathSelector"
        - $ref: "#/components/schemas/CssSelector"
        - $ref: "#/components/schemas/TextSelector"
        - $ref: "#/components/schemas/CoordinateSelector"
    # Union of the three non-coordinate selector variants (xpath, css, text).
    # Used by PageScrollElementParams and PageWaitForSelectorParams.
    ElementSelector:
      anyOf:
        - $ref: "#/components/schemas/XPathSelector"
        - $ref: "#/components/schemas/CssSelector"
        - $ref: "#/components/schemas/TextSelector"
    # String-to-string map: no fixed properties, and every property value must be a string.
    # Referenced by `headers` in PageSetExtraHTTPHeadersParams.
    PageHeaders:
      type: object
      properties: {}
      additionalProperties:
        type: string
    # Either a non-empty string, or an object with optional non-empty `path` and/or `content`.
    # NOTE(review): neither object property is required, so an empty object `{}`
    # validates against the second branch — confirm this is intended.
    PageInitScript:
      anyOf:
        - type: string
          minLength: 1
        - type: object
          properties:
            path:
              type: string
              minLength: 1
            content:
              type: string
              minLength: 1
          additionalProperties: false
    # Rectangle referenced by `clip` in PageScreenshotParams. All four fields are required:
    # `x`/`y` are unbounded numbers, `width`/`height` are strictly positive integers.
    PageClip:
      type: object
      properties:
        x:
          type: number
        y:
          type: number
        width:
          type: integer
          # Numeric exclusiveMinimum (JSON Schema 2020-12 style): the value must be > 0.
          exclusiveMinimum: 0
          maximum: 9007199254740991
        height:
          type: integer
          exclusiveMinimum: 0
          maximum: 9007199254740991
      required:
        - x
        - y
        - width
        - height
      additionalProperties: false
    # Non-empty string; the non-null branch of `error` on the Page*Action records.
    PageError:
      type: string
      minLength: 1
    # Parameters for the `click` method. Only `selector` is required; `pageId`, `button`
    # and `clickCount` (integer >= 1) are optional. No other properties are allowed.
    PageClickParams:
      type: object
      properties:
        pageId:
          $ref: "#/components/schemas/PageId"
        selector:
          $ref: "#/components/schemas/Selector"
        button:
          $ref: "#/components/schemas/MouseButton"
        clickCount:
          type: integer
          minimum: 1
          maximum: 9007199254740991
      required:
        - selector
      additionalProperties: false
    # Parameters for the `hover` method: required `selector` (any Selector variant), optional `pageId`.
    PageHoverParams:
      type: object
      properties:
        pageId:
          $ref: "#/components/schemas/PageId"
        selector:
          $ref: "#/components/schemas/Selector"
      required:
        - selector
      additionalProperties: false
    # Element-based branch of PageScrollParams: requires an ElementSelector and a
    # `percentage` in the inclusive range 0-100.
    PageScrollElementParams:
      type: object
      properties:
        pageId:
          $ref: "#/components/schemas/PageId"
        selector:
          $ref: "#/components/schemas/ElementSelector"
        percentage:
          type: number
          minimum: 0
          maximum: 100
      required:
        - selector
        - percentage
      additionalProperties: false
    # Coordinate-based branch of PageScrollParams: requires a CoordinateSelector and
    # `deltaY`; `deltaX` is optional. Both deltas are unbounded numbers.
    PageScrollCoordinateParams:
      type: object
      properties:
        pageId:
          $ref: "#/components/schemas/PageId"
        selector:
          $ref: "#/components/schemas/CoordinateSelector"
        deltaX:
          type: number
        deltaY:
          type: number
      required:
        - selector
        - deltaY
      additionalProperties: false
    # Parameters for the `scroll` method: either the element/percentage form or the
    # coordinate/delta form. Both branches forbid extra properties, so the shapes cannot be mixed.
    PageScrollParams:
      anyOf:
        - $ref: "#/components/schemas/PageScrollElementParams"
        - $ref: "#/components/schemas/PageScrollCoordinateParams"
    # Parameters for the `dragAndDrop` method. `from` and `to` are required Selectors;
    # `button`, `steps` (integer > 0) and `delay` (integer >= 0) are optional.
    # NOTE(review): the unit of `delay` is not stated in this schema — confirm.
    PageDragAndDropParams:
      type: object
      properties:
        pageId:
          $ref: "#/components/schemas/PageId"
        from:
          $ref: "#/components/schemas/Selector"
        to:
          $ref: "#/components/schemas/Selector"
        button:
          $ref: "#/components/schemas/MouseButton"
        steps:
          type: integer
          exclusiveMinimum: 0
          maximum: 9007199254740991
        delay:
          type: integer
          minimum: 0
          maximum: 9007199254740991
      required:
        - from
        - to
      additionalProperties: false
    # Parameters for the `type` method. `text` is required and, having no minLength,
    # may be empty. `delay` (integer >= 0) and `withMistakes` are optional.
    PageTypeParams:
      type: object
      properties:
        pageId:
          $ref: "#/components/schemas/PageId"
        text:
          type: string
        delay:
          type: integer
          minimum: 0
          maximum: 9007199254740991
        withMistakes:
          type: boolean
      required:
        - text
      additionalProperties: false
    # Parameters for the `keyPress` method: required non-empty `key`, optional `delay` (integer >= 0).
    PageKeyPressParams:
      type: object
      properties:
        pageId:
          $ref: "#/components/schemas/PageId"
        key:
          type: string
          minLength: 1
        delay:
          type: integer
          minimum: 0
          maximum: 9007199254740991
      required:
        - key
      additionalProperties: false
    # Parameters for the `enableCursorOverlay` method: only an optional `pageId`, so `{}` is valid.
    PageEnableCursorOverlayParams:
      type: object
      properties:
        pageId:
          $ref: "#/components/schemas/PageId"
      additionalProperties: false
    # Parameters for the `addInitScript` method: required `script` (PageInitScript), optional `pageId`.
    PageAddInitScriptParams:
      type: object
      properties:
        pageId:
          $ref: "#/components/schemas/PageId"
        script:
          $ref: "#/components/schemas/PageInitScript"
      required:
        - script
      additionalProperties: false
    # Parameters for the `goto` method. `url` (format: uri) is required; `waitUntil`
    # and `timeoutMs` (integer >= 0) are optional.
    PageGotoParams:
      type: object
      properties:
        pageId:
          $ref: "#/components/schemas/PageId"
        url:
          type: string
          format: uri
        waitUntil:
          $ref: "#/components/schemas/LoadState"
        timeoutMs:
          type: integer
          minimum: 0
          maximum: 9007199254740991
      required:
        - url
      additionalProperties: false
    # Parameters for the `reload` method. Everything is optional: `pageId`, `waitUntil`,
    # `timeoutMs` (integer >= 0) and `ignoreCache`.
    PageReloadParams:
      type: object
      properties:
        pageId:
          $ref: "#/components/schemas/PageId"
        waitUntil:
          $ref: "#/components/schemas/LoadState"
        timeoutMs:
          type: integer
          minimum: 0
          maximum: 9007199254740991
        ignoreCache:
          type: boolean
      additionalProperties: false
    # Parameters for the `goBack` method. Everything is optional: `pageId`, `waitUntil`, `timeoutMs`.
    PageGoBackParams:
      type: object
      properties:
        pageId:
          $ref: "#/components/schemas/PageId"
        waitUntil:
          $ref: "#/components/schemas/LoadState"
        timeoutMs:
          type: integer
          minimum: 0
          maximum: 9007199254740991
      additionalProperties: false
    # Parameters for the `goForward` method; same shape as PageGoBackParams (all fields optional).
    PageGoForwardParams:
      type: object
      properties:
        pageId:
          $ref: "#/components/schemas/PageId"
        waitUntil:
          $ref: "#/components/schemas/LoadState"
        timeoutMs:
          type: integer
          minimum: 0
          maximum: 9007199254740991
      additionalProperties: false
    # Parameters for the `targetId` method: only an optional `pageId`.
    PageTargetIdParams:
      type: object
      properties:
        pageId:
          $ref: "#/components/schemas/PageId"
      additionalProperties: false
    # Parameters for the `mainFrameId` method: only an optional `pageId`.
    PageMainFrameIdParams:
      type: object
      properties:
        pageId:
          $ref: "#/components/schemas/PageId"
      additionalProperties: false
    # Parameters for the `mainFrame` method: only an optional `pageId`.
    PageMainFrameParams:
      type: object
      properties:
        pageId:
          $ref: "#/components/schemas/PageId"
      additionalProperties: false
    # Parameters for the `getFullFrameTree` method: only an optional `pageId`.
    PageGetFullFrameTreeParams:
      type: object
      properties:
        pageId:
          $ref: "#/components/schemas/PageId"
      additionalProperties: false
    # Parameters for the `asProtocolFrameTree` method: required `rootMainFrameId` (FrameId), optional `pageId`.
    PageAsProtocolFrameTreeParams:
      type: object
      properties:
        pageId:
          $ref: "#/components/schemas/PageId"
        rootMainFrameId:
          $ref: "#/components/schemas/FrameId"
      required:
        - rootMainFrameId
      additionalProperties: false
    # Parameters for the `listAllFrameIds` method: only an optional `pageId`.
    PageListAllFrameIdsParams:
      type: object
      properties:
        pageId:
          $ref: "#/components/schemas/PageId"
      additionalProperties: false
    # Parameters for the `getOrdinal` method: required `frameId` (FrameId), optional `pageId`.
    PageGetOrdinalParams:
      type: object
      properties:
        pageId:
          $ref: "#/components/schemas/PageId"
        frameId:
          $ref: "#/components/schemas/FrameId"
      required:
        - frameId
      additionalProperties: false
    # Parameters for the `title` method: only an optional `pageId`.
    PageTitleParams:
      type: object
      properties:
        pageId:
          $ref: "#/components/schemas/PageId"
      additionalProperties: false
    # Parameters for the `url` method: only an optional `pageId`.
    PageUrlParams:
      type: object
      properties:
        pageId:
          $ref: "#/components/schemas/PageId"
      additionalProperties: false
    # Parameters for the `screenshot` method. Every property is optional; `quality`
    # is an integer in the inclusive range 0-100.
    # NOTE(review): this schema names its timeout `timeout`, whereas the navigation and
    # load-state params use `timeoutMs`; the unit is not stated here — confirm.
    PageScreenshotParams:
      type: object
      properties:
        pageId:
          $ref: "#/components/schemas/PageId"
        fullPage:
          type: boolean
        clip:
          $ref: "#/components/schemas/PageClip"
        type:
          $ref: "#/components/schemas/ScreenshotType"
        quality:
          type: integer
          minimum: 0
          maximum: 100
        scale:
          $ref: "#/components/schemas/ScreenshotScale"
        animations:
          $ref: "#/components/schemas/ScreenshotAnimations"
        caret:
          $ref: "#/components/schemas/ScreenshotCaret"
        style:
          type: string
        omitBackground:
          type: boolean
        timeout:
          type: integer
          minimum: 0
          maximum: 9007199254740991
      additionalProperties: false
    # Parameters for the `snapshot` method: optional `pageId` and optional boolean `includeIframes`.
    PageSnapshotParams:
      type: object
      properties:
        pageId:
          $ref: "#/components/schemas/PageId"
        includeIframes:
          type: boolean
      additionalProperties: false
    # Parameters for the `frames` method: only an optional `pageId`.
    PageFramesParams:
      type: object
      properties:
        pageId:
          $ref: "#/components/schemas/PageId"
      additionalProperties: false
    # Parameters for the `setViewportSize` method. `width` and `height` are required and
    # must be > 0; `deviceScaleFactor` is optional and must be > 0.
    # NOTE(review): width/height are `number` here (fractional values validate), while
    # PageClip declares its width/height as `integer` — confirm the difference is intended.
    PageSetViewportSizeParams:
      type: object
      properties:
        pageId:
          $ref: "#/components/schemas/PageId"
        width:
          type: number
          exclusiveMinimum: 0
        height:
          type: number
          exclusiveMinimum: 0
        deviceScaleFactor:
          type: number
          exclusiveMinimum: 0
      required:
        - width
        - height
      additionalProperties: false
    # Parameters for the `setExtraHTTPHeaders` method: required `headers` (string-to-string map), optional `pageId`.
    PageSetExtraHTTPHeadersParams:
      type: object
      properties:
        pageId:
          $ref: "#/components/schemas/PageId"
        headers:
          $ref: "#/components/schemas/PageHeaders"
      required:
        - headers
      additionalProperties: false
    # Parameters for the `waitForLoadState` method: required `state` (LoadState),
    # optional `pageId` and `timeoutMs` (integer >= 0).
    PageWaitForLoadStateParams:
      type: object
      properties:
        pageId:
          $ref: "#/components/schemas/PageId"
        state:
          $ref: "#/components/schemas/LoadState"
        timeoutMs:
          type: integer
          minimum: 0
          maximum: 9007199254740991
      required:
        - state
      additionalProperties: false
    # Parameters for the `waitForMainLoadState` method; same shape as PageWaitForLoadStateParams.
    PageWaitForMainLoadStateParams:
      type: object
      properties:
        pageId:
          $ref: "#/components/schemas/PageId"
        state:
          $ref: "#/components/schemas/LoadState"
        timeoutMs:
          type: integer
          minimum: 0
          maximum: 9007199254740991
      required:
        - state
      additionalProperties: false
    # Parameters for the `waitForSelector` method. `selector` (xpath/css/text only) is
    # required; `state`, `timeout` (integer >= 0) and `pierceShadow` are optional.
    # NOTE(review): the field is `timeout`, not `timeoutMs` as in the load-state params;
    # the unit is not stated in this schema — confirm.
    PageWaitForSelectorParams:
      type: object
      properties:
        pageId:
          $ref: "#/components/schemas/PageId"
        selector:
          $ref: "#/components/schemas/ElementSelector"
        state:
          $ref: "#/components/schemas/WaitForSelectorState"
        timeout:
          type: integer
          minimum: 0
          maximum: 9007199254740991
        pierceShadow:
          type: boolean
      required:
        - selector
      additionalProperties: false
    # Parameters for the `waitForTimeout` method: required `ms` (integer >= 0), optional `pageId`.
    PageWaitForTimeoutParams:
      type: object
      properties:
        pageId:
          $ref: "#/components/schemas/PageId"
        ms:
          type: integer
          minimum: 0
          maximum: 9007199254740991
      required:
        - ms
      additionalProperties: false
    # Parameters for the `evaluate` method: required non-empty `expression`, optional `pageId` and `arg`.
    PageEvaluateParams:
      type: object
      properties:
        pageId:
          $ref: "#/components/schemas/PageId"
        expression:
          type: string
          minLength: 1
        # Empty schema: any JSON value is accepted.
        arg: {}
      required:
        - expression
      additionalProperties: false
    # Parameters for the `sendCDP` method: required non-empty `method`, optional `pageId` and `params`.
    PageSendCDPParams:
      type: object
      properties:
        pageId:
          $ref: "#/components/schemas/PageId"
        method:
          type: string
          minLength: 1
        # Empty schema: any JSON value is accepted.
        params: {}
      required:
        - method
      additionalProperties: false
    # Parameters for the `close` method: only an optional `pageId`.
    PageCloseParams:
      type: object
      properties:
        pageId:
          $ref: "#/components/schemas/PageId"
      additionalProperties: false
    # Request envelope for `click`: optional `id`, required `sessionId` and `params`
    # (PageClickParams). No other properties are allowed.
    PageClickRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        params:
          $ref: "#/components/schemas/PageClickParams"
      required:
        - sessionId
        - params
      additionalProperties: false
    # Request envelope for `hover`: optional `id`, required `sessionId` and `params` (PageHoverParams).
    PageHoverRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        params:
          $ref: "#/components/schemas/PageHoverParams"
      required:
        - sessionId
        - params
      additionalProperties: false
    # Request envelope for `scroll`: optional `id`, required `sessionId` and `params`
    # (PageScrollParams, i.e. either the element or the coordinate form).
    PageScrollRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        params:
          $ref: "#/components/schemas/PageScrollParams"
      required:
        - sessionId
        - params
      additionalProperties: false
    # Request envelope for `dragAndDrop`: optional `id`, required `sessionId` and `params` (PageDragAndDropParams).
    PageDragAndDropRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        params:
          $ref: "#/components/schemas/PageDragAndDropParams"
      required:
        - sessionId
        - params
      additionalProperties: false
    # Request envelope for `type`: optional `id`, required `sessionId` and `params` (PageTypeParams).
    PageTypeRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        params:
          $ref: "#/components/schemas/PageTypeParams"
      required:
        - sessionId
        - params
      additionalProperties: false
    # Request envelope for `keyPress`: optional `id`, required `sessionId` and `params` (PageKeyPressParams).
    PageKeyPressRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        params:
          $ref: "#/components/schemas/PageKeyPressParams"
      required:
        - sessionId
        - params
      additionalProperties: false
    # Request envelope for `enableCursorOverlay`. `params` is required even though
    # PageEnableCursorOverlayParams has no required fields, so `params: {}` is the minimal value.
    PageEnableCursorOverlayRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        params:
          $ref: "#/components/schemas/PageEnableCursorOverlayParams"
      required:
        - sessionId
        - params
      additionalProperties: false
    # Request envelope for `addInitScript`: optional `id`, required `sessionId` and `params` (PageAddInitScriptParams).
    PageAddInitScriptRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        params:
          $ref: "#/components/schemas/PageAddInitScriptParams"
      required:
        - sessionId
        - params
      additionalProperties: false
    # Request envelope for `goto`: optional `id`, required `sessionId` and `params` (PageGotoParams).
    PageGotoRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        params:
          $ref: "#/components/schemas/PageGotoParams"
      required:
        - sessionId
        - params
      additionalProperties: false
    # Request envelope for `reload`: optional `id`, required `sessionId` and `params`
    # (PageReloadParams, which itself has no required fields).
    PageReloadRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        params:
          $ref: "#/components/schemas/PageReloadParams"
      required:
        - sessionId
        - params
      additionalProperties: false
    # Request envelope for `goBack`: optional `id`, required `sessionId` and `params` (PageGoBackParams).
    PageGoBackRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        params:
          $ref: "#/components/schemas/PageGoBackParams"
      required:
        - sessionId
        - params
      additionalProperties: false
    # Request envelope for `goForward`: optional `id`, required `sessionId` and `params` (PageGoForwardParams).
    PageGoForwardRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        params:
          $ref: "#/components/schemas/PageGoForwardParams"
      required:
        - sessionId
        - params
      additionalProperties: false
    # Request envelope for `screenshot`: optional `id`, required `sessionId` and `params` (PageScreenshotParams).
    PageScreenshotRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        params:
          $ref: "#/components/schemas/PageScreenshotParams"
      required:
        - sessionId
        - params
      additionalProperties: false
    # Request envelope for `snapshot`: optional `id`, required `sessionId` and `params` (PageSnapshotParams).
    PageSnapshotRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        params:
          $ref: "#/components/schemas/PageSnapshotParams"
      required:
        - sessionId
        - params
      additionalProperties: false
    # Request envelope for `setViewportSize`: optional `id`, required `sessionId` and `params` (PageSetViewportSizeParams).
    PageSetViewportSizeRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        params:
          $ref: "#/components/schemas/PageSetViewportSizeParams"
      required:
        - sessionId
        - params
      additionalProperties: false
    # Request envelope for `setExtraHTTPHeaders`: optional `id`, required `sessionId` and `params` (PageSetExtraHTTPHeadersParams).
    PageSetExtraHTTPHeadersRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        params:
          $ref: "#/components/schemas/PageSetExtraHTTPHeadersParams"
      required:
        - sessionId
        - params
      additionalProperties: false
    # Request envelope for `waitForLoadState`: optional `id`, required `sessionId` and `params` (PageWaitForLoadStateParams).
    PageWaitForLoadStateRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        params:
          $ref: "#/components/schemas/PageWaitForLoadStateParams"
      required:
        - sessionId
        - params
      additionalProperties: false
    # Request envelope for `waitForMainLoadState`: optional `id`, required `sessionId` and `params` (PageWaitForMainLoadStateParams).
    PageWaitForMainLoadStateRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        params:
          $ref: "#/components/schemas/PageWaitForMainLoadStateParams"
      required:
        - sessionId
        - params
      additionalProperties: false
    # Request envelope for `waitForSelector`: optional `id`, required `sessionId` and `params` (PageWaitForSelectorParams).
    PageWaitForSelectorRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        params:
          $ref: "#/components/schemas/PageWaitForSelectorParams"
      required:
        - sessionId
        - params
      additionalProperties: false
    # Request envelope for `waitForTimeout`: optional `id`, required `sessionId` and `params` (PageWaitForTimeoutParams).
    PageWaitForTimeoutRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        params:
          $ref: "#/components/schemas/PageWaitForTimeoutParams"
      required:
        - sessionId
        - params
      additionalProperties: false
    # Request envelope for `evaluate`: optional `id`, required `sessionId` and `params` (PageEvaluateParams).
    PageEvaluateRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        params:
          $ref: "#/components/schemas/PageEvaluateParams"
      required:
        - sessionId
        - params
      additionalProperties: false
    # Request envelope for `sendCDP`: optional `id`, required `sessionId` and `params` (PageSendCDPParams).
    PageSendCDPRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        params:
          $ref: "#/components/schemas/PageSendCDPParams"
      required:
        - sessionId
        - params
      additionalProperties: false
    # Request envelope for `close`: optional `id`, required `sessionId` and `params`
    # (PageCloseParams, which itself has no required fields).
    PageCloseRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        params:
          $ref: "#/components/schemas/PageCloseParams"
      required:
        - sessionId
        - params
      additionalProperties: false
    # Action record for the `click` method (`method` is pinned by `const`).
    # `error` and `result` are required keys but nullable; `pageId` and `completedAt`
    # are optional. `params` uses PageClickParams; a non-null `result` is a PageXPathResult.
    PageClickAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: click
        status:
          $ref: "#/components/schemas/PageActionStatus"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - $ref: "#/components/schemas/PageError"
            - type: "null"
        params:
          $ref: "#/components/schemas/PageClickParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/PageXPathResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Action record for the `hover` method (`method` is pinned by `const`).
    # `error` and `result` are required keys but nullable; `pageId` and `completedAt`
    # are optional. `params` uses PageHoverParams; a non-null `result` is a PageXPathResult.
    PageHoverAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: hover
        status:
          $ref: "#/components/schemas/PageActionStatus"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - $ref: "#/components/schemas/PageError"
            - type: "null"
        params:
          $ref: "#/components/schemas/PageHoverParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/PageXPathResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Action record for the `scroll` method (`method` is pinned by `const`).
    # `error` and `result` are required keys but nullable; `pageId` and `completedAt`
    # are optional. `params` uses PageScrollParams; a non-null `result` is a PageXPathResult.
    PageScrollAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: scroll
        status:
          $ref: "#/components/schemas/PageActionStatus"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - $ref: "#/components/schemas/PageError"
            - type: "null"
        params:
          $ref: "#/components/schemas/PageScrollParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/PageXPathResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Action record for the `dragAndDrop` method (`method` is pinned by `const`).
    # `error` and `result` are required keys but nullable; `pageId` and `completedAt`
    # are optional. `params` uses PageDragAndDropParams; a non-null `result` is a PageDragAndDropResult.
    PageDragAndDropAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: dragAndDrop
        status:
          $ref: "#/components/schemas/PageActionStatus"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - $ref: "#/components/schemas/PageError"
            - type: "null"
        params:
          $ref: "#/components/schemas/PageDragAndDropParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/PageDragAndDropResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Action record for the `type` method (`method` is pinned by `const`).
    # `error` and `result` are required keys but nullable; `pageId` and `completedAt`
    # are optional. `params` uses PageTypeParams; a non-null `result` is a PageTypeResult.
    PageTypeAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: type
        status:
          $ref: "#/components/schemas/PageActionStatus"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - $ref: "#/components/schemas/PageError"
            - type: "null"
        params:
          $ref: "#/components/schemas/PageTypeParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/PageTypeResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Action record for the `keyPress` method (`method` is pinned by `const`).
    # `error` and `result` are required keys but nullable; `pageId` and `completedAt`
    # are optional. `params` uses PageKeyPressParams; a non-null `result` is a PageKeyPressResult.
    PageKeyPressAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: keyPress
        status:
          $ref: "#/components/schemas/PageActionStatus"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - $ref: "#/components/schemas/PageError"
            - type: "null"
        params:
          $ref: "#/components/schemas/PageKeyPressParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/PageKeyPressResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Action record for the `enableCursorOverlay` method (`method` is pinned by `const`).
    # `error` and `result` are required keys but nullable; `pageId` and `completedAt`
    # are optional. `params` uses PageEnableCursorOverlayParams; a non-null `result`
    # is a PageEnableCursorOverlayResult.
    PageEnableCursorOverlayAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: enableCursorOverlay
        status:
          $ref: "#/components/schemas/PageActionStatus"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - $ref: "#/components/schemas/PageError"
            - type: "null"
        params:
          $ref: "#/components/schemas/PageEnableCursorOverlayParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/PageEnableCursorOverlayResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Action record for the `addInitScript` method (`method` is pinned by `const`).
    # `error` and `result` are required keys but nullable; `pageId` and `completedAt`
    # are optional. `params` uses PageAddInitScriptParams; a non-null `result` is a PageAddInitScriptResult.
    PageAddInitScriptAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: addInitScript
        status:
          $ref: "#/components/schemas/PageActionStatus"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - $ref: "#/components/schemas/PageError"
            - type: "null"
        params:
          $ref: "#/components/schemas/PageAddInitScriptParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/PageAddInitScriptResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Action record for the `goto` method (`method` is pinned by `const`).
    # `error` and `result` are required keys but nullable; `pageId` and `completedAt`
    # are optional. `params` uses PageGotoParams; a non-null `result` is a PageNavigationResult.
    PageGotoAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: goto
        status:
          $ref: "#/components/schemas/PageActionStatus"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - $ref: "#/components/schemas/PageError"
            - type: "null"
        params:
          $ref: "#/components/schemas/PageGotoParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/PageNavigationResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Page action record whose `method` is fixed to `reload`.
    # The result, when present, is a PageNavigationResult.
    # `error` and `result` are required but nullable; `pageId` and
    # `completedAt` are the only properties not listed under `required`.
    PageReloadAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: reload
        status:
          $ref: "#/components/schemas/PageActionStatus"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - $ref: "#/components/schemas/PageError"
            - type: "null"
        params:
          $ref: "#/components/schemas/PageReloadParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/PageNavigationResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Page action record whose `method` is fixed to `goBack`.
    # The result, when present, is a PageNavigationResult.
    # `error` and `result` are required but nullable; `pageId` and
    # `completedAt` are the only properties not listed under `required`.
    PageGoBackAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: goBack
        status:
          $ref: "#/components/schemas/PageActionStatus"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - $ref: "#/components/schemas/PageError"
            - type: "null"
        params:
          $ref: "#/components/schemas/PageGoBackParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/PageNavigationResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Page action record whose `method` is fixed to `goForward`.
    # The result, when present, is a PageNavigationResult.
    # `error` and `result` are required but nullable; `pageId` and
    # `completedAt` are the only properties not listed under `required`.
    PageGoForwardAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: goForward
        status:
          $ref: "#/components/schemas/PageActionStatus"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - $ref: "#/components/schemas/PageError"
            - type: "null"
        params:
          $ref: "#/components/schemas/PageGoForwardParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/PageNavigationResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Page action record whose `method` is fixed to `targetId`.
    # `error` and `result` are required but nullable; `pageId` and
    # `completedAt` are the only properties not listed under `required`.
    PageTargetIdAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: targetId
        status:
          $ref: "#/components/schemas/PageActionStatus"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - $ref: "#/components/schemas/PageError"
            - type: "null"
        params:
          $ref: "#/components/schemas/PageTargetIdParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/PageTargetIdResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Page action record whose `method` is fixed to `mainFrameId`.
    # `error` and `result` are required but nullable; `pageId` and
    # `completedAt` are the only properties not listed under `required`.
    PageMainFrameIdAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: mainFrameId
        status:
          $ref: "#/components/schemas/PageActionStatus"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - $ref: "#/components/schemas/PageError"
            - type: "null"
        params:
          $ref: "#/components/schemas/PageMainFrameIdParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/PageMainFrameIdResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Page action record whose `method` is fixed to `mainFrame`.
    # `error` and `result` are required but nullable; `pageId` and
    # `completedAt` are the only properties not listed under `required`.
    PageMainFrameAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: mainFrame
        status:
          $ref: "#/components/schemas/PageActionStatus"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - $ref: "#/components/schemas/PageError"
            - type: "null"
        params:
          $ref: "#/components/schemas/PageMainFrameParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/PageMainFrameResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Page action record whose `method` is fixed to `getFullFrameTree`.
    # The result, when present, is a PageFrameTreeResult.
    # `error` and `result` are required but nullable; `pageId` and
    # `completedAt` are the only properties not listed under `required`.
    PageGetFullFrameTreeAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: getFullFrameTree
        status:
          $ref: "#/components/schemas/PageActionStatus"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - $ref: "#/components/schemas/PageError"
            - type: "null"
        params:
          $ref: "#/components/schemas/PageGetFullFrameTreeParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/PageFrameTreeResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Page action record whose `method` is fixed to `asProtocolFrameTree`.
    # The result, when present, is a PageFrameTreeResult.
    # `error` and `result` are required but nullable; `pageId` and
    # `completedAt` are the only properties not listed under `required`.
    PageAsProtocolFrameTreeAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: asProtocolFrameTree
        status:
          $ref: "#/components/schemas/PageActionStatus"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - $ref: "#/components/schemas/PageError"
            - type: "null"
        params:
          $ref: "#/components/schemas/PageAsProtocolFrameTreeParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/PageFrameTreeResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Page action record whose `method` is fixed to `listAllFrameIds`.
    # `error` and `result` are required but nullable; `pageId` and
    # `completedAt` are the only properties not listed under `required`.
    PageListAllFrameIdsAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: listAllFrameIds
        status:
          $ref: "#/components/schemas/PageActionStatus"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - $ref: "#/components/schemas/PageError"
            - type: "null"
        params:
          $ref: "#/components/schemas/PageListAllFrameIdsParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/PageListAllFrameIdsResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Page action record whose `method` is fixed to `getOrdinal`.
    # `error` and `result` are required but nullable; `pageId` and
    # `completedAt` are the only properties not listed under `required`.
    PageGetOrdinalAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: getOrdinal
        status:
          $ref: "#/components/schemas/PageActionStatus"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - $ref: "#/components/schemas/PageError"
            - type: "null"
        params:
          $ref: "#/components/schemas/PageGetOrdinalParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/PageGetOrdinalResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Page action record whose `method` is fixed to `title`.
    # `error` and `result` are required but nullable; `pageId` and
    # `completedAt` are the only properties not listed under `required`.
    PageTitleAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: title
        status:
          $ref: "#/components/schemas/PageActionStatus"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - $ref: "#/components/schemas/PageError"
            - type: "null"
        params:
          $ref: "#/components/schemas/PageTitleParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/PageTitleResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Page action record whose `method` is fixed to `url`.
    # `error` and `result` are required but nullable; `pageId` and
    # `completedAt` are the only properties not listed under `required`.
    PageUrlAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: url
        status:
          $ref: "#/components/schemas/PageActionStatus"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - $ref: "#/components/schemas/PageError"
            - type: "null"
        params:
          $ref: "#/components/schemas/PageUrlParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/PageUrlResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Page action record whose `method` is fixed to `screenshot`.
    # `error` and `result` are required but nullable; `pageId` and
    # `completedAt` are the only properties not listed under `required`.
    PageScreenshotAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: screenshot
        status:
          $ref: "#/components/schemas/PageActionStatus"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - $ref: "#/components/schemas/PageError"
            - type: "null"
        params:
          $ref: "#/components/schemas/PageScreenshotParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/PageScreenshotResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Page action record whose `method` is fixed to `snapshot`.
    # `error` and `result` are required but nullable; `pageId` and
    # `completedAt` are the only properties not listed under `required`.
    PageSnapshotAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: snapshot
        status:
          $ref: "#/components/schemas/PageActionStatus"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - $ref: "#/components/schemas/PageError"
            - type: "null"
        params:
          $ref: "#/components/schemas/PageSnapshotParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/PageSnapshotResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Page action record whose `method` is fixed to `frames`.
    # `error` and `result` are required but nullable; `pageId` and
    # `completedAt` are the only properties not listed under `required`.
    PageFramesAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: frames
        status:
          $ref: "#/components/schemas/PageActionStatus"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - $ref: "#/components/schemas/PageError"
            - type: "null"
        params:
          $ref: "#/components/schemas/PageFramesParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/PageFramesResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Page action record whose `method` is fixed to `setViewportSize`.
    # `error` and `result` are required but nullable; `pageId` and
    # `completedAt` are the only properties not listed under `required`.
    PageSetViewportSizeAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: setViewportSize
        status:
          $ref: "#/components/schemas/PageActionStatus"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - $ref: "#/components/schemas/PageError"
            - type: "null"
        params:
          $ref: "#/components/schemas/PageSetViewportSizeParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/PageSetViewportSizeResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Page action record whose `method` is fixed to `setExtraHTTPHeaders`.
    # `error` and `result` are required but nullable; `pageId` and
    # `completedAt` are the only properties not listed under `required`.
    PageSetExtraHTTPHeadersAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: setExtraHTTPHeaders
        status:
          $ref: "#/components/schemas/PageActionStatus"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - $ref: "#/components/schemas/PageError"
            - type: "null"
        params:
          $ref: "#/components/schemas/PageSetExtraHTTPHeadersParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/PageSetExtraHTTPHeadersResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Page action record whose `method` is fixed to `waitForLoadState`.
    # `error` and `result` are required but nullable; `pageId` and
    # `completedAt` are the only properties not listed under `required`.
    PageWaitForLoadStateAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: waitForLoadState
        status:
          $ref: "#/components/schemas/PageActionStatus"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - $ref: "#/components/schemas/PageError"
            - type: "null"
        params:
          $ref: "#/components/schemas/PageWaitForLoadStateParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/PageWaitForLoadStateResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Page action record whose `method` is fixed to `waitForMainLoadState`.
    # It has its own params schema, but its result reuses
    # PageWaitForLoadStateResult rather than a dedicated result schema.
    # `error` and `result` are required but nullable; `pageId` and
    # `completedAt` are the only properties not listed under `required`.
    PageWaitForMainLoadStateAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: waitForMainLoadState
        status:
          $ref: "#/components/schemas/PageActionStatus"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - $ref: "#/components/schemas/PageError"
            - type: "null"
        params:
          $ref: "#/components/schemas/PageWaitForMainLoadStateParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/PageWaitForLoadStateResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Page action record whose `method` is fixed to `waitForSelector`.
    # `error` and `result` are required but nullable; `pageId` and
    # `completedAt` are the only properties not listed under `required`.
    PageWaitForSelectorAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: waitForSelector
        status:
          $ref: "#/components/schemas/PageActionStatus"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - $ref: "#/components/schemas/PageError"
            - type: "null"
        params:
          $ref: "#/components/schemas/PageWaitForSelectorParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/PageWaitForSelectorResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Page action record whose `method` is fixed to `waitForTimeout`.
    # `error` and `result` are required but nullable; `pageId` and
    # `completedAt` are the only properties not listed under `required`.
    PageWaitForTimeoutAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: waitForTimeout
        status:
          $ref: "#/components/schemas/PageActionStatus"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - $ref: "#/components/schemas/PageError"
            - type: "null"
        params:
          $ref: "#/components/schemas/PageWaitForTimeoutParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/PageWaitForTimeoutResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Page action record whose `method` is fixed to `evaluate`.
    # `error` and `result` are required but nullable; `pageId` and
    # `completedAt` are the only properties not listed under `required`.
    PageEvaluateAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: evaluate
        status:
          $ref: "#/components/schemas/PageActionStatus"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - $ref: "#/components/schemas/PageError"
            - type: "null"
        params:
          $ref: "#/components/schemas/PageEvaluateParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/PageEvaluateResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Page action record whose `method` is fixed to `sendCDP`.
    # `error` and `result` are required but nullable; `pageId` and
    # `completedAt` are the only properties not listed under `required`.
    PageSendCDPAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: sendCDP
        status:
          $ref: "#/components/schemas/PageActionStatus"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - $ref: "#/components/schemas/PageError"
            - type: "null"
        params:
          $ref: "#/components/schemas/PageSendCDPParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/PageSendCDPResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Page action record whose `method` is fixed to `close`.
    # `error` and `result` are required but nullable; `pageId` and
    # `completedAt` are the only properties not listed under `required`.
    PageCloseAction:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          type: string
          const: close
        status:
          $ref: "#/components/schemas/PageActionStatus"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        error:
          anyOf:
            - $ref: "#/components/schemas/PageError"
            - type: "null"
        params:
          $ref: "#/components/schemas/PageCloseParams"
        result:
          anyOf:
            - $ref: "#/components/schemas/PageCloseResult"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
        - params
        - result
      additionalProperties: false
    # Any page action: a value is valid if it matches at least one of the
    # per-method action schemas listed below (33 variants).
    # NOTE(review): no `discriminator` is declared; the variants visible in
    # this file pin `method` to a distinct constant, which is presumably what
    # consumers use to tell them apart — confirm before relying on it.
    PageAction:
      anyOf:
        - $ref: "#/components/schemas/PageClickAction"
        - $ref: "#/components/schemas/PageHoverAction"
        - $ref: "#/components/schemas/PageScrollAction"
        - $ref: "#/components/schemas/PageDragAndDropAction"
        - $ref: "#/components/schemas/PageTypeAction"
        - $ref: "#/components/schemas/PageKeyPressAction"
        - $ref: "#/components/schemas/PageEnableCursorOverlayAction"
        - $ref: "#/components/schemas/PageAddInitScriptAction"
        - $ref: "#/components/schemas/PageGotoAction"
        - $ref: "#/components/schemas/PageReloadAction"
        - $ref: "#/components/schemas/PageGoBackAction"
        - $ref: "#/components/schemas/PageGoForwardAction"
        - $ref: "#/components/schemas/PageTargetIdAction"
        - $ref: "#/components/schemas/PageMainFrameIdAction"
        - $ref: "#/components/schemas/PageMainFrameAction"
        - $ref: "#/components/schemas/PageGetFullFrameTreeAction"
        - $ref: "#/components/schemas/PageAsProtocolFrameTreeAction"
        - $ref: "#/components/schemas/PageListAllFrameIdsAction"
        - $ref: "#/components/schemas/PageGetOrdinalAction"
        - $ref: "#/components/schemas/PageTitleAction"
        - $ref: "#/components/schemas/PageUrlAction"
        - $ref: "#/components/schemas/PageScreenshotAction"
        - $ref: "#/components/schemas/PageSnapshotAction"
        - $ref: "#/components/schemas/PageFramesAction"
        - $ref: "#/components/schemas/PageSetViewportSizeAction"
        - $ref: "#/components/schemas/PageSetExtraHTTPHeadersAction"
        - $ref: "#/components/schemas/PageWaitForLoadStateAction"
        - $ref: "#/components/schemas/PageWaitForMainLoadStateAction"
        - $ref: "#/components/schemas/PageWaitForSelectorAction"
        - $ref: "#/components/schemas/PageWaitForTimeoutAction"
        - $ref: "#/components/schemas/PageEvaluateAction"
        - $ref: "#/components/schemas/PageSendCDPAction"
        - $ref: "#/components/schemas/PageCloseAction"
    # Success envelope: `success` is always `true` and the payload is carried
    # in `data` as a BrowserSessionResultOutput. Both fields are required and
    # no other properties are allowed.
    BrowserSessionResponse:
      type: object
      properties:
        success:
          type: boolean
          const: true
        data:
          $ref: "#/components/schemas/BrowserSessionResultOutput"
      required:
        - success
        - data
      additionalProperties: false
    # Error envelope: `success` is always `false` and the failure is described
    # by a free-form `message` string. Both fields are required and no other
    # properties are allowed.
    BrowserSessionErrorResponse:
      type: object
      properties:
        success:
          type: boolean
          const: false
        message:
          type: string
      required:
        - success
        - message
      additionalProperties: false
    # Error envelope with `success` fixed to `false`, an `error` string, an
    # integer `statusCode`, and a `stack` that must be present but may be null.
    # `action` (a BrowserSessionAction) is the only optional property.
    BrowserSessionV4ErrorResponse:
      type: object
      properties:
        success:
          type: boolean
          const: false
        error:
          type: string
        statusCode:
          type: integer
          # Bounds are -(2^53 - 1) and 2^53 - 1.
          minimum: -9007199254740991
          maximum: 9007199254740991
        stack:
          anyOf:
            - type: string
            - type: "null"
        action:
          $ref: "#/components/schemas/BrowserSessionAction"
      required:
        - success
        - error
        - statusCode
        - stack
      additionalProperties: false
    # Success envelope: `success` is always `true`, `error` is always null,
    # and `action` holds a BrowserSessionAddInitScriptAction. All three
    # fields are required and no other properties are allowed.
    BrowserSessionAddInitScriptResponse:
      type: object
      properties:
        success:
          type: boolean
          const: true
        error:
          type: "null"
        action:
          $ref: "#/components/schemas/BrowserSessionAddInitScriptAction"
      required:
        - success
        - error
        - action
      additionalProperties: false
    # Success envelope: `success` is always `true`, `error` is always null,
    # and `action` holds a BrowserSessionSetExtraHTTPHeadersAction. All three
    # fields are required and no other properties are allowed.
    BrowserSessionSetExtraHTTPHeadersResponse:
      type: object
      properties:
        success:
          type: boolean
          const: true
        error:
          type: "null"
        action:
          $ref: "#/components/schemas/BrowserSessionSetExtraHTTPHeadersAction"
      required:
        - success
        - error
        - action
      additionalProperties: false
    # Success envelope: `success` is always `true`, `error` is always null,
    # and `action` holds a BrowserSessionPagesAction. All three fields are
    # required and no other properties are allowed.
    BrowserSessionPagesResponse:
      type: object
      properties:
        success:
          type: boolean
          const: true
        error:
          type: "null"
        action:
          $ref: "#/components/schemas/BrowserSessionPagesAction"
      required:
        - success
        - error
        - action
      additionalProperties: false
    # Success envelope: `success` is always `true`, `error` is always null,
    # and `action` holds a BrowserSessionActivePageAction. All three fields
    # are required and no other properties are allowed.
    BrowserSessionActivePageResponse:
      type: object
      properties:
        success:
          type: boolean
          const: true
        error:
          type: "null"
        action:
          $ref: "#/components/schemas/BrowserSessionActivePageAction"
      required:
        - success
        - error
        - action
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a BrowserSessionAwaitActivePageAction.
    BrowserSessionAwaitActivePageResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/BrowserSessionAwaitActivePageAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a BrowserSessionResolvePageByMainFrameIdAction.
    BrowserSessionResolvePageByMainFrameIdResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/BrowserSessionResolvePageByMainFrameIdAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a BrowserSessionGetFullFrameTreeByMainFrameIdAction.
    BrowserSessionGetFullFrameTreeByMainFrameIdResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/BrowserSessionGetFullFrameTreeByMainFrameIdAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a BrowserSessionNewPageAction.
    BrowserSessionNewPageResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/BrowserSessionNewPageAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a BrowserSessionCookiesAction.
    BrowserSessionCookiesResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/BrowserSessionCookiesAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a BrowserSessionAddCookiesAction.
    BrowserSessionAddCookiesResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/BrowserSessionAddCookiesAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a BrowserSessionClearCookiesAction.
    BrowserSessionClearCookiesResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/BrowserSessionClearCookiesAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a BrowserSessionConnectURLAction.
    BrowserSessionConnectURLResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/BrowserSessionConnectURLAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a BrowserSessionConfiguredViewportAction.
    BrowserSessionConfiguredViewportResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/BrowserSessionConfiguredViewportAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a BrowserSessionBrowserbaseSessionIDAction.
    BrowserSessionBrowserbaseSessionIDResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/BrowserSessionBrowserbaseSessionIDAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a BrowserSessionBrowserbaseSessionURLAction.
    BrowserSessionBrowserbaseSessionURLResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/BrowserSessionBrowserbaseSessionURLAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a BrowserSessionBrowserbaseDebugURLAction.
    BrowserSessionBrowserbaseDebugURLResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/BrowserSessionBrowserbaseDebugURLAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a single BrowserSessionAction.
    BrowserSessionActionDetailsResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/BrowserSessionAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope for a listing: `success` is always true, `error` is always null,
    # and `actions` is an array of BrowserSessionAction items.
    BrowserSessionActionListResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        actions:
          type: array
          items: { $ref: "#/components/schemas/BrowserSessionAction" }
      required: [success, error, actions]
      additionalProperties: false
    # Failure envelope: `success` is pinned to false and `error` is a PageError.
    # `stack` must be present but may be null; the PageAction in `action` is optional.
    V4ErrorResponse:
      type: object
      properties:
        success: { type: boolean, const: false }
        error: { $ref: "#/components/schemas/PageError" }
        statusCode:
          # Bounds are +/-(2^53 - 1).
          type: integer
          minimum: -9007199254740991
          maximum: 9007199254740991
        stack:
          anyOf: [{ type: string }, { type: "null" }]
        action: { $ref: "#/components/schemas/PageAction" }
      required: [success, error, statusCode, stack]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a PageClickAction.
    PageClickResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/PageClickAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a PageHoverAction.
    PageHoverResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/PageHoverAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a PageScrollAction.
    PageScrollResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/PageScrollAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a PageDragAndDropAction.
    PageDragAndDropResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/PageDragAndDropAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a PageTypeAction.
    PageTypeResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/PageTypeAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a PageKeyPressAction.
    PageKeyPressResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/PageKeyPressAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a PageEnableCursorOverlayAction.
    PageEnableCursorOverlayResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/PageEnableCursorOverlayAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a PageAddInitScriptAction.
    PageAddInitScriptResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/PageAddInitScriptAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a PageGotoAction.
    PageGotoResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/PageGotoAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a PageReloadAction.
    PageReloadResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/PageReloadAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a PageGoBackAction.
    PageGoBackResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/PageGoBackAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a PageGoForwardAction.
    PageGoForwardResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/PageGoForwardAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a PageTargetIdAction.
    PageTargetIdResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/PageTargetIdAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a PageMainFrameIdAction.
    PageMainFrameIdResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/PageMainFrameIdAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a PageMainFrameAction.
    PageMainFrameResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/PageMainFrameAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a PageGetFullFrameTreeAction.
    PageGetFullFrameTreeResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/PageGetFullFrameTreeAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a PageAsProtocolFrameTreeAction.
    PageAsProtocolFrameTreeResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/PageAsProtocolFrameTreeAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a PageListAllFrameIdsAction.
    PageListAllFrameIdsResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/PageListAllFrameIdsAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a PageGetOrdinalAction.
    PageGetOrdinalResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/PageGetOrdinalAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a PageTitleAction.
    PageTitleResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/PageTitleAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a PageUrlAction.
    PageUrlResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/PageUrlAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a PageScreenshotAction.
    PageScreenshotResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/PageScreenshotAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a PageSnapshotAction.
    PageSnapshotResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/PageSnapshotAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a PageFramesAction.
    PageFramesResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/PageFramesAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a PageSetViewportSizeAction.
    PageSetViewportSizeResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/PageSetViewportSizeAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a PageSetExtraHTTPHeadersAction.
    PageSetExtraHTTPHeadersResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/PageSetExtraHTTPHeadersAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a PageWaitForLoadStateAction.
    PageWaitForLoadStateResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/PageWaitForLoadStateAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a PageWaitForMainLoadStateAction.
    PageWaitForMainLoadStateResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/PageWaitForMainLoadStateAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a PageWaitForSelectorAction.
    PageWaitForSelectorResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/PageWaitForSelectorAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a PageWaitForTimeoutAction.
    PageWaitForTimeoutResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/PageWaitForTimeoutAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a PageEvaluateAction.
    PageEvaluateResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/PageEvaluateAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a PageSendCDPAction.
    PageSendCDPResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/PageSendCDPAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a PageCloseAction.
    PageCloseResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/PageCloseAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a single PageAction.
    PageActionDetailsResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/PageAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope for a listing: `success` is always true, `error` is always null,
    # and `actions` is an array of PageAction items.
    PageActionListResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        actions:
          type: array
          items: { $ref: "#/components/schemas/PageAction" }
      required: [success, error, actions]
      additionalProperties: false
    # Browser settings object. No property is required; unknown keys are rejected.
    BrowserbaseBrowserSettingsOutput:
      type: object
      properties:
        advancedStealth: { type: boolean }
        blockAds: { type: boolean }
        context: { $ref: "#/components/schemas/BrowserbaseContextOutput" }
        extensionId: { type: string }
        fingerprint: { $ref: "#/components/schemas/BrowserbaseFingerprintOutput" }
        logSession: { type: boolean }
        recordSession: { type: boolean }
        solveCaptchas: { type: boolean }
        viewport: { $ref: "#/components/schemas/BrowserbaseViewportOutput" }
      additionalProperties: false
    # Context reference: a mandatory string `id` plus an optional boolean `persist`.
    BrowserbaseContextOutput:
      type: object
      properties:
        id: { type: string }
        persist: { type: boolean }
      required: [id]
      additionalProperties: false
    # Fingerprint settings. Every property is optional; list-valued properties
    # other than `locales` are restricted to the enumerated strings shown.
    BrowserbaseFingerprintOutput:
      type: object
      properties:
        browsers:
          type: array
          items: { type: string, enum: [chrome, edge, firefox, safari] }
        devices:
          type: array
          items: { type: string, enum: [desktop, mobile] }
        # Note: the allowed values are the strings "1" and "2", not numbers.
        httpVersion: { type: string, enum: ["1", "2"] }
        locales:
          type: array
          items: { type: string }
        operatingSystems:
          type: array
          items: { type: string, enum: [android, ios, linux, macos, windows] }
        screen: { $ref: "#/components/schemas/BrowserbaseFingerprintScreenOutput" }
      additionalProperties: false
    # Four optional numeric screen bounds; unknown keys are rejected.
    BrowserbaseFingerprintScreenOutput:
      type: object
      properties:
        maxHeight: { type: number }
        maxWidth: { type: number }
        minHeight: { type: number }
        minWidth: { type: number }
      additionalProperties: false
    # Viewport dimensions; both `width` and `height` are optional numbers here.
    BrowserbaseViewportOutput:
      type: object
      properties:
        width: { type: number }
        height: { type: number }
      additionalProperties: false
    # Union of the two proxy variants. The `type` property is the discriminator:
    # "browserbase" and "external" map to the respective schemas below.
    ProxyConfigOutput:
      oneOf:
        - { $ref: "#/components/schemas/BrowserbaseProxyConfigOutput" }
        - { $ref: "#/components/schemas/ExternalProxyConfigOutput" }
      type: object
      discriminator:
        propertyName: type
        mapping:
          browserbase: "#/components/schemas/BrowserbaseProxyConfigOutput"
          external: "#/components/schemas/ExternalProxyConfigOutput"
    # Proxy variant whose `type` is fixed to "browserbase"; only `type` is required.
    BrowserbaseProxyConfigOutput:
      type: object
      properties:
        type: { type: string, const: browserbase }
        domainPattern: { type: string }
        geolocation: { $ref: "#/components/schemas/BrowserbaseProxyGeolocationOutput" }
      required: [type]
      additionalProperties: false
    # Geolocation strings: `country` is mandatory, `city` and `state` are optional.
    BrowserbaseProxyGeolocationOutput:
      type: object
      properties:
        country: { type: string }
        city: { type: string }
        state: { type: string }
      required: [country]
      additionalProperties: false
    # Proxy variant whose `type` is fixed to "external". `type` and `server` are
    # required; `domainPattern`, `username` and `password` are optional strings.
    ExternalProxyConfigOutput:
      type: object
      properties:
        type:
          type: string
          const: external
        server:
          type: string
        domainPattern:
          type: string
        username:
          type: string
        password:
          type: string
          # Annotation only: hints to documentation/UI tooling that the value
          # should be obscured. It does not change which strings validate.
          format: password
      required:
        - type
        - server
      additionalProperties: false
    # Header object allowing only the optional `x-stream-response` entry, whose
    # value must be the string "true" or "false".
    SessionHeadersOutput:
      type: object
      properties:
        x-stream-response:
          description: Whether to stream the response via SSE
          example: "true"
          type: string
          enum: ["true", "false"]
      additionalProperties: false
    # Session-create request variant with `env` fixed to LOCAL.
    # Only `modelName` and `env` are required.
    BrowserSessionLocalCreateRequestOutput:
      type: object
      properties:
        modelName:
          description: Model name to use for AI operations
          example: openai/gpt-4.1-nano
          type: string
        domSettleTimeoutMs: { type: number }
        verbose:
          # Accepts exactly the numbers 0, 1 or 2.
          anyOf:
            - { type: number, const: 0 }
            - { type: number, const: 1 }
            - { type: number, const: 2 }
        systemPrompt: { type: string }
        selfHeal: { type: boolean }
        waitForCaptchaSolves: { type: boolean }
        experimental: { type: boolean }
        actTimeoutMs: { type: number }
        env: { type: string, const: LOCAL }
        cdpUrl: { type: string }
        localBrowserLaunchOptions: { $ref: "#/components/schemas/LocalBrowserLaunchOptionsOutput" }
      required: [modelName, env]
      additionalProperties: false
    # Session-create request variant with `env` fixed to BROWSERBASE.
    # Only `modelName` and `env` are required.
    BrowserSessionBrowserbaseCreateRequestOutput:
      type: object
      properties:
        modelName:
          description: Model name to use for AI operations
          example: openai/gpt-4.1-nano
          type: string
        domSettleTimeoutMs: { type: number }
        verbose:
          # Accepts exactly the numbers 0, 1 or 2.
          anyOf:
            - { type: number, const: 0 }
            - { type: number, const: 1 }
            - { type: number, const: 2 }
        systemPrompt: { type: string }
        selfHeal: { type: boolean }
        waitForCaptchaSolves: { type: boolean }
        experimental: { type: boolean }
        actTimeoutMs: { type: number }
        env: { type: string, const: BROWSERBASE }
        browserbaseSessionId: { type: string }
        browserbaseSessionCreateParams: { $ref: "#/components/schemas/BrowserbaseSessionCreateParamsOutput" }
      required: [modelName, env]
      additionalProperties: false
    # Options object for a local browser. No top-level property is required and
    # unknown keys are rejected, both at the top level and inside `proxy`/`viewport`.
    LocalBrowserLaunchOptionsOutput:
      type: object
      properties:
        args:
          type: array
          items:
            type: string
        executablePath:
          type: string
        port:
          type: number
        userDataDir:
          type: string
        preserveUserDataDir:
          type: boolean
        headless:
          type: boolean
        devtools:
          type: boolean
        chromiumSandbox:
          type: boolean
        ignoreDefaultArgs:
          # Either a boolean or a list of strings.
          anyOf:
            - type: boolean
            - type: array
              items:
                type: string
        proxy:
          # When present, `server` is the only mandatory field.
          type: object
          properties:
            server:
              type: string
            bypass:
              type: string
            username:
              type: string
            password:
              type: string
              # Annotation only: hints to documentation/UI tooling that the
              # value should be obscured. Validation is unchanged.
              format: password
          required:
            - server
          additionalProperties: false
        locale:
          type: string
        viewport:
          # When present, both dimensions are mandatory.
          type: object
          properties:
            width:
              type: number
            height:
              type: number
          required:
            - width
            - height
          additionalProperties: false
        deviceScaleFactor:
          type: number
        hasTouch:
          type: boolean
        ignoreHTTPSErrors:
          type: boolean
        cdpUrl:
          type: string
        cdpHeaders:
          # String-to-string map.
          type: object
          propertyNames:
            type: string
          additionalProperties:
            type: string
        connectTimeoutMs:
          type: number
        downloadsPath:
          type: string
        acceptDownloads:
          type: boolean
      additionalProperties: false
    # Session-creation parameters. No property is required; unknown keys are rejected.
    BrowserbaseSessionCreateParamsOutput:
      type: object
      properties:
        projectId: { type: string }
        browserSettings: { $ref: "#/components/schemas/BrowserbaseBrowserSettingsOutput" }
        extensionId: { type: string }
        keepAlive: { type: boolean }
        proxies:
          # Either a boolean or a list of ProxyConfigOutput entries.
          anyOf:
            - { type: boolean }
            - type: array
              items: { $ref: "#/components/schemas/ProxyConfigOutput" }
        region: { $ref: "#/components/schemas/BrowserbaseRegion" }
        timeout: { type: number }
        userMetadata:
          # Free-form object: values of any type are accepted.
          type: object
          propertyNames: { type: string }
          additionalProperties: {}
      additionalProperties: false
    # Browser session record. `id`, `env`, `status`, `modelName` and `available`
    # are required; everything else is optional.
    BrowserSessionOutput:
      type: object
      properties:
        id: { $ref: "#/components/schemas/BrowserSessionId" }
        env: { $ref: "#/components/schemas/BrowserSessionEnv" }
        status: { $ref: "#/components/schemas/BrowserSessionStatus" }
        modelName: { type: string }
        cdpUrl:
          # String or explicit null.
          anyOf: [{ type: string }, { type: "null" }]
        available: { type: boolean }
        browserbaseSessionId: { type: string }
        browserbaseSessionCreateParams: { $ref: "#/components/schemas/BrowserbaseSessionCreateParamsOutput" }
        localBrowserLaunchOptions: { $ref: "#/components/schemas/LocalBrowserLaunchOptionsOutput" }
        domSettleTimeoutMs: { type: number }
        verbose:
          # Accepts exactly the numbers 0, 1 or 2.
          anyOf:
            - { type: number, const: 0 }
            - { type: number, const: 1 }
            - { type: number, const: 2 }
        systemPrompt: { type: string }
        selfHeal: { type: boolean }
        waitForCaptchaSolves: { type: boolean }
        experimental: { type: boolean }
        actTimeoutMs: { type: number }
      required: [id, env, status, modelName, available]
      additionalProperties: false
    # Wrapper object with a single mandatory `browserSession` (a BrowserSessionOutput).
    BrowserSessionResultOutput:
      type: object
      properties:
        browserSession: { $ref: "#/components/schemas/BrowserSessionOutput" }
      required: [browserSession]
      additionalProperties: false
    # Alias: resolves to SessionHeadersOutput.
    BrowserSessionHeaders: { $ref: "#/components/schemas/SessionHeadersOutput" }
    # Parameter object with a single mandatory `id` (a BrowserSessionId).
    BrowserSessionIdParams:
      type: object
      properties:
        id: { $ref: "#/components/schemas/BrowserSessionId" }
      required: [id]
      additionalProperties: false
    # Fields of a browser-session action record. `pageId` and `completedAt`
    # are the only optional properties; `error` is required but may be null.
    BrowserSessionActionBase:
      type: object
      properties:
        id: { $ref: "#/components/schemas/ActionId" }
        method: { $ref: "#/components/schemas/BrowserSessionActionMethod" }
        status: { $ref: "#/components/schemas/BrowserSessionActionStatus" }
        sessionId: { $ref: "#/components/schemas/BrowserSessionId" }
        pageId: { $ref: "#/components/schemas/PageId" }
        createdAt: { $ref: "#/components/schemas/Timestamp" }
        updatedAt: { $ref: "#/components/schemas/Timestamp" }
        completedAt: { $ref: "#/components/schemas/Timestamp" }
        error:
          anyOf: [{ type: string }, { type: "null" }]
      required: [id, method, status, sessionId, createdAt, updatedAt, error]
      additionalProperties: false
    # Request envelope: `sessionId` and `params` are required, the request `id` is optional.
    BrowserSessionIsBrowserbaseRequest:
      type: object
      properties:
        id: { $ref: "#/components/schemas/RequestId" }
        sessionId: { $ref: "#/components/schemas/BrowserSessionId" }
        params: { $ref: "#/components/schemas/BrowserSessionIsBrowserbaseParams" }
      required: [sessionId, params]
      additionalProperties: false
    # Request envelope: `sessionId` and `params` are required, the request `id` is optional.
    BrowserSessionIsAdvancedStealthRequest:
      type: object
      properties:
        id: { $ref: "#/components/schemas/RequestId" }
        sessionId: { $ref: "#/components/schemas/BrowserSessionId" }
        params: { $ref: "#/components/schemas/BrowserSessionIsAdvancedStealthParams" }
      required: [sessionId, params]
      additionalProperties: false
    # Request envelope: `sessionId` and `params` are required, the request `id` is optional.
    BrowserSessionSetViewportSizeRequest:
      type: object
      properties:
        id: { $ref: "#/components/schemas/RequestId" }
        sessionId: { $ref: "#/components/schemas/BrowserSessionId" }
        params: { $ref: "#/components/schemas/BrowserSessionSetViewportSizeParams" }
      required: [sessionId, params]
      additionalProperties: false
    # Request envelope: `sessionId` and `params` are required, the request `id` is optional.
    BrowserSessionCloseRequest:
      type: object
      properties:
        id: { $ref: "#/components/schemas/RequestId" }
        sessionId: { $ref: "#/components/schemas/BrowserSessionId" }
        params: { $ref: "#/components/schemas/BrowserSessionCloseParams" }
      required: [sessionId, params]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a BrowserSessionIsBrowserbaseAction.
    BrowserSessionIsBrowserbaseResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/BrowserSessionIsBrowserbaseAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a BrowserSessionIsAdvancedStealthAction.
    BrowserSessionIsAdvancedStealthResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/BrowserSessionIsAdvancedStealthAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a BrowserSessionSetViewportSizeAction.
    BrowserSessionSetViewportSizeResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/BrowserSessionSetViewportSizeAction" }
      required: [success, error, action]
      additionalProperties: false
    # Success envelope: `success` is always true, `error` is always null,
    # and `action` holds a BrowserSessionCloseAction.
    BrowserSessionCloseResponse:
      type: object
      properties:
        success: { type: boolean, const: true }
        error: { type: "null" }
        action: { $ref: "#/components/schemas/BrowserSessionCloseAction" }
      required: [success, error, action]
      additionalProperties: false
    # Object with exactly one key, the required `actionId` (an ActionId).
    # NOTE(review): the name suggests route/path params for a browser-session
    # action lookup; the consuming route is not visible here, so confirm.
    BrowserSessionActionIdParams:
      type: object
      properties:
        actionId:
          $ref: "#/components/schemas/ActionId"
      required:
        - actionId
      additionalProperties: false
    # Query object for a browser-session action detail lookup: `sessionId`
    # (BrowserSessionId) is required, `id` (RequestId) is optional, and no
    # other keys are allowed.
    BrowserSessionActionDetailsQuery:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/BrowserSessionId"
      required:
        - sessionId
      additionalProperties: false
    # Query object for listing browser-session actions. Only `sessionId` is
    # required; `id`, `pageId`, `method`, `status`, and `limit` are optional.
    # No other keys are allowed.
    BrowserSessionActionListQuery:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/BrowserSessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        method:
          $ref: "#/components/schemas/BrowserSessionActionMethod"
        status:
          $ref: "#/components/schemas/BrowserSessionActionStatus"
        # `limit` must be an integer strictly greater than 0 and at most 500.
        limit:
          type: integer
          exclusiveMinimum: 0
          maximum: 500
      required:
        - sessionId
      additionalProperties: false
    # Failure-shaped response: `success` is pinned to false and `error` is a
    # PageError. `statusCode` and `stack` are also required; `action`
    # (a PageAction) is optional. No other keys are allowed.
    ValidationErrorResponse:
      type: object
      properties:
        success:
          type: boolean
          const: false
        error:
          $ref: "#/components/schemas/PageError"
        # Bounds are -(2^53 - 1) and 2^53 - 1, i.e. the JavaScript safe-integer
        # range; no HTTP-specific range is enforced by this schema.
        statusCode:
          type: integer
          minimum: -9007199254740991
          maximum: 9007199254740991
        # The key must be present, but its value may be null.
        stack:
          anyOf:
            - type: string
            - type: "null"
        action:
          $ref: "#/components/schemas/PageAction"
      required:
        - success
        - error
        - statusCode
        - stack
      additionalProperties: false
    # Field set describing a page action record: identity (`id`, `method`,
    # `status`), owning `sessionId`, optional `pageId`, timestamps, and an
    # `error` slot. `pageId` and `completedAt` are the only optional keys;
    # unlisted keys are rejected.
    PageActionBase:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/ActionId"
        method:
          $ref: "#/components/schemas/PageActionMethod"
        status:
          $ref: "#/components/schemas/PageActionStatus"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        createdAt:
          $ref: "#/components/schemas/Timestamp"
        updatedAt:
          $ref: "#/components/schemas/Timestamp"
        completedAt:
          $ref: "#/components/schemas/Timestamp"
        # `error` is always present: either a PageError or an explicit null.
        error:
          anyOf:
            - $ref: "#/components/schemas/PageError"
            - type: "null"
      required:
        - id
        - method
        - status
        - sessionId
        - createdAt
        - updatedAt
        - error
      additionalProperties: false
    # Request object for the page target-id call: `sessionId` (SessionId) is
    # required; `id` (RequestId) and `pageId` (PageId) are optional. No other
    # keys are allowed.
    PageTargetIdRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
      required:
        - sessionId
      additionalProperties: false
    # Request object for the page main-frame-id call: `sessionId` (SessionId)
    # is required; `id` (RequestId) and `pageId` (PageId) are optional. No
    # other keys are allowed.
    PageMainFrameIdRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
      required:
        - sessionId
      additionalProperties: false
    # Request object for the page main-frame call: `sessionId` (SessionId) is
    # required; `id` (RequestId) and `pageId` (PageId) are optional. No other
    # keys are allowed.
    PageMainFrameRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
      required:
        - sessionId
      additionalProperties: false
    # Request object for the page get-full-frame-tree call: `sessionId`
    # (SessionId) is required; `id` (RequestId) and `pageId` (PageId) are
    # optional. No other keys are allowed.
    PageGetFullFrameTreeRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
      required:
        - sessionId
      additionalProperties: false
    # Request object for the page as-protocol-frame-tree call. Unlike the
    # plain page requests, it requires `rootMainFrameId` (a FrameId) in
    # addition to `sessionId`; `id` and `pageId` stay optional. No other keys
    # are allowed.
    PageAsProtocolFrameTreeRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        rootMainFrameId:
          $ref: "#/components/schemas/FrameId"
      required:
        - sessionId
        - rootMainFrameId
      additionalProperties: false
    # Request object for the page list-all-frame-ids call: `sessionId`
    # (SessionId) is required; `id` (RequestId) and `pageId` (PageId) are
    # optional. No other keys are allowed.
    PageListAllFrameIdsRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
      required:
        - sessionId
      additionalProperties: false
    # Request object for the page get-ordinal call. Requires both `sessionId`
    # and `frameId` (a FrameId); `id` and `pageId` are optional. No other keys
    # are allowed.
    PageGetOrdinalRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        frameId:
          $ref: "#/components/schemas/FrameId"
      required:
        - sessionId
        - frameId
      additionalProperties: false
    # Request object for the page title call: `sessionId` (SessionId) is
    # required; `id` (RequestId) and `pageId` (PageId) are optional. No other
    # keys are allowed.
    PageTitleRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
      required:
        - sessionId
      additionalProperties: false
    # Request object for the page url call: `sessionId` (SessionId) is
    # required; `id` (RequestId) and `pageId` (PageId) are optional. No other
    # keys are allowed.
    PageUrlRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
      required:
        - sessionId
      additionalProperties: false
    # Request object for the page frames call: `sessionId` (SessionId) is
    # required; `id` (RequestId) and `pageId` (PageId) are optional. No other
    # keys are allowed.
    PageFramesRequest:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
      required:
        - sessionId
      additionalProperties: false
    # Object with exactly one key, the required `actionId` (an ActionId).
    # NOTE(review): the name suggests route/path params for a page action
    # lookup; the consuming route is not visible here, so confirm.
    PageActionIdParams:
      type: object
      properties:
        actionId:
          $ref: "#/components/schemas/ActionId"
      required:
        - actionId
      additionalProperties: false
    # Query object for a page action detail lookup: `sessionId` (SessionId) is
    # required, `id` (RequestId) is optional, and no other keys are allowed.
    PageActionDetailsQuery:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/SessionId"
      required:
        - sessionId
      additionalProperties: false
    # Query object for listing page actions. Only `sessionId` is required;
    # `id`, `pageId`, `method`, `status`, and `limit` are optional. No other
    # keys are allowed.
    PageActionListQuery:
      type: object
      properties:
        id:
          $ref: "#/components/schemas/RequestId"
        sessionId:
          $ref: "#/components/schemas/SessionId"
        pageId:
          $ref: "#/components/schemas/PageId"
        method:
          $ref: "#/components/schemas/PageActionMethod"
        status:
          $ref: "#/components/schemas/PageActionStatus"
        # `limit` must be an integer strictly greater than 0 and at most 500.
        limit:
          type: integer
          exclusiveMinimum: 0
          maximum: 500
      required:
        - sessionId
      additionalProperties: false
paths:
  # POST /v4/browsersession — create a browser session (operationId
  # BrowserSessionCreate). A JSON body matching BrowserSessionCreateRequest is
  # required. The `x-stream-response` header is not marked required and
  # accepts "true" or "false".
  # 200 returns BrowserSessionResponse; 400, 401 and 500 return
  # BrowserSessionErrorResponse.
  /v4/browsersession:
    post:
      operationId: BrowserSessionCreate
      summary: Create a browser session
      tags:
        - browserSession
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/BrowserSessionCreateRequest"
        required: true
      parameters:
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionResponse"
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionErrorResponse"
  # GET /v4/browsersession/{id} — get browser session status (operationId
  # BrowserSessionStatus). `id` is a required path parameter typed as
  # BrowserSessionId; the `x-stream-response` header is not marked required
  # and accepts "true" or "false". 200 returns BrowserSessionResponse.
  # NOTE(review): only the 200 response is declared, whereas
  # BrowserSessionCreate also declares 400/401/500 — confirm whether the error
  # responses are intentionally left out of this operation.
  /v4/browsersession/{id}:
    get:
      operationId: BrowserSessionStatus
      summary: Get browser session status
      tags:
        - browserSession
      parameters:
        - schema:
            $ref: "#/components/schemas/BrowserSessionId"
          in: path
          name: id
          required: true
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionResponse"
  # POST /v4/browsersession/{id}/end — end a browser session (operationId
  # BrowserSessionEnd). `id` is a required path parameter typed as
  # BrowserSessionId; the `x-stream-response` header is not marked required
  # and accepts "true" or "false". 200 returns BrowserSessionResponse.
  # NOTE(review): only the 200 response is declared, whereas
  # BrowserSessionCreate also declares 400/401/500 — confirm whether the error
  # responses are intentionally left out of this operation.
  /v4/browsersession/{id}/end:
    post:
      operationId: BrowserSessionEnd
      summary: End a browser session
      tags:
        - browserSession
      # Unlike the other POST operations in this file section, this request
      # body has no `required: true`; the schema also carries the
      # `x-fastify-zod-openapi-optional` extension next to its $ref.
      # NOTE(review): presumably the body may be omitted entirely — confirm.
      requestBody:
        content:
          application/json:
            schema:
              x-fastify-zod-openapi-optional: true
              $ref: "#/components/schemas/BrowserSessionEndRequest"
      parameters:
        - schema:
            $ref: "#/components/schemas/BrowserSessionId"
          in: path
          name: id
          required: true
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionResponse"
  # POST /v4/browsersession/addInitScript (operationId
  # BrowserSessionAddInitScript). A JSON body matching
  # BrowserSessionAddInitScriptRequest is required; the `x-stream-response`
  # header is not marked required and accepts "true" or "false".
  # 200 returns BrowserSessionAddInitScriptResponse; 400, 401, 404, 408, 422
  # and 500 all return BrowserSessionV4ErrorResponse.
  /v4/browsersession/addInitScript:
    post:
      operationId: BrowserSessionAddInitScript
      summary: browserSession.addInitScript
      tags:
        - browserSession
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/BrowserSessionAddInitScriptRequest"
        required: true
      parameters:
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionAddInitScriptResponse"
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
  # POST /v4/browsersession/setExtraHTTPHeaders (operationId
  # BrowserSessionSetExtraHTTPHeaders). A JSON body matching
  # BrowserSessionSetExtraHTTPHeadersRequest is required; the
  # `x-stream-response` header is not marked required and accepts "true" or
  # "false".
  # 200 returns BrowserSessionSetExtraHTTPHeadersResponse; 400, 401, 404, 408,
  # 422 and 500 all return BrowserSessionV4ErrorResponse.
  /v4/browsersession/setExtraHTTPHeaders:
    post:
      operationId: BrowserSessionSetExtraHTTPHeaders
      summary: browserSession.setExtraHTTPHeaders
      tags:
        - browserSession
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/BrowserSessionSetExtraHTTPHeadersRequest"
        required: true
      parameters:
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionSetExtraHTTPHeadersResponse"
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
  # POST /v4/browsersession/pages (operationId BrowserSessionPages). A JSON
  # body matching BrowserSessionPagesRequest is required; the
  # `x-stream-response` header is not marked required and accepts "true" or
  # "false".
  # 200 returns BrowserSessionPagesResponse; 400, 401, 404, 408, 422 and 500
  # all return BrowserSessionV4ErrorResponse.
  /v4/browsersession/pages:
    post:
      operationId: BrowserSessionPages
      summary: browserSession.pages
      tags:
        - browserSession
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/BrowserSessionPagesRequest"
        required: true
      parameters:
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionPagesResponse"
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
  # POST /v4/browsersession/activePage (operationId BrowserSessionActivePage).
  # A JSON body matching BrowserSessionActivePageRequest is required; the
  # `x-stream-response` header is not marked required and accepts "true" or
  # "false".
  # 200 returns BrowserSessionActivePageResponse; 400, 401, 404, 408, 422 and
  # 500 all return BrowserSessionV4ErrorResponse.
  /v4/browsersession/activePage:
    post:
      operationId: BrowserSessionActivePage
      summary: browserSession.activePage
      tags:
        - browserSession
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/BrowserSessionActivePageRequest"
        required: true
      parameters:
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionActivePageResponse"
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
  # POST /v4/browsersession/awaitActivePage (operationId
  # BrowserSessionAwaitActivePage). A JSON body matching
  # BrowserSessionAwaitActivePageRequest is required; the `x-stream-response`
  # header is not marked required and accepts "true" or "false".
  # 200 returns BrowserSessionAwaitActivePageResponse; 400, 401, 404, 408, 422
  # and 500 all return BrowserSessionV4ErrorResponse.
  /v4/browsersession/awaitActivePage:
    post:
      operationId: BrowserSessionAwaitActivePage
      summary: browserSession.awaitActivePage
      tags:
        - browserSession
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/BrowserSessionAwaitActivePageRequest"
        required: true
      parameters:
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionAwaitActivePageResponse"
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
  # POST /v4/browsersession/resolvePageByMainFrameId (operationId
  # BrowserSessionResolvePageByMainFrameId). A JSON body matching
  # BrowserSessionResolvePageByMainFrameIdRequest is required; the
  # `x-stream-response` header is not marked required and accepts "true" or
  # "false".
  # 200 returns BrowserSessionResolvePageByMainFrameIdResponse; 400, 401, 404,
  # 408, 422 and 500 all return BrowserSessionV4ErrorResponse.
  /v4/browsersession/resolvePageByMainFrameId:
    post:
      operationId: BrowserSessionResolvePageByMainFrameId
      summary: browserSession.resolvePageByMainFrameId
      tags:
        - browserSession
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/BrowserSessionResolvePageByMainFrameIdRequest"
        required: true
      parameters:
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionResolvePageByMainFrameIdResponse"
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
  # POST /v4/browsersession/getFullFrameTreeByMainFrameId (operationId
  # BrowserSessionGetFullFrameTreeByMainFrameId). A JSON body matching
  # BrowserSessionGetFullFrameTreeByMainFrameIdRequest is required; the
  # `x-stream-response` header is not marked required and accepts "true" or
  # "false".
  # 200 returns BrowserSessionGetFullFrameTreeByMainFrameIdResponse; 400, 401,
  # 404, 408, 422 and 500 all return BrowserSessionV4ErrorResponse.
  /v4/browsersession/getFullFrameTreeByMainFrameId:
    post:
      operationId: BrowserSessionGetFullFrameTreeByMainFrameId
      summary: browserSession.getFullFrameTreeByMainFrameId
      tags:
        - browserSession
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/BrowserSessionGetFullFrameTreeByMainFrameIdRequest"
        required: true
      parameters:
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionGetFullFrameTreeByMainFrameIdResponse"
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
  # POST /v4/browsersession/newPage (operationId BrowserSessionNewPage). A
  # JSON body matching BrowserSessionNewPageRequest is required; the
  # `x-stream-response` header is not marked required and accepts "true" or
  # "false".
  # 200 returns BrowserSessionNewPageResponse; 400, 401, 404, 408, 422 and 500
  # all return BrowserSessionV4ErrorResponse.
  /v4/browsersession/newPage:
    post:
      operationId: BrowserSessionNewPage
      summary: browserSession.newPage
      tags:
        - browserSession
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/BrowserSessionNewPageRequest"
        required: true
      parameters:
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionNewPageResponse"
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
  # POST /v4/browsersession/cookies (operationId BrowserSessionCookies). A
  # JSON body matching BrowserSessionCookiesRequest is required; the
  # `x-stream-response` header is not marked required and accepts "true" or
  # "false".
  # 200 returns BrowserSessionCookiesResponse; 400, 401, 404, 408, 422 and 500
  # all return BrowserSessionV4ErrorResponse.
  /v4/browsersession/cookies:
    post:
      operationId: BrowserSessionCookies
      summary: browserSession.cookies
      tags:
        - browserSession
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/BrowserSessionCookiesRequest"
        required: true
      parameters:
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionCookiesResponse"
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
  # POST /v4/browsersession/addCookies (operationId BrowserSessionAddCookies).
  # A JSON body matching BrowserSessionAddCookiesRequest is required; the
  # `x-stream-response` header is not marked required and accepts "true" or
  # "false".
  # 200 returns BrowserSessionAddCookiesResponse; 400, 401, 404, 408, 422 and
  # 500 all return BrowserSessionV4ErrorResponse.
  /v4/browsersession/addCookies:
    post:
      operationId: BrowserSessionAddCookies
      summary: browserSession.addCookies
      tags:
        - browserSession
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/BrowserSessionAddCookiesRequest"
        required: true
      parameters:
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionAddCookiesResponse"
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
  # POST /v4/browsersession/clearCookies (operationId: BrowserSessionClearCookies).
  # Takes a mandatory JSON body (BrowserSessionClearCookiesRequest) and answers 200 with
  # BrowserSessionClearCookiesResponse. Every documented error status
  # (400, 401, 404, 408, 422, 500) uses the BrowserSessionV4ErrorResponse schema.
  /v4/browsersession/clearCookies:
    post:
      operationId: BrowserSessionClearCookies
      summary: browserSession.clearCookies
      tags:
        - browserSession
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/BrowserSessionClearCookiesRequest"
        required: true
      parameters:
        # Header is not marked required, so clients may omit it. Note the values are the
        # strings "true"/"false", not YAML booleans.
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionClearCookiesResponse"
        # All error statuses below share one error schema.
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
  # POST /v4/browsersession/connectURL (operationId: BrowserSessionConnectURL).
  # Takes a mandatory JSON body (BrowserSessionConnectURLRequest) and answers 200 with
  # BrowserSessionConnectURLResponse. Every documented error status
  # (400, 401, 404, 408, 422, 500) uses the BrowserSessionV4ErrorResponse schema.
  /v4/browsersession/connectURL:
    post:
      operationId: BrowserSessionConnectURL
      summary: browserSession.connectURL
      tags:
        - browserSession
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/BrowserSessionConnectURLRequest"
        required: true
      parameters:
        # Header is not marked required, so clients may omit it. Note the values are the
        # strings "true"/"false", not YAML booleans.
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionConnectURLResponse"
        # All error statuses below share one error schema.
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
  # POST /v4/browsersession/configuredViewport (operationId: BrowserSessionConfiguredViewport).
  # Takes a mandatory JSON body (BrowserSessionConfiguredViewportRequest) and answers 200 with
  # BrowserSessionConfiguredViewportResponse. Every documented error status
  # (400, 401, 404, 408, 422, 500) uses the BrowserSessionV4ErrorResponse schema.
  /v4/browsersession/configuredViewport:
    post:
      operationId: BrowserSessionConfiguredViewport
      summary: browserSession.configuredViewport
      tags:
        - browserSession
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/BrowserSessionConfiguredViewportRequest"
        required: true
      parameters:
        # Header is not marked required, so clients may omit it. Note the values are the
        # strings "true"/"false", not YAML booleans.
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionConfiguredViewportResponse"
        # All error statuses below share one error schema.
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
  # POST /v4/browsersession/browserbaseSessionID (operationId: BrowserSessionBrowserbaseSessionID).
  # Takes a mandatory JSON body (BrowserSessionBrowserbaseSessionIDRequest) and answers 200 with
  # BrowserSessionBrowserbaseSessionIDResponse. Every documented error status
  # (400, 401, 404, 408, 422, 500) uses the BrowserSessionV4ErrorResponse schema.
  /v4/browsersession/browserbaseSessionID:
    post:
      operationId: BrowserSessionBrowserbaseSessionID
      summary: browserSession.browserbaseSessionID
      tags:
        - browserSession
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/BrowserSessionBrowserbaseSessionIDRequest"
        required: true
      parameters:
        # Header is not marked required, so clients may omit it. Note the values are the
        # strings "true"/"false", not YAML booleans.
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionBrowserbaseSessionIDResponse"
        # All error statuses below share one error schema.
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
  # POST /v4/browsersession/browserbaseSessionURL (operationId: BrowserSessionBrowserbaseSessionURL).
  # Takes a mandatory JSON body (BrowserSessionBrowserbaseSessionURLRequest) and answers 200 with
  # BrowserSessionBrowserbaseSessionURLResponse. Every documented error status
  # (400, 401, 404, 408, 422, 500) uses the BrowserSessionV4ErrorResponse schema.
  /v4/browsersession/browserbaseSessionURL:
    post:
      operationId: BrowserSessionBrowserbaseSessionURL
      summary: browserSession.browserbaseSessionURL
      tags:
        - browserSession
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/BrowserSessionBrowserbaseSessionURLRequest"
        required: true
      parameters:
        # Header is not marked required, so clients may omit it. Note the values are the
        # strings "true"/"false", not YAML booleans.
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionBrowserbaseSessionURLResponse"
        # All error statuses below share one error schema.
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
  # POST /v4/browsersession/browserbaseDebugURL (operationId: BrowserSessionBrowserbaseDebugURL).
  # Takes a mandatory JSON body (BrowserSessionBrowserbaseDebugURLRequest) and answers 200 with
  # BrowserSessionBrowserbaseDebugURLResponse. Every documented error status
  # (400, 401, 404, 408, 422, 500) uses the BrowserSessionV4ErrorResponse schema.
  /v4/browsersession/browserbaseDebugURL:
    post:
      operationId: BrowserSessionBrowserbaseDebugURL
      summary: browserSession.browserbaseDebugURL
      tags:
        - browserSession
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/BrowserSessionBrowserbaseDebugURLRequest"
        required: true
      parameters:
        # Header is not marked required, so clients may omit it. Note the values are the
        # strings "true"/"false", not YAML booleans.
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionBrowserbaseDebugURLResponse"
        # All error statuses below share one error schema.
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
  # GET /v4/browsersession/action (operationId: BrowserSessionActionList).
  # Has no request body; all inputs are query parameters. Only `sessionId` is marked
  # required; `id`, `pageId`, `method`, `status` and `limit` may be omitted.
  # Answers 200 with BrowserSessionActionListResponse. Every documented error status
  # (400, 401, 404, 408, 422, 500) uses the BrowserSessionV4ErrorResponse schema.
  /v4/browsersession/action:
    get:
      operationId: BrowserSessionActionList
      summary: browserSession.actions
      tags:
        - browserSession
      parameters:
        - schema:
            $ref: "#/components/schemas/RequestId"
          in: query
          name: id
        - schema:
            $ref: "#/components/schemas/BrowserSessionId"
          in: query
          name: sessionId
          required: true
        - schema:
            $ref: "#/components/schemas/PageId"
          in: query
          name: pageId
        - schema:
            $ref: "#/components/schemas/BrowserSessionActionMethod"
          in: query
          name: method
        - schema:
            $ref: "#/components/schemas/BrowserSessionActionStatus"
          in: query
          name: status
        # `limit` must be an integer strictly greater than 0 and at most 500.
        # NOTE(review): a numeric `exclusiveMinimum` is JSON Schema draft 6+ / OpenAPI 3.1
        # syntax (OpenAPI 3.0 expects a boolean here) - confirm against the spec's declared version.
        - schema:
            type: integer
            exclusiveMinimum: 0
            maximum: 500
          in: query
          name: limit
        # Header is not marked required, so clients may omit it. Note the values are the
        # strings "true"/"false", not YAML booleans.
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionActionListResponse"
        # All error statuses below share one error schema.
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
  # GET /v4/browsersession/action/{actionId} (operationId: BrowserSessionActionDetails).
  # Has no request body. `actionId` is the required path parameter (ActionId) and
  # `sessionId` is a required query parameter; the `id` query parameter may be omitted.
  # Answers 200 with BrowserSessionActionDetailsResponse. Every documented error status
  # (400, 401, 404, 408, 422, 500) uses the BrowserSessionV4ErrorResponse schema.
  /v4/browsersession/action/{actionId}:
    get:
      operationId: BrowserSessionActionDetails
      summary: browserSession.action
      tags:
        - browserSession
      parameters:
        - schema:
            $ref: "#/components/schemas/RequestId"
          in: query
          name: id
        - schema:
            $ref: "#/components/schemas/BrowserSessionId"
          in: query
          name: sessionId
          required: true
        # Binds the {actionId} segment of the path template.
        - schema:
            $ref: "#/components/schemas/ActionId"
          in: path
          name: actionId
          required: true
        # Header is not marked required, so clients may omit it. Note the values are the
        # strings "true"/"false", not YAML booleans.
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionActionDetailsResponse"
        # All error statuses below share one error schema.
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/BrowserSessionV4ErrorResponse"
  # POST /v4/page/click (operationId: PageClick).
  # Takes a mandatory JSON body (PageClickRequest) and answers 200 with PageClickResponse.
  # Every documented error status (400, 401, 404, 408, 422, 500) uses the V4ErrorResponse
  # schema, which is a different component from the BrowserSessionV4ErrorResponse used by
  # the /v4/browsersession/* operations.
  /v4/page/click:
    post:
      operationId: PageClick
      summary: page.click
      tags:
        - page
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/PageClickRequest"
        required: true
      parameters:
        # Header is not marked required, so clients may omit it. Note the values are the
        # strings "true"/"false", not YAML booleans.
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/PageClickResponse"
        # All error statuses below share one error schema.
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
  # POST /v4/page/hover (operationId: PageHover).
  # Takes a mandatory JSON body (PageHoverRequest) and answers 200 with PageHoverResponse.
  # Every documented error status (400, 401, 404, 408, 422, 500) uses the V4ErrorResponse
  # schema.
  /v4/page/hover:
    post:
      operationId: PageHover
      summary: page.hover
      tags:
        - page
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/PageHoverRequest"
        required: true
      parameters:
        # Header is not marked required, so clients may omit it. Note the values are the
        # strings "true"/"false", not YAML booleans.
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/PageHoverResponse"
        # All error statuses below share one error schema.
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
  # POST /v4/page/scroll (operationId: PageScroll).
  # Takes a mandatory JSON body (PageScrollRequest) and answers 200 with PageScrollResponse.
  # Every documented error status (400, 401, 404, 408, 422, 500) uses the V4ErrorResponse
  # schema.
  /v4/page/scroll:
    post:
      operationId: PageScroll
      summary: page.scroll
      tags:
        - page
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/PageScrollRequest"
        required: true
      parameters:
        # Header is not marked required, so clients may omit it. Note the values are the
        # strings "true"/"false", not YAML booleans.
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/PageScrollResponse"
        # All error statuses below share one error schema.
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
  # POST /v4/page/dragAndDrop (operationId: PageDragAndDrop).
  # Takes a mandatory JSON body (PageDragAndDropRequest) and answers 200 with
  # PageDragAndDropResponse. Every documented error status
  # (400, 401, 404, 408, 422, 500) uses the V4ErrorResponse schema.
  /v4/page/dragAndDrop:
    post:
      operationId: PageDragAndDrop
      summary: page.dragAndDrop
      tags:
        - page
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/PageDragAndDropRequest"
        required: true
      parameters:
        # Header is not marked required, so clients may omit it. Note the values are the
        # strings "true"/"false", not YAML booleans.
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/PageDragAndDropResponse"
        # All error statuses below share one error schema.
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
  # POST /v4/page/type (operationId: PageType).
  # Takes a mandatory JSON body (PageTypeRequest) and answers 200 with PageTypeResponse.
  # Every documented error status (400, 401, 404, 408, 422, 500) uses the V4ErrorResponse
  # schema.
  /v4/page/type:
    post:
      operationId: PageType
      summary: page.type
      tags:
        - page
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/PageTypeRequest"
        required: true
      parameters:
        # Header is not marked required, so clients may omit it. Note the values are the
        # strings "true"/"false", not YAML booleans.
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/PageTypeResponse"
        # All error statuses below share one error schema.
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
  # POST /v4/page/keyPress (operationId: PageKeyPress).
  # Takes a mandatory JSON body (PageKeyPressRequest) and answers 200 with
  # PageKeyPressResponse. Every documented error status
  # (400, 401, 404, 408, 422, 500) uses the V4ErrorResponse schema.
  /v4/page/keyPress:
    post:
      operationId: PageKeyPress
      summary: page.keyPress
      tags:
        - page
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/PageKeyPressRequest"
        required: true
      parameters:
        # Header is not marked required, so clients may omit it. Note the values are the
        # strings "true"/"false", not YAML booleans.
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/PageKeyPressResponse"
        # All error statuses below share one error schema.
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
  # POST /v4/page/goto (operationId: PageGoto).
  # Takes a mandatory JSON body (PageGotoRequest) and answers 200 with PageGotoResponse.
  # Every documented error status (400, 401, 404, 408, 422, 500) uses the V4ErrorResponse
  # schema.
  /v4/page/goto:
    post:
      operationId: PageGoto
      summary: page.goto
      tags:
        - page
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/PageGotoRequest"
        required: true
      parameters:
        # Header is not marked required, so clients may omit it. Note the values are the
        # strings "true"/"false", not YAML booleans.
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/PageGotoResponse"
        # All error statuses below share one error schema.
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
  # POST /v4/page/reload (operationId: PageReload).
  # Takes a mandatory JSON body (PageReloadRequest) and answers 200 with PageReloadResponse.
  # Every documented error status (400, 401, 404, 408, 422, 500) uses the V4ErrorResponse
  # schema.
  /v4/page/reload:
    post:
      operationId: PageReload
      summary: page.reload
      tags:
        - page
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/PageReloadRequest"
        required: true
      parameters:
        # Header is not marked required, so clients may omit it. Note the values are the
        # strings "true"/"false", not YAML booleans.
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/PageReloadResponse"
        # All error statuses below share one error schema.
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
  # POST /v4/page/goBack: operation PageGoBack, grouped under the "page" tag.
  # Takes a required JSON body (PageGoBackRequest); 200 returns PageGoBackResponse.
  /v4/page/goBack:
    post:
      operationId: PageGoBack
      summary: page.goBack
      tags:
        - page
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/PageGoBackRequest"
        required: true
      parameters:
        # Header carries no `required` flag, so it is optional; its value is a
        # string enum ("true"/"false"), not a YAML boolean.
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        # NOTE(review): only application/json is declared although the header above
        # mentions SSE; confirm whether text/event-stream should be listed as well.
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/PageGoBackResponse"
        # Every error status below (400/401/404/408/422/500) shares V4ErrorResponse.
        # NOTE(review): "Default Response" reads like a placeholder description.
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
  # POST /v4/page/goForward: operation PageGoForward, grouped under the "page" tag.
  # Takes a required JSON body (PageGoForwardRequest); 200 returns PageGoForwardResponse.
  /v4/page/goForward:
    post:
      operationId: PageGoForward
      summary: page.goForward
      tags:
        - page
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/PageGoForwardRequest"
        required: true
      parameters:
        # Header carries no `required` flag, so it is optional; its value is a
        # string enum ("true"/"false"), not a YAML boolean.
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        # NOTE(review): only application/json is declared although the header above
        # mentions SSE; confirm whether text/event-stream should be listed as well.
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/PageGoForwardResponse"
        # Every error status below (400/401/404/408/422/500) shares V4ErrorResponse.
        # NOTE(review): "Default Response" reads like a placeholder description.
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
  # POST /v4/page/close: operation PageClose, grouped under the "page" tag.
  # Takes a required JSON body (PageCloseRequest); 200 returns PageCloseResponse.
  /v4/page/close:
    post:
      operationId: PageClose
      summary: page.close
      tags:
        - page
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/PageCloseRequest"
        required: true
      parameters:
        # Header carries no `required` flag, so it is optional; its value is a
        # string enum ("true"/"false"), not a YAML boolean.
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        # NOTE(review): only application/json is declared although the header above
        # mentions SSE; confirm whether text/event-stream should be listed as well.
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/PageCloseResponse"
        # Every error status below (400/401/404/408/422/500) shares V4ErrorResponse.
        # NOTE(review): "Default Response" reads like a placeholder description.
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
  # POST /v4/page/enableCursorOverlay: operation PageEnableCursorOverlay, "page" tag.
  # Takes a required JSON body (PageEnableCursorOverlayRequest); 200 returns
  # PageEnableCursorOverlayResponse.
  /v4/page/enableCursorOverlay:
    post:
      operationId: PageEnableCursorOverlay
      summary: page.enableCursorOverlay
      tags:
        - page
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/PageEnableCursorOverlayRequest"
        required: true
      parameters:
        # Header carries no `required` flag, so it is optional; its value is a
        # string enum ("true"/"false"), not a YAML boolean.
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        # NOTE(review): only application/json is declared although the header above
        # mentions SSE; confirm whether text/event-stream should be listed as well.
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/PageEnableCursorOverlayResponse"
        # Every error status below (400/401/404/408/422/500) shares V4ErrorResponse.
        # NOTE(review): "Default Response" reads like a placeholder description.
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
  # POST /v4/page/addInitScript: operation PageAddInitScript, grouped under the "page" tag.
  # Takes a required JSON body (PageAddInitScriptRequest); 200 returns
  # PageAddInitScriptResponse.
  /v4/page/addInitScript:
    post:
      operationId: PageAddInitScript
      summary: page.addInitScript
      tags:
        - page
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/PageAddInitScriptRequest"
        required: true
      parameters:
        # Header carries no `required` flag, so it is optional; its value is a
        # string enum ("true"/"false"), not a YAML boolean.
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        # NOTE(review): only application/json is declared although the header above
        # mentions SSE; confirm whether text/event-stream should be listed as well.
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/PageAddInitScriptResponse"
        # Every error status below (400/401/404/408/422/500) shares V4ErrorResponse.
        # NOTE(review): "Default Response" reads like a placeholder description.
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
  # GET /v4/page/targetId: operation PageTargetId, grouped under the "page" tag.
  # No request body; inputs are query parameters. 200 returns PageTargetIdResponse.
  /v4/page/targetId:
    get:
      operationId: PageTargetId
      summary: page.targetId
      tags:
        - page
      parameters:
        # Query `id` (RequestId): no `required` flag, so optional.
        - schema:
            $ref: "#/components/schemas/RequestId"
          in: query
          name: id
        # Query `sessionId` (SessionId): the only required parameter here.
        - schema:
            $ref: "#/components/schemas/SessionId"
          in: query
          name: sessionId
          required: true
        # Query `pageId` (PageId): no `required` flag, so optional.
        - schema:
            $ref: "#/components/schemas/PageId"
          in: query
          name: pageId
        # Optional header; a string enum ("true"/"false"), not a YAML boolean.
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        # NOTE(review): only application/json is declared although the header above
        # mentions SSE; confirm whether text/event-stream should be listed as well.
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/PageTargetIdResponse"
        # Every error status below (400/401/404/408/422/500) shares V4ErrorResponse.
        # NOTE(review): "Default Response" reads like a placeholder description.
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
  # GET /v4/page/mainFrameId: operation PageMainFrameId, grouped under the "page" tag.
  # No request body; inputs are query parameters. 200 returns PageMainFrameIdResponse.
  /v4/page/mainFrameId:
    get:
      operationId: PageMainFrameId
      summary: page.mainFrameId
      tags:
        - page
      parameters:
        # Query `id` (RequestId): no `required` flag, so optional.
        - schema:
            $ref: "#/components/schemas/RequestId"
          in: query
          name: id
        # Query `sessionId` (SessionId): the only required parameter here.
        - schema:
            $ref: "#/components/schemas/SessionId"
          in: query
          name: sessionId
          required: true
        # Query `pageId` (PageId): no `required` flag, so optional.
        - schema:
            $ref: "#/components/schemas/PageId"
          in: query
          name: pageId
        # Optional header; a string enum ("true"/"false"), not a YAML boolean.
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        # NOTE(review): only application/json is declared although the header above
        # mentions SSE; confirm whether text/event-stream should be listed as well.
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/PageMainFrameIdResponse"
        # Every error status below (400/401/404/408/422/500) shares V4ErrorResponse.
        # NOTE(review): "Default Response" reads like a placeholder description.
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
  # GET /v4/page/mainFrame: operation PageMainFrame, grouped under the "page" tag.
  # No request body; inputs are query parameters. 200 returns PageMainFrameResponse.
  /v4/page/mainFrame:
    get:
      operationId: PageMainFrame
      summary: page.mainFrame
      tags:
        - page
      parameters:
        # Query `id` (RequestId): no `required` flag, so optional.
        - schema:
            $ref: "#/components/schemas/RequestId"
          in: query
          name: id
        # Query `sessionId` (SessionId): the only required parameter here.
        - schema:
            $ref: "#/components/schemas/SessionId"
          in: query
          name: sessionId
          required: true
        # Query `pageId` (PageId): no `required` flag, so optional.
        - schema:
            $ref: "#/components/schemas/PageId"
          in: query
          name: pageId
        # Optional header; a string enum ("true"/"false"), not a YAML boolean.
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        # NOTE(review): only application/json is declared although the header above
        # mentions SSE; confirm whether text/event-stream should be listed as well.
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/PageMainFrameResponse"
        # Every error status below (400/401/404/408/422/500) shares V4ErrorResponse.
        # NOTE(review): "Default Response" reads like a placeholder description.
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
  # GET /v4/page/getFullFrameTree: operation PageGetFullFrameTree, "page" tag.
  # No request body; inputs are query parameters. 200 returns
  # PageGetFullFrameTreeResponse.
  /v4/page/getFullFrameTree:
    get:
      operationId: PageGetFullFrameTree
      summary: page.getFullFrameTree
      tags:
        - page
      parameters:
        # Query `id` (RequestId): no `required` flag, so optional.
        - schema:
            $ref: "#/components/schemas/RequestId"
          in: query
          name: id
        # Query `sessionId` (SessionId): the only required parameter here.
        - schema:
            $ref: "#/components/schemas/SessionId"
          in: query
          name: sessionId
          required: true
        # Query `pageId` (PageId): no `required` flag, so optional.
        - schema:
            $ref: "#/components/schemas/PageId"
          in: query
          name: pageId
        # Optional header; a string enum ("true"/"false"), not a YAML boolean.
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        # NOTE(review): only application/json is declared although the header above
        # mentions SSE; confirm whether text/event-stream should be listed as well.
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/PageGetFullFrameTreeResponse"
        # Every error status below (400/401/404/408/422/500) shares V4ErrorResponse.
        # NOTE(review): "Default Response" reads like a placeholder description.
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
  # GET /v4/page/asProtocolFrameTree: operation PageAsProtocolFrameTree, "page" tag.
  # No request body; inputs are query parameters. 200 returns
  # PageAsProtocolFrameTreeResponse.
  /v4/page/asProtocolFrameTree:
    get:
      operationId: PageAsProtocolFrameTree
      summary: page.asProtocolFrameTree
      tags:
        - page
      parameters:
        # Query `id` (RequestId): no `required` flag, so optional.
        - schema:
            $ref: "#/components/schemas/RequestId"
          in: query
          name: id
        # Query `sessionId` (SessionId): required.
        - schema:
            $ref: "#/components/schemas/SessionId"
          in: query
          name: sessionId
          required: true
        # Query `pageId` (PageId): no `required` flag, so optional.
        - schema:
            $ref: "#/components/schemas/PageId"
          in: query
          name: pageId
        # Query `rootMainFrameId` (FrameId): required, specific to this operation.
        - schema:
            $ref: "#/components/schemas/FrameId"
          in: query
          name: rootMainFrameId
          required: true
        # Optional header; a string enum ("true"/"false"), not a YAML boolean.
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        # NOTE(review): only application/json is declared although the header above
        # mentions SSE; confirm whether text/event-stream should be listed as well.
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/PageAsProtocolFrameTreeResponse"
        # Every error status below (400/401/404/408/422/500) shares V4ErrorResponse.
        # NOTE(review): "Default Response" reads like a placeholder description.
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
  # GET /v4/page/listAllFrameIds: operation PageListAllFrameIds, "page" tag.
  # No request body; inputs are query parameters. 200 returns
  # PageListAllFrameIdsResponse.
  /v4/page/listAllFrameIds:
    get:
      operationId: PageListAllFrameIds
      summary: page.listAllFrameIds
      tags:
        - page
      parameters:
        # Query `id` (RequestId): no `required` flag, so optional.
        - schema:
            $ref: "#/components/schemas/RequestId"
          in: query
          name: id
        # Query `sessionId` (SessionId): the only required parameter here.
        - schema:
            $ref: "#/components/schemas/SessionId"
          in: query
          name: sessionId
          required: true
        # Query `pageId` (PageId): no `required` flag, so optional.
        - schema:
            $ref: "#/components/schemas/PageId"
          in: query
          name: pageId
        # Optional header; a string enum ("true"/"false"), not a YAML boolean.
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        # NOTE(review): only application/json is declared although the header above
        # mentions SSE; confirm whether text/event-stream should be listed as well.
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/PageListAllFrameIdsResponse"
        # Every error status below (400/401/404/408/422/500) shares V4ErrorResponse.
        # NOTE(review): "Default Response" reads like a placeholder description.
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
  # GET /v4/page/getOrdinal: operation PageGetOrdinal, grouped under the "page" tag.
  # No request body; inputs are query parameters. 200 returns PageGetOrdinalResponse.
  /v4/page/getOrdinal:
    get:
      operationId: PageGetOrdinal
      summary: page.getOrdinal
      tags:
        - page
      parameters:
        # Query `id` (RequestId): no `required` flag, so optional.
        - schema:
            $ref: "#/components/schemas/RequestId"
          in: query
          name: id
        # Query `sessionId` (SessionId): required.
        - schema:
            $ref: "#/components/schemas/SessionId"
          in: query
          name: sessionId
          required: true
        # Query `pageId` (PageId): no `required` flag, so optional.
        - schema:
            $ref: "#/components/schemas/PageId"
          in: query
          name: pageId
        # Query `frameId` (FrameId): required, specific to this operation.
        - schema:
            $ref: "#/components/schemas/FrameId"
          in: query
          name: frameId
          required: true
        # Optional header; a string enum ("true"/"false"), not a YAML boolean.
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        # NOTE(review): only application/json is declared although the header above
        # mentions SSE; confirm whether text/event-stream should be listed as well.
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/PageGetOrdinalResponse"
        # Every error status below (400/401/404/408/422/500) shares V4ErrorResponse.
        # NOTE(review): "Default Response" reads like a placeholder description.
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
  # GET /v4/page/title: operation PageTitle, grouped under the "page" tag.
  # No request body; inputs are query parameters. 200 returns PageTitleResponse.
  /v4/page/title:
    get:
      operationId: PageTitle
      summary: page.title
      tags:
        - page
      parameters:
        # Query `id` (RequestId): no `required` flag, so optional.
        - schema:
            $ref: "#/components/schemas/RequestId"
          in: query
          name: id
        # Query `sessionId` (SessionId): the only required parameter here.
        - schema:
            $ref: "#/components/schemas/SessionId"
          in: query
          name: sessionId
          required: true
        # Query `pageId` (PageId): no `required` flag, so optional.
        - schema:
            $ref: "#/components/schemas/PageId"
          in: query
          name: pageId
        # Optional header; a string enum ("true"/"false"), not a YAML boolean.
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        # NOTE(review): only application/json is declared although the header above
        # mentions SSE; confirm whether text/event-stream should be listed as well.
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/PageTitleResponse"
        # Every error status below (400/401/404/408/422/500) shares V4ErrorResponse.
        # NOTE(review): "Default Response" reads like a placeholder description.
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
  # GET /v4/page/url: operation PageUrl, grouped under the "page" tag.
  # No request body; inputs are query parameters. 200 returns PageUrlResponse.
  /v4/page/url:
    get:
      operationId: PageUrl
      summary: page.url
      tags:
        - page
      parameters:
        # Query `id` (RequestId): no `required` flag, so optional.
        - schema:
            $ref: "#/components/schemas/RequestId"
          in: query
          name: id
        # Query `sessionId` (SessionId): the only required parameter here.
        - schema:
            $ref: "#/components/schemas/SessionId"
          in: query
          name: sessionId
          required: true
        # Query `pageId` (PageId): no `required` flag, so optional.
        - schema:
            $ref: "#/components/schemas/PageId"
          in: query
          name: pageId
        # Optional header; a string enum ("true"/"false"), not a YAML boolean.
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        # NOTE(review): only application/json is declared although the header above
        # mentions SSE; confirm whether text/event-stream should be listed as well.
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/PageUrlResponse"
        # Every error status below (400/401/404/408/422/500) shares V4ErrorResponse.
        # NOTE(review): "Default Response" reads like a placeholder description.
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
  # GET /v4/page/frames: operation PageFrames, grouped under the "page" tag.
  # No request body; inputs are query parameters. 200 returns PageFramesResponse.
  /v4/page/frames:
    get:
      operationId: PageFrames
      summary: page.frames
      tags:
        - page
      parameters:
        # Query `id` (RequestId): no `required` flag, so optional.
        - schema:
            $ref: "#/components/schemas/RequestId"
          in: query
          name: id
        # Query `sessionId` (SessionId): the only required parameter here.
        - schema:
            $ref: "#/components/schemas/SessionId"
          in: query
          name: sessionId
          required: true
        # Query `pageId` (PageId): no `required` flag, so optional.
        - schema:
            $ref: "#/components/schemas/PageId"
          in: query
          name: pageId
        # Optional header; a string enum ("true"/"false"), not a YAML boolean.
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        # NOTE(review): only application/json is declared although the header above
        # mentions SSE; confirm whether text/event-stream should be listed as well.
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/PageFramesResponse"
        # Every error status below (400/401/404/408/422/500) shares V4ErrorResponse.
        # NOTE(review): "Default Response" reads like a placeholder description.
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
  /v4/page/setExtraHTTPHeaders:
    post:
      operationId: PageSetExtraHTTPHeaders
      summary: page.setExtraHTTPHeaders
      tags:
        - page
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/PageSetExtraHTTPHeadersRequest"
        required: true
      parameters:
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/PageSetExtraHTTPHeadersResponse"
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
  /v4/page/waitForMainLoadState:
    post:
      operationId: PageWaitForMainLoadState
      summary: page.waitForMainLoadState
      tags:
        - page
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/PageWaitForMainLoadStateRequest"
        required: true
      parameters:
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/PageWaitForMainLoadStateResponse"
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
  /v4/page/screenshot:
    post:
      operationId: PageScreenshot
      summary: page.screenshot
      tags:
        - page
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/PageScreenshotRequest"
        required: true
      parameters:
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/PageScreenshotResponse"
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
  /v4/page/snapshot:
    post:
      operationId: PageSnapshot
      summary: page.snapshot
      tags:
        - page
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/PageSnapshotRequest"
        required: true
      parameters:
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/PageSnapshotResponse"
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
  /v4/page/setViewportSize:
    post:
      operationId: PageSetViewportSize
      summary: page.setViewportSize
      tags:
        - page
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/PageSetViewportSizeRequest"
        required: true
      parameters:
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/PageSetViewportSizeResponse"
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
  /v4/page/waitForLoadState:
    post:
      operationId: PageWaitForLoadState
      summary: page.waitForLoadState
      tags:
        - page
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/PageWaitForLoadStateRequest"
        required: true
      parameters:
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/PageWaitForLoadStateResponse"
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
  /v4/page/waitForSelector:
    post:
      operationId: PageWaitForSelector
      summary: page.waitForSelector
      tags:
        - page
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/PageWaitForSelectorRequest"
        required: true
      parameters:
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/PageWaitForSelectorResponse"
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
  /v4/page/waitForTimeout:
    post:
      operationId: PageWaitForTimeout
      summary: page.waitForTimeout
      tags:
        - page
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/PageWaitForTimeoutRequest"
        required: true
      parameters:
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/PageWaitForTimeoutResponse"
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
  /v4/page/evaluate:
    post:
      operationId: PageEvaluate
      summary: page.evaluate
      tags:
        - page
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/PageEvaluateRequest"
        required: true
      parameters:
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/PageEvaluateResponse"
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
  /v4/page/sendCDP:
    post:
      operationId: PageSendCDP
      summary: page.sendCDP
      tags:
        - page
      requestBody:
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/PageSendCDPRequest"
        required: true
      parameters:
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/PageSendCDPResponse"
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
  /v4/page/action:
    get:
      operationId: PageActionList
      summary: page.action
      tags:
        - page
      parameters:
        - schema:
            $ref: "#/components/schemas/RequestId"
          in: query
          name: id
        - schema:
            $ref: "#/components/schemas/SessionId"
          in: query
          name: sessionId
          required: true
        - schema:
            $ref: "#/components/schemas/PageId"
          in: query
          name: pageId
        - schema:
            $ref: "#/components/schemas/PageActionMethod"
          in: query
          name: method
        - schema:
            $ref: "#/components/schemas/PageActionStatus"
          in: query
          name: status
        - schema:
            type: integer
            exclusiveMinimum: 0
            maximum: 500
          in: query
          name: limit
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/PageActionListResponse"
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
  /v4/page/action/{actionId}:
    get:
      operationId: PageActionDetails
      summary: page.actionById
      tags:
        - page
      parameters:
        - schema:
            $ref: "#/components/schemas/RequestId"
          in: query
          name: id
        - schema:
            $ref: "#/components/schemas/SessionId"
          in: query
          name: sessionId
          required: true
        - schema:
            $ref: "#/components/schemas/ActionId"
          in: path
          name: actionId
          required: true
        - schema:
            description: Whether to stream the response via SSE
            example: "true"
            type: string
            enum:
              - "true"
              - "false"
          in: header
          name: x-stream-response
          description: Whether to stream the response via SSE
      responses:
        "200":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/PageActionDetailsResponse"
        "400":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "401":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "404":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "408":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "422":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
        "500":
          description: Default Response
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/V4ErrorResponse"
servers:
  - url: https://api.stagehand.browserbase.com
security:
  - BrowserbaseApiKey: []
    BrowserbaseProjectId: []
    ModelApiKey: []


================================================
FILE: packages/server-v4/package.json
================================================
{
  "name": "@browserbasehq/stagehand-server-v4",
  "version": "3.6.1",
  "description": "Stagehand API server v4",
  "type": "module",
  "private": true,
  "scripts": {
    "build": "pnpm --filter @browserbasehq/stagehand-server-v4 run --parallel \"/^(build:esm-tests|build:server:dist|gen:openapi|build:sea:esm)$/\"",
    "dev": "tsx watch src/server.ts",
    "build:esm-tests": "pnpm -w --dir ../.. exec tsc -p packages/server-v4/tsconfig.tests.json",
    "build:server:dist": "pnpm -w --dir ../.. exec tsc -p packages/server-v4/tsconfig.json && pnpm -w --dir ../.. exec tsc-alias -p packages/server-v4/tsconfig.json",
    "build:sea:esm": "tsx scripts/build-sea.ts --mode=esm",
    "build:sea:cjs": "tsx scripts/build-sea.ts --mode=cjs",
    "lint": "cd ../.. && prettier --check packages/server-v4 && cd packages/server-v4 && eslint . && pnpm run typecheck",
    "typecheck": "pnpm -w --dir ../.. exec tsc -p packages/server-v4/tsconfig.json --noEmit",
    "test": "pnpm -w --dir ../.. exec turbo run test:server --filter=@browserbasehq/stagehand-server-v4 --",
    "test:server": "tsx scripts/test-server.ts",
    "test:integration": "pnpm run test:server -- packages/server-v4/dist/tests/integration",
    "test:integration:local": "STAGEHAND_SERVER_TARGET=local pnpm run test:server -- packages/server-v4/dist/tests/integration",
    "test:integration:sea": "STAGEHAND_SERVER_TARGET=sea pnpm run test:server -- packages/server-v4/dist/tests/integration",
    "gen:openapi": "tsx scripts/gen-openapi.ts"
  },
  "dependencies": {
    "@browserbasehq/sdk": "^2.7.0",
    "@browserbasehq/stagehand": "workspace:*",
    "@fastify/cors": "^11.0.1",
    "@fastify/swagger": "^9.6.1",
    "@fastify/swagger-ui": "^5.2.3",
    "@t3-oss/env-core": "^0.13.8",
    "fastify": "^5.3.2",
    "fastify-metrics": "^12.1.0",
    "fastify-plugin": "^4.5.1",
    "fastify-zod-openapi": "^5.5.0",
    "http-status-codes": "^2.3.0",
    "pino": "^9.7.0",
    "pino-pretty": "^11.3.0",
    "playwright": "1.52.0",
    "uuid": "^11.0.5",
    "zod": "^4.2.1"
  },
  "devDependencies": {
    "@types/node": "22.13.1",
    "eslint": "10.0.2",
    "eslint-plugin-security": "^3.0.1",
    "openai": "4.87.1",
    "postject": "1.0.0-alpha.6",
    "prettier": "^3.2.5",
    "source-map": "^0.7.4",
    "tsc-alias": "^1.8.10",
    "tsx": "*",
    "vitest": "^4.0.8"
  },
  "repository": {
    "type": "git",
    "url": "git+https://github.com/browserbase/stagehand.git",
    "directory": "packages/server-v4"
  },
  "bugs": {
    "url": "https://github.com/browserbase/stagehand/issues"
  },
  "homepage": "https://stagehand.dev"
}


================================================
FILE: packages/server-v4/scripts/build-sea.ts
================================================
#!/usr/bin/env node
/**
 * Build SEA binary from ESM (test) or CJS (release) bundles.
 *
 * Prereqs:
 * - CJS mode: runs core CJS build via Turbo if dist is missing.
 * - ESM mode: core dist/esm available (pnpm run build:esm).
 * - postject installed; tar available for non-Windows downloads.
 *
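 * Args: --mode=esm|cjs --target-platform=<platform> --target-arch=<arch> --binary-name=<name>
 *       --include-sourcemaps=<bool>
 *       (--platform and --arch are accepted as aliases; every flag may also be
 *       written as "--flag value". Command-line flags take precedence over env.)
 * Env: SEA_BUILD_MODE, SEA_TARGET_PLATFORM, SEA_TARGET_ARCH, SEA_BINARY_NAME,
 *      SEA_INCLUDE_SOURCEMAPS.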
 * Example: pnpm run build:sea:cjs -- --target-platform=linux --target-arch=arm64
 */
import { spawnSync } from "node:child_process";
import { createHash } from "node:crypto";
import fs from "node:fs";
import os from "node:os";
import path from "node:path";
import https from "node:https";
import { pathToFileURL } from "node:url";
import esbuild from "esbuild";
import { getRepoRootDir } from "./runtimePaths.js";

// Repository root directory, as returned by getRepoRootDir() from ./runtimePaths.js.
const repoDir = getRepoRootDir();

/**
 * Look up the value of a command-line flag in `process.argv`.
 *
 * Two spellings are recognised: `--name value` (the following token is used,
 * provided it is non-empty) and `--name=value` (may yield an empty string).
 * Tokens are scanned left to right and the first usable occurrence wins.
 *
 * @param name Flag name without the leading dashes.
 * @returns The flag's value, or `undefined` when the flag is absent.
 */
const argValue = (name: string) => {
  const flag = `--${name}`;
  const inlinePrefix = `${flag}=`;
  const argv = process.argv;

  for (const [index, token] of argv.entries()) {
    const following = argv[index + 1];
    if (token === flag && following) {
      return following;
    }
    if (token.startsWith(inlinePrefix)) {
      return token.slice(inlinePrefix.length);
    }
  }

  return undefined;
};

// Build mode, lower-cased. Resolution order: the --mode flag, then the
// SEA_BUILD_MODE environment variable, then the default "esm".
const mode = (
  argValue("mode") ??
  process.env.SEA_BUILD_MODE ??
  "esm"
).toLowerCase();
/**
 * Interpret a textual on/off switch.
 *
 * Matching is case-insensitive. "1", "true", "yes" and "on" mean `true`;
 * "0", "false", "no" and "off" mean `false`.
 *
 * @param value Raw text from a flag or environment variable, if any.
 * @param fallback Result to use when `value` is `undefined`.
 * @returns The parsed boolean, or `fallback` when no value was supplied.
 * @throws Error when `value` is defined but is not one of the accepted spellings.
 */
const parseBoolean = (
  value: string | undefined,
  fallback: boolean,
): boolean => {
  if (value === undefined) return fallback;

  switch (value.toLowerCase()) {
    case "1":
    case "true":
    case "yes":
    case "on":
      return true;
    case "0":
    case "false":
    case "no":
    case "off":
      return false;
    default:
      throw new Error(
        `Invalid boolean value "${value}" for --include-sourcemaps / SEA_INCLUDE_SOURCEMAPS`,
      );
  }
};
// Target platform for the binary. Resolution order: --target-platform,
// --platform, SEA_TARGET_PLATFORM, then the host's process.platform.
const targetPlatform =
  argValue("target-platform") ??
  argValue("platform") ??
  process.env.SEA_TARGET_PLATFORM ??
  process.platform;
// Target CPU architecture. Resolution order: --target-arch, --arch,
// SEA_TARGET_ARCH, then the host's process.arch.
const targetArch =
  argValue("target-arch") ??
  argValue("arch") ??
  process.env.SEA_TARGET_ARCH ??
  process.arch;
// Output file name. Resolution order: --binary-name, SEA_BINARY_NAME, then
// "stagehand-server-v4-<platform>-<arch>" with ".exe" appended for win32.
const binaryName =
  argValue("binary-name") ??
  process.env.SEA_BINARY_NAME ??
  `stagehand-server-v4-${targetPlatform}-${targetArch}${targetPlatform === "win32" ? ".exe" : ""}`;
// Sourcemap switch from --include-sourcemaps or SEA_INCLUDE_SOURCEMAPS;
// false when neither is set. parseBoolean throws on an unrecognised value.
const includeSourcemaps = parseBoolean(
  argValue("include-sourcemaps") ?? process.env.SEA_INCLUDE_SOURCEMAPS,
  false,
);

/**
 * Run a command synchronously with inherited stdio and fail loudly.
 *
 * @param cmd Executable to spawn.
 * @param args Arguments passed to the executable.
 * @param opts Optional spawn settings; `cwd` sets the working directory.
 * @throws Error when the process cannot be started, exits with a non-zero
 *   code, or is terminated by a signal. The message names the command and
 *   includes the exit code or signal so failures can be diagnosed from logs.
 */
const run = (cmd: string, args: string[], opts: { cwd?: string } = {}) => {
  const commandLine = `${cmd} ${args.join(" ")}`;
  const result = spawnSync(cmd, args, { stdio: "inherit", ...opts });

  if (result.error) {
    throw new Error(
      `Command failed to start: ${commandLine}\n${String(result.error)}`,
    );
  }

  if (result.status !== 0) {
    // status is null when the child was killed by a signal; report the signal
    // in that case instead of a meaningless "null" exit code.
    const reason =
      result.signal !== null
        ? `terminated by signal ${result.signal}`
        : `exit code ${String(result.status)}`;
    throw new Error(`Command failed: ${commandLine} (${reason})`);
  }
};

/**
 * Execute a JavaScript file with the Node binary that is running this script.
 *
 * @param scriptPath Path of the script to execute.
 * @param args Arguments forwarded to the script.
 * @param opts Optional spawn settings; `cwd` sets the working directory.
 * @throws Error propagated from `run` when the script fails.
 */
const runNodeScript = (
  scriptPath: string,
  args: string[],
  opts: { cwd?: string } = {},
) => {
  const nodeArgs = [scriptPath, ...args];
  return run(process.execPath, nodeArgs, opts);
};

/**
 * Pick the first candidate path that exists on disk.
 *
 * @param paths Candidate paths, checked in order.
 * @returns The first path for which `fs.existsSync` is true.
 * @throws Error listing every candidate when none of them exists.
 */
const resolveFirstExisting = (paths: string[]): string => {
  const found = paths.find((candidate) => fs.existsSync(candidate));
  if (found !== undefined) {
    return found;
  }
  throw new Error(`Missing tool script. Tried: ${paths.join(", ")}`);
};

/**
 * Best-effort variant of `run`: spawn a command synchronously with all stdio
 * discarded and disregard the outcome (start failures, exit code, signal).
 *
 * @param cmd Executable to spawn.
 * @param args Arguments passed to the executable.
 * @param opts Optional spawn settings; `cwd` sets the working directory.
 */
const runOptional = (
  cmd: string,
  args: string[],
  opts: { cwd?: string } = {},
) => {
  const quietOptions = { stdio: "ignore" as const, ...opts };
  spawnSync(cmd, args, quietOptions);
};

/**
 * Downloads `url` to `dest` over HTTPS, following redirects.
 *
 * - Relative `Location` headers are resolved against the URL that issued them.
 * - At most `maxRedirects` hops are followed, so a redirect loop fails instead
 *   of recursing forever.
 * - If the transfer fails after the destination file was opened, the partial
 *   file is removed so a later existence check cannot mistake a truncated
 *   download for a complete one.
 *
 * @param url          HTTPS URL to fetch.
 * @param dest         File path the response body is written to.
 * @param maxRedirects Remaining redirect hops allowed (defaults to 10).
 * @returns A promise that resolves once the file is fully written and closed,
 *          and rejects on a non-200 status, a bad redirect, or a stream error.
 */
const download = (
  url: string,
  dest: string,
  maxRedirects = 10,
): Promise<void> =>
  new Promise((resolve, reject) => {
    https
      .get(url, (res) => {
        const status = res.statusCode;
        if (status && status >= 300 && status < 400) {
          // Drain the redirect body so the socket is released.
          res.resume();
          const location = res.headers.location;
          if (!location) {
            reject(new Error(`Redirect without location: ${url}`));
            return;
          }
          if (maxRedirects <= 0) {
            reject(new Error(`Too many redirects: ${url}`));
            return;
          }
          let nextUrl: string;
          try {
            // Location may be relative; resolve it against the current URL.
            nextUrl = new URL(location, url).href;
          } catch {
            reject(
              new Error(`Invalid redirect location "${location}" from ${url}`),
            );
            return;
          }
          download(nextUrl, dest, maxRedirects - 1).then(resolve, reject);
          return;
        }
        if (status !== 200) {
          reject(new Error(`Download failed (${status}) ${url}`));
          res.resume();
          return;
        }

        const file = fs.createWriteStream(dest);
        // Guards against several error events settling the promise twice.
        let settled = false;
        const fail = (error: Error) => {
          if (settled) return;
          settled = true;
          res.destroy();
          file.destroy();
          // Remove the truncated file before reporting the failure.
          fs.rm(dest, { force: true }, () => reject(error));
        };

        res.on("error", fail);
        file.on("error", fail);
        file.on("finish", () => {
          file.close((closeError) => {
            if (closeError) {
              fail(closeError);
              return;
            }
            if (settled) return;
            settled = true;
            resolve();
          });
        });
        res.pipe(file);
      })
      .on("error", reject);
  });

/**
 * Locates the Node executable that will be turned into the SEA binary.
 *
 * Cross-platform targets are rejected. When the target architecture matches
 * the host, the running Node binary is returned. Otherwise the matching
 * official Node distribution (same version as the host) is downloaded and
 * extracted under the OS temp directory, reusing any earlier download or
 * extraction found there.
 *
 * @returns Absolute path of the Node executable to copy.
 * @throws Error for cross-platform targets, or when the binary is still
 *         missing after extraction.
 */
const resolveNodeBinary = async (): Promise<string> => {
  if (targetPlatform !== process.platform) {
    throw new Error(
      `Cross-platform builds are not supported. Host=${process.platform}, target=${targetPlatform}`,
    );
  }
  // Same architecture: the currently running Node binary can be used directly.
  if (targetArch === process.arch) return process.execPath;

  const nodeVersion = process.version;
  const distPlatform = targetPlatform === "win32" ? "win" : targetPlatform;
  const isWindowsDist = distPlatform === "win";
  const archiveExt = isWindowsDist ? "zip" : "tar.xz";
  const archiveBase = `node-${nodeVersion}-${distPlatform}-${targetArch}`;
  const archiveFile = `${archiveBase}.${archiveExt}`;

  const tmpRoot = `${os.tmpdir()}/stagehand-sea/${archiveBase}`;
  const archivePath = `${tmpRoot}/${archiveFile}`;
  const extractRoot = `${tmpRoot}/${archiveBase}`;
  const binaryPath = isWindowsDist
    ? `${extractRoot}/node.exe`
    : `${extractRoot}/bin/node`;

  // A previous run already extracted this distribution.
  if (fs.existsSync(binaryPath)) return binaryPath;

  fs.mkdirSync(tmpRoot, { recursive: true });
  const archiveAlreadyDownloaded = fs.existsSync(archivePath);
  if (!archiveAlreadyDownloaded) {
    await download(
      `https://nodejs.org/dist/${nodeVersion}/${archiveFile}`,
      archivePath,
    );
  }

  if (archiveExt !== "zip") {
    run("tar", ["-xf", archivePath, "-C", tmpRoot]);
  } else {
    if (process.platform !== "win32") {
      throw new Error("Windows binaries must be built on Windows runners.");
    }
    run("powershell", [
      "-Command",
      `Expand-Archive -Path '${archivePath}' -DestinationPath '${tmpRoot}' -Force`,
    ]);
  }

  if (fs.existsSync(binaryPath)) return binaryPath;
  throw new Error(`Missing Node binary at ${binaryPath}`);
};

/**
 * Writes the SEA config JSON for the current build mode and returns its path.
 *
 * `main` and `output` are stored relative to packages/server-v4 using forward
 * slashes; `execArgvExtension` is included only when a non-empty value is given.
 */
const writeSeaConfig = (
  mainPath: string,
  outputPath: string,
  execArgvExtension?: string,
) => {
  const packageDir = `${repoDir}/packages/server-v4`;
  const toPackageRelative = (target: string) =>
    path.relative(packageDir, target).replaceAll("\\", "/");

  const config: { main: string; output: string; execArgvExtension?: string } =
    {
      main: toPackageRelative(mainPath),
      output: toPackageRelative(outputPath),
    };
  if (execArgvExtension) {
    config.execArgvExtension = execArgvExtension;
  }

  const configPath = `${packageDir}/dist/sea/sea-config-${mode}.json`;
  fs.writeFileSync(configPath, JSON.stringify(config, null, 2));
  return configPath;
};

/**
 * Produces the CommonJS SEA entry bundle.
 *
 * Runs the turbo `build:cjs` task filtered to @browserbasehq/stagehand, then
 * bundles packages/server-v4/src/sea-entry.ts with esbuild into
 * dist/sea/bundle.cjs.
 *
 * @returns Path of the generated bundle.
 */
const buildCjsBundle = () => {
  const turboBin = resolveFirstExisting([
    `${repoDir}/node_modules/turbo/bin/turbo`,
  ]);
  const turboArgs = ["run", "build:cjs", "--filter", "@browserbasehq/stagehand"];
  runNodeScript(turboBin, turboArgs, { cwd: repoDir });

  const seaDir = `${repoDir}/packages/server-v4/dist/sea`;
  fs.mkdirSync(seaDir, { recursive: true });

  const bundlePath = `${seaDir}/bundle.cjs`;
  esbuild.buildSync({
    absWorkingDir: repoDir,
    entryPoints: ["packages/server-v4/src/sea-entry.ts"],
    outfile: bundlePath,
    bundle: true,
    platform: "node",
    format: "cjs",
    logLevel: "warning",
  });
  return bundlePath;
};

/**
 * Produces the ESM application bundle plus the CommonJS bootstrap that the SEA
 * blob uses as its entry point.
 *
 * Steps:
 * 1. Require packages/core/dist/esm/index.js to exist (throws otherwise).
 * 2. Bundle packages/server-v4/src/sea-entry.ts into dist/app.mjs with esbuild,
 *    aliasing @browserbasehq/stagehand to the core ESM build.
 * 3. When sourcemaps are enabled, rewrite the inline sourcemap so its sources
 *    are repo-relative and its sourceRoot is the repo's file:// URL.
 * 4. Write dist/sea/sea-bootstrap.cjs, which embeds the bundle as base64,
 *    writes it into a cache directory at startup, and imports it.
 *
 * @returns Path of the generated bootstrap script.
 * @throws Error when the core ESM build is missing, or when sourcemaps are
 *         requested but no inline sourcemap is found in the bundle.
 */
const buildEsmBundle = () => {
  if (!fs.existsSync(`${repoDir}/packages/core/dist/esm/index.js`)) {
    throw new Error(
      `Missing ${repoDir}/packages/core/dist/esm/index.js. Run pnpm run build:esm first.`,
    );
  }

  fs.mkdirSync(`${repoDir}/packages/server-v4/dist/sea`, { recursive: true });
  const appBundlePath = `${repoDir}/packages/server-v4/dist/app.mjs`;
  esbuild.buildSync({
    entryPoints: ["packages/server-v4/src/sea-entry.ts"],
    bundle: true,
    platform: "node",
    format: "esm",
    treeShaking: false,
    outfile: appBundlePath,
    alias: {
      "@browserbasehq/stagehand": `${repoDir}/packages/core/dist/esm/index.js`,
    },
    sourcemap: includeSourcemaps ? "inline" : false,
    sourcesContent: includeSourcemaps,
    ...(includeSourcemaps ? { sourceRoot: repoDir } : {}),
    // Defines a `require` function inside the ESM bundle via createRequire.
    banner: {
      js: 'import { createRequire as __createRequire } from "node:module"; const require = __createRequire(import.meta.url);',
    },
    logLevel: "warning",
    absWorkingDir: repoDir,
  });

  const appSource = fs.readFileSync(appBundlePath, "utf8");
  let finalAppSource = appSource;

  if (includeSourcemaps) {
    // Pull the base64 payload out of the trailing inline sourceMappingURL comment.
    const mapMatch = appSource.match(
      /sourceMappingURL=data:application\/json;base64,([A-Za-z0-9+/=]+)\s*$/,
    );
    if (!mapMatch) {
      throw new Error("Missing inline sourcemap in dist/app.mjs");
    }
    const mapJson = Buffer.from(mapMatch[1], "base64").toString("utf8");
    const map = JSON.parse(mapJson) as {
      sourceRoot?: string;
      sources: string[];
      sourcesContent?: string[];
    };
    // Normalizes Windows separators to forward slashes.
    const toPosix = (value: string) => value.replaceAll("\\", "/");
    // Converts a file:// URL to a path, dropping the leading slash before a
    // Windows drive letter ("/C:/..." -> "C:/...").
    const fileUrlToPathSafe = (value: string) => {
      const parsed = new URL(value);
      let pathname = decodeURIComponent(parsed.pathname);
      if (/^\/[A-Za-z]:/.test(pathname)) {
        pathname = pathname.slice(1);
      }
      return pathname;
    };
    // Maps one sourcemap `sources` entry to a repo-relative POSIX path where
    // possible; absolute paths outside the repo are returned unchanged.
    const toRepoRelative = (source: string) => {
      let sourcePath = source;
      if (source.startsWith("file://")) {
        sourcePath = fileUrlToPathSafe(source);
      }

      if (path.isAbsolute(sourcePath)) {
        const normalizedSourcePath = toPosix(sourcePath);
        if (normalizedSourcePath.startsWith(`${repoDir}/`)) {
          return toPosix(path.relative(repoDir, normalizedSourcePath));
        }
        return normalizedSourcePath;
      }

      // Known relative prefixes are rewritten to their repo-relative location.
      if (sourcePath.startsWith("../src/")) {
        const rel = sourcePath.slice("../src/".length);
        return `packages/server-v4/src/${rel}`;
      }
      if (sourcePath.startsWith("../../core/")) {
        const rel = sourcePath.slice("../../core/".length);
        return `packages/core/${rel}`;
      }
      if (sourcePath.startsWith("../../../node_modules/")) {
        const rel = sourcePath.slice("../../../node_modules/".length);
        return `node_modules/${rel}`;
      }
      if (sourcePath.startsWith("src/")) {
        const rel = sourcePath.slice("src/".length);
        return `packages/server-v4/src/${rel}`;
      }
      if (sourcePath.startsWith("../node_modules/")) {
        const rel = sourcePath.slice("../node_modules/".length);
        return `node_modules/${rel}`;
      }
      if (sourcePath.startsWith("../core/")) {
        const rel = sourcePath.slice("../core/".length);
        return `packages/core/${rel}`;
      }
      if (sourcePath.startsWith("core/")) {
        return `packages/core/${sourcePath.slice("core/".length)}`;
      }
      if (
        sourcePath.startsWith("packages/") ||
        sourcePath.startsWith("node_modules/")
      ) {
        return toPosix(sourcePath);
      }

      // Fallback: resolve against packages/server-v4 and relativize if the
      // result lands inside the repo.
      const resolved = toPosix(
        path.resolve(`${repoDir}/packages/server-v4`, sourcePath),
      );
      if (resolved.startsWith(`${repoDir}/`)) {
        return toPosix(path.relative(repoDir, resolved));
      }

      return toPosix(sourcePath);
    };

    map.sourceRoot = pathToFileURL(`${repoDir}/`).href;
    map.sources = map.sources.map(toRepoRelative);
    // Re-encode the map and swap it in for the original base64 payload.
    const updatedMap = Buffer.from(JSON.stringify(map)).toString("base64");
    finalAppSource = appSource.replace(mapMatch[1], updatedMap);
    fs.writeFileSync(appBundlePath, finalAppSource);
  }

  const appBytes = Buffer.from(finalAppSource);
  // Short content hash; the bootstrap uses it as the cache directory name.
  const bundleHash = createHash("sha256")
    .update(appBytes)
    .digest("hex")
    .slice(0, 12);
  const bootstrapPath = `${repoDir}/packages/server-v4/dist/sea/sea-bootstrap.cjs`;
  // Generated bootstrap source. At startup it writes the embedded bundle to
  // <cacheRoot>/<bundleHash>/app.mjs (cacheRoot is STAGEHAND_SEA_CACHE_DIR or a
  // folder under os.tmpdir()) unless a file of the same size already exists,
  // then dynamically imports it.
  const bootstrap = `/* eslint-disable */
const fs = require("node:fs");
const os = require("node:os");
const { pathToFileURL } = require("node:url");

const bundleBase64 = ${JSON.stringify(appBytes.toString("base64"))};
const bundleLength = ${appBytes.length};
const bundleHash = ${JSON.stringify(bundleHash)};

const cacheRoot =
  process.env.STAGEHAND_SEA_CACHE_DIR ||
  \`\${os.tmpdir()}/stagehand-server-v4-sea\`;
const cacheDir = \`\${cacheRoot}/\${bundleHash}\`;
const appPath = \`\${cacheDir}/app.mjs\`;

fs.mkdirSync(cacheDir, { recursive: true });
let needsWrite = true;
try {
  const stat = fs.statSync(appPath);
  needsWrite = stat.size !== bundleLength;
} catch {}

if (needsWrite) {
  const tmpPath =
    \`\${cacheDir}/app.mjs.tmp-\${process.pid}-\${Date.now().toString(16)}\`;
  fs.writeFileSync(tmpPath, Buffer.from(bundleBase64, "base64"));
  try {
    fs.renameSync(tmpPath, appPath);
  } catch (err) {
    if (!fs.existsSync(appPath)) throw err;
  }
  try {
    fs.chmodSync(appPath, 0o500);
  } catch {}
}

(async () => {
  await import(pathToFileURL(appPath).href);
})().catch((err) => {
  console.error(err);
  process.exitCode = 1;
});
`;
  fs.writeFileSync(bootstrapPath, bootstrap);
  return bootstrapPath;
};

/**
 * Builds the single-executable (SEA) server binary end to end:
 *
 * 1. Build the entry bundle for the selected `mode` ("cjs" or "esm").
 * 2. Write the SEA config and generate the preparation blob.
 * 3. Copy the target Node binary to dist/sea/<binaryName>.
 * 4. Inject the blob with postject (re-signing ad hoc on macOS).
 *
 * @throws Error for an unknown mode, when blob generation produces no file, or
 *         when any required build command fails.
 */
const main = async () => {
  const packageDir = `${repoDir}/packages/server-v4`;
  const seaDir = `${packageDir}/dist/sea`;
  const blobPath = `${seaDir}/sea-prep.blob`;
  fs.mkdirSync(seaDir, { recursive: true });

  let mainPath: string;
  let execArgvExtension: string | undefined;

  if (mode === "cjs") {
    mainPath = buildCjsBundle();
  } else if (mode === "esm") {
    mainPath = buildEsmBundle();
    execArgvExtension = "cli";
  } else {
    throw new Error(`Unknown SEA build mode: ${mode}`);
  }

  const seaConfigPath = writeSeaConfig(mainPath, blobPath, execArgvExtension);

  // Remove any blob left over from a previous build so the existence check
  // below proves that THIS run generated it.
  fs.rmSync(blobPath, { force: true });
  // Generate the blob with the Node binary running this script rather than
  // whatever `node` is on PATH: the binary the blob is injected into comes
  // from the same Node version (see resolveNodeBinary), so the two must match.
  run(process.execPath, ["--experimental-sea-config", seaConfigPath], {
    cwd: packageDir,
  });
  if (!fs.existsSync(blobPath)) {
    throw new Error(`Missing ${blobPath}; SEA blob generation failed.`);
  }

  const nodeBinary = await resolveNodeBinary();
  const outPath = `${seaDir}/${binaryName}`;
  fs.copyFileSync(nodeBinary, outPath);
  if (targetPlatform !== "win32") {
    fs.chmodSync(outPath, 0o755);
  }

  // macOS: strip the existing signature before modifying the binary.
  if (targetPlatform === "darwin") {
    runOptional("codesign", ["--remove-signature", outPath]);
  }

  const postjectCliPath = resolveFirstExisting([
    `${packageDir}/node_modules/postject/dist/cli.js`,
    `${repoDir}/node_modules/postject/dist/cli.js`,
  ]);
  const postjectArgs = [
    outPath,
    "NODE_SEA_BLOB",
    blobPath,
    "--sentinel-fuse",
    "NODE_SEA_FUSE_fce680ab2cc467b6e072b8b5df1996b2",
  ];
  if (targetPlatform === "darwin") {
    postjectArgs.push("--macho-segment-name", "NODE_SEA");
  }
  runNodeScript(postjectCliPath, postjectArgs, { cwd: packageDir });

  // macOS: apply an ad-hoc signature to the modified binary (best effort).
  if (targetPlatform === "darwin") {
    runOptional("codesign", ["--sign", "-", outPath]);
  }
};

// Script entry point: print only the failure message (no stack trace) and
// exit with status 1 when the build fails.
main().catch((err) => {
  console.error(err instanceof Error ? err.message : String(err));
  process.exit(1);
});


================================================
FILE: packages/server-v4/scripts/gen-openapi.ts
================================================
import { writeFile } from "node:fs/promises";
import path from "node:path";
import { getCurrentDirPath } from "./runtimePaths.js";

import fastify from "fastify";
import fastifySwagger from "@fastify/swagger";
import {
  fastifyZodOpenApiPlugin,
  fastifyZodOpenApiTransformers,
  serializerCompiler,
  validatorCompiler,
  type FastifyZodOpenApiTypeProvider,
} from "fastify-zod-openapi";
import { Api } from "@browserbasehq/stagehand";
import { browserSessionOpenApiComponents } from "../src/schemas/v4/browserSession.js";
import { pageOpenApiComponents } from "../src/schemas/v4/page.js";
import { browserSessionRoutes } from "../src/routes/v4/browsersession/routes.js";
import { pageRoutes } from "../src/routes/v4/page/routes.js";

// Routes
import healthcheckRoute from "../src/routes/healthcheck.js";
import readinessRoute from "../src/routes/readiness.js";

// Destination of the generated spec: openapi.v4.yaml one directory above the
// directory returned by getCurrentDirPath().
const OUTPUT_PATH = path.resolve(getCurrentDirPath(), "../openapi.v4.yaml");

/**
 * Generates the v4 OpenAPI document and writes it to OUTPUT_PATH.
 *
 * Builds a throwaway Fastify instance, registers the zod-openapi and swagger
 * plugins, mounts the browser-session and page routes under /v4 plus the
 * health/readiness routes, renders the spec as YAML, applies a few textual
 * fixes, writes the file, and closes the app.
 */
async function main() {
  const app = fastify({
    logger: false,
  }).withTypeProvider<FastifyZodOpenApiTypeProvider>();

  app.setValidatorCompiler(validatorCompiler);
  app.setSerializerCompiler(serializerCompiler);

  // Register all API schemas as components so fastify-zod-openapi can create $ref links
  const components = {
    schemas: {
      ...browserSessionOpenApiComponents.schemas,
      ...pageOpenApiComponents.schemas,
    },
  };

  await app.register(fastifyZodOpenApiPlugin, { components });

  // Top-level document metadata (info, servers, security) for the spec.
  await app.register(fastifySwagger, {
    openapi: {
      info: {
        title: "Stagehand API v4",
        version: "4.0.0",
        description: `Stagehand SDK for AI browser automation [ALPHA]. This API allows clients to
execute browser automation tasks remotely on the Browserbase cloud.
Create a browser session with /browsersession, then use that id with page routes.
Responses are streamed using Server-Sent Events (SSE) when the
\`x-stream-response: true\` header is provided.

This SDK is currently ALPHA software and is not production ready!
Please try it and give us your feedback, stay tuned for upcoming release announcements!`,
        contact: {
          name: "Browserbase",
          url: "https://browserbase.com",
        },
      },
      openapi: "3.1.0",
      servers: [
        {
          url: "https://api.stagehand.browserbase.com",
        },
      ],
      components: {
        securitySchemes: Api.openApiSecuritySchemes,
        links: Api.openApiLinks,
      },
      security: [
        { BrowserbaseApiKey: [], BrowserbaseProjectId: [], ModelApiKey: [] },
      ],
    },
    ...fastifyZodOpenApiTransformers,
  });

  // Mount every browser-session and page route under the /v4 prefix.
  await app.register(
    (instance, _opts, done) => {
      for (const route of browserSessionRoutes) {
        instance.route(route);
      }
      for (const route of pageRoutes) {
        instance.route(route);
      }
      done();
    },
    { prefix: "/v4" },
  );

  // Utility routes are registered at the root, outside the /v4 prefix.
  app.route(healthcheckRoute);
  app.route(readinessRoute);

  await app.ready();

  const yaml = app.swagger({ yaml: true });
  // Mintlify expects OpenAPI version fields to be strings, so quote them here.
  // The last two replacements drop the "(deprecated, v2 only)" suffix from two
  // field descriptions.
  const fixedYaml = yaml
    .replace(/^openapi:\s*(?!['"])([^#\s]+)\s*$/m, 'openapi: "$1"')
    .replace(/^ {2}version:\s*(?!['"])([^#\s]+)\s*$/m, '  version: "$1"')
    .replace(
      "description: Wait for captcha solves (deprecated, v2 only)",
      "description: Wait for captcha solves",
    )
    .replace(
      "description: Timeout in ms for act operations (deprecated, v2 only)",
      "description: Timeout in ms for act operations",
    );

  await writeFile(OUTPUT_PATH, fixedYaml, "utf8");

  await app.close();
  console.log(`OpenAPI spec written to ${OUTPUT_PATH}`);
}

// Script entry point: log the error and exit with status 1 if generation fails.
main().catch((err) => {
  console.error(err);
  process.exit(1);
});


================================================
FILE: packages/server-v4/scripts/runtimePaths.ts
================================================
/**
 * Keep this file in sync with:
 * - /packages/core/lib/v3/runtimePaths.ts
 * - /packages/server-v4/scripts/runtimePaths.ts
 * - /packages/evals/runtimePaths.ts
 * - /packages/docs/scripts/runtimePaths.js
 */
import path from "node:path";
import { fileURLToPath } from "node:url";
import { createRequire } from "node:module";

// Path fragment that identifies files belonging to this package; also used to
// derive the repo root from a file path.
const PACKAGE_SEGMENT = "/packages/server-v4/";
// File names reported for eval'd code; such stack frames carry no usable path.
const EVAL_FRAMES = new Set(["[eval]", "[eval]-wrapper"]);
// Names of this module's own functions. Stack frames for them are skipped when
// searching for the caller, so these names must match the function names below.
const INTERNAL_FRAME_NAMES = new Set([
  "readCallsites",
  "readCallsitePath",
  "resolveCallerFilePath",
  "getCurrentFilePath",
  "getCurrentDirPath",
  "getRepoRootDir",
  "getPackageRootDir",
  "createRequireFromCaller",
  "isMainModule",
]);

/**
 * Converts a path or file:// URL into an absolute path that uses forward
 * slashes only.
 */
const normalizePath = (value: string): string => {
  const isFileUrl = value.startsWith("file://");
  const fsPath = isFileUrl ? fileURLToPath(value) : value;
  const absolute = path.resolve(fsPath);
  return absolute.replace(/\\/g, "/");
};

/**
 * Captures the current call stack as structured CallSite objects by
 * temporarily swapping `Error.prepareStackTrace`; the previous hook is always
 * restored.
 */
const readCallsites = (): NodeJS.CallSite[] => {
  const savedHook = Error.prepareStackTrace;
  try {
    // Return the raw frames instead of the formatted stack string.
    Error.prepareStackTrace = (_error, frames) => frames;
    const captured = new Error().stack as unknown as
      | NodeJS.CallSite[]
      | undefined;
    return captured ?? [];
  } finally {
    Error.prepareStackTrace = savedHook;
  }
};

// CallSite shape including the optional getScriptNameOrSourceURL accessor,
// which is consulted when getFileName() yields nothing.
type CallSiteWithScriptName = NodeJS.CallSite & {
  getScriptNameOrSourceURL?: () => string | null;
};

/**
 * Extracts a normalized file path from a stack frame.
 *
 * @returns The normalized path, or null when the frame has no path, belongs to
 *          a `node:` built-in, or is an eval frame.
 */
const readCallsitePath = (callsite: NodeJS.CallSite): string | null => {
  const scriptAware = callsite as CallSiteWithScriptName;
  const rawPath =
    callsite.getFileName() ?? scriptAware.getScriptNameOrSourceURL?.();

  if (!rawPath || rawPath.startsWith("node:") || EVAL_FRAMES.has(rawPath)) {
    return null;
  }
  return normalizePath(rawPath);
};

/**
 * Reports whether a stack frame belongs to one of this module's own helpers,
 * judged by its function name, its method name, or its rendered string.
 */
const isInternalCallsite = (callsite: NodeJS.CallSite): boolean => {
  const isInternalName = (name: string | null | undefined): boolean =>
    name ? INTERNAL_FRAME_NAMES.has(name) : false;

  if (isInternalName(callsite.getFunctionName())) return true;
  if (isInternalName(callsite.getMethodName())) return true;

  // Last resort: look for "<name> (" or ".<name> (" in the formatted frame.
  const rendered = callsite.toString();
  return Array.from(INTERNAL_FRAME_NAMES).some(
    (frameName) =>
      rendered.includes(`${frameName} (`) ||
      rendered.includes(`.${frameName} (`),
  );
};

/**
 * Finds the file of the nearest caller outside this module.
 *
 * Walks the stack from the innermost frame outward, skipping frames without a
 * usable path and frames for this module's own helpers. The first frame whose
 * path contains PACKAGE_SEGMENT wins; if there is none, the first remaining
 * frame is used.
 *
 * @throws Error when no frame qualifies.
 */
const resolveCallerFilePath = (): string => {
  let firstFallback: string | undefined;

  for (const callsite of readCallsites()) {
    const filePath = readCallsitePath(callsite);
    if (!filePath || isInternalCallsite(callsite)) continue;

    // The earliest in-package frame always takes priority, so stop here.
    if (filePath.includes(PACKAGE_SEGMENT)) return filePath;

    if (firstFallback === undefined) firstFallback = filePath;
  }

  if (firstFallback) return firstFallback;

  throw new Error("Unable to resolve caller file path.");
};

/**
 * Returns the normalized path of the file that called this function, as
 * determined from the call stack (frames for this module's helpers are skipped).
 */
export const getCurrentFilePath = (): string => resolveCallerFilePath();

/** Returns the directory containing the calling file. */
export const getCurrentDirPath = (): string =>
  path.dirname(getCurrentFilePath());

/**
 * Returns the repository root, taken as everything before the last occurrence
 * of PACKAGE_SEGMENT in the calling file's path.
 *
 * @throws Error when the calling file's path does not contain PACKAGE_SEGMENT.
 */
export const getRepoRootDir = (): string => {
  const currentFilePath = getCurrentFilePath();
  const index = currentFilePath.lastIndexOf(PACKAGE_SEGMENT);
  if (index === -1) {
    throw new Error(
      `Unable to determine repo root from ${currentFilePath} (missing ${PACKAGE_SEGMENT}).`,
    );
  }
  return currentFilePath.slice(0, index);
};

/**
 * Returns this package's root directory: the repo root followed by
 * PACKAGE_SEGMENT without its trailing slash.
 */
export const getPackageRootDir = (): string =>
  `${getRepoRootDir()}${PACKAGE_SEGMENT.slice(0, -1)}`;

/** Creates a `require` function that resolves modules relative to the calling file. */
export const createRequireFromCaller = () =>
  createRequire(getCurrentFilePath());

/**
 * Reports whether the calling file is the script Node was started with, by
 * comparing the normalized `process.argv[1]` to the caller's file path.
 * Returns false when there is no entry script argument.
 */
export const isMainModule = (): boolean => {
  const entryScript = process.argv.at(1);
  if (!entryScript) return false;
  return normalizePath(entryScript) === getCurrentFilePath();
};


================================================
FILE: packages/server-v4/scripts/test-server.ts
================================================
/**
 * Server unit + integration tests on dist/esm + SEA/local server targets.
 *
 * Prereqs:
 * - pnpm run build (packages/server-v4/dist/tests + packages/server-v4/dist/server.js).
 * - SEA integration still requires build:sea when STAGEHAND_SERVER_TARGET=sea.
 *
 * Args: [test paths...] -- [node --test args...] | --list (prints JSON matrix)
 * Env: STAGEHAND_SERVER_TARGET=sea|local|remote, STAGEHAND_BASE_URL, SEA_BINARY_NAME,
 *      NODE_TEST_CONSOLE_REPORTER, NODE_TEST_REPORTER, NODE_TEST_REPORTER_DESTINATION,
 *      NODE_V8_COVERAGE; writes CTRF to ctrf/node-test-*.xml by default.
 * Example: STAGEHAND_SERVER_TARGET=sea pnpm run test:server -- packages/server-v4/dist/tests/integration/v4/start.test.js
 */
import fs from "node:fs";
import path from "node:path";
import { spawn, spawnSync } from "node:child_process";
import { getRepoRootDir } from "./runtimePaths.js";

/** Creates the directory that will contain `filePath`, including any missing ancestors. */
const ensureParentDir = (filePath: string) => {
  const parentDir = path.dirname(filePath);
  fs.mkdirSync(parentDir, { recursive: true });
};

/**
 * Splits CLI arguments into test paths and extra `node --test` arguments.
 *
 * Leading "--" separators are dropped. Options that appear before the first
 * path (tokens starting with "-") go to `extra`; an option without "=" also
 * takes the following token as its value when that token is not itself an
 * option. Of what remains, everything before the next "--" is a path and
 * everything after it is appended to `extra`.
 */
const splitArgs = (args: string[]) => {
  let cursor = 0;
  const skipSeparators = () => {
    while (args[cursor] === "--") cursor += 1;
  };

  skipSeparators();

  const leadingExtra: string[] = [];
  while (cursor < args.length && args[cursor].startsWith("-")) {
    const option = args[cursor];
    cursor += 1;
    if (option === "--") break;
    leadingExtra.push(option);

    // "--flag value": take the value along unless the flag used "--flag=value".
    const next = args[cursor];
    const hasInlineValue = option.includes("=");
    if (!hasInlineValue && next && next !== "--" && !next.startsWith("-")) {
      leadingExtra.push(next);
      cursor += 1;
    }
  }

  skipSeparators();

  const remaining = args.slice(cursor);
  const separatorIndex = remaining.indexOf("--");
  if (separatorIndex === -1) {
    return { paths: remaining, extra: [...leadingExtra] };
  }
  return {
    paths: remaining.slice(0, separatorIndex),
    extra: [...leadingExtra, ...remaining.slice(separatorIndex + 1)],
  };
};

/** Replaces every forward slash and backslash in `name` with "-". */
const toSafeName = (name: string) => name.split(/[\\/]/).join("-");

/**
 * Recursively lists files under `dir` whose names end with `suffix`.
 *
 * @returns Sorted "/"-joined paths; an empty array when `dir` does not exist.
 */
const collectFiles = (dir: string, suffix: string) => {
  const matches: string[] = [];
  if (!fs.existsSync(dir)) return matches;

  // Explicit work list instead of recursion; the final sort fixes the order.
  const pending: string[] = [dir];
  while (pending.length > 0) {
    const current = pending.pop() as string;
    for (const entry of fs.readdirSync(current, { withFileTypes: true })) {
      const entryPath = `${current}/${entry.name}`;
      if (entry.isDirectory()) {
        pending.push(entryPath);
      } else if (entry.isFile() && entry.name.endsWith(suffix)) {
        matches.push(entryPath);
      }
    }
  }
  return matches.sort();
};

// Repository root as reported by getRepoRootDir(); base for every path below.
const repoRoot = getRepoRootDir();

/**
 * Converts a JUnit XML report to CTRF JSON via `pnpm exec junit-to-ctrf`.
 *
 * Does nothing when the report is missing or empty. The output sits next to
 * the input with ".xml" swapped for ".json" (or ".json" appended). A failed
 * conversion only logs a warning.
 */
const writeCtrfFromJunit = (junitPath: string, tool: string) => {
  const hasReport =
    fs.existsSync(junitPath) && fs.statSync(junitPath).size > 0;
  if (!hasReport) return;

  const xmlSuffix = /\.xml$/i;
  const ctrfPath = xmlSuffix.test(junitPath)
    ? junitPath.replace(xmlSuffix, ".json")
    : `${junitPath}.json`;

  const converterArgs = [
    "exec",
    "junit-to-ctrf",
    junitPath,
    "-o",
    ctrfPath,
    "-t",
    tool,
  ];
  const { status: exitCode } = spawnSync("pnpm", converterArgs, {
    stdio: "inherit",
    cwd: repoRoot,
  });
  if (exitCode !== 0) {
    console.warn(`CTRF conversion failed for ${junitPath}.`);
  }
};

// TypeScript test sources (used by --list to enumerate tests).
const sourceTestsDir = `${repoRoot}/packages/server-v4/test`;
const sourceUnitDir = `${sourceTestsDir}/unit`;
const sourceIntegrationDir = `${sourceTestsDir}/integration`;
// Compiled test output under dist/tests (what node --test actually runs).
const unitDir = `${repoRoot}/packages/server-v4/dist/tests/unit`;
const integrationDir = `${repoRoot}/packages/server-v4/dist/tests/integration`;
const allTestsDir = `${repoRoot}/packages/server-v4/dist/tests`;

/** Returns `value` unchanged when absolute, otherwise resolves it against the repo root. */
const resolveRepoRelative = (value: string) => {
  if (path.isAbsolute(value)) return value;
  return path.resolve(repoRoot, value);
};

/**
 * Removes `--test-reporter` / `--test-reporter-destination` options from an
 * argument list, in both "--flag value" and "--flag=value" forms.
 *
 * @returns The remaining arguments and whether anything was removed.
 */
const stripNodeReporterArgs = (argsList: string[]) => {
  const isBareReporterFlag = (arg: string) =>
    arg === "--test-reporter" || arg === "--test-reporter-destination";
  const isInlineReporterFlag = (arg: string) =>
    arg.startsWith("--test-reporter=") ||
    arg.startsWith("--test-reporter-destination=");

  const filtered: string[] = [];
  let removed = false;
  let cursor = 0;
  while (cursor < argsList.length) {
    const arg = argsList[cursor];
    cursor += 1;

    const bare = isBareReporterFlag(arg);
    if (!bare && !isInlineReporterFlag(arg)) {
      filtered.push(arg);
      continue;
    }

    removed = true;
    // A bare flag is followed by its value; drop that too when present.
    if (bare && argsList[cursor]) cursor += 1;
  }
  return { filtered, removed };
};

/**
 * Derives a report name for a compiled test file: its "/"-separated path
 * relative to `root` when it lies inside `root`, otherwise its base name —
 * with the ".test.js" suffix removed in both cases.
 */
const toTestName = (testPath: string, root: string) => {
  const stripTestSuffix = (value: string) => value.replace(/\.test\.js$/i, "");

  const absolutePath = resolveRepoRelative(testPath);
  const relativeToRoot = path
    .relative(root, absolutePath)
    .replaceAll("\\", "/");
  const isOutsideRoot = relativeToRoot.startsWith("..");

  return stripTestSuffix(
    isOutsideRoot ? path.basename(absolutePath) : relativeToRoot,
  );
};

const rawArgs = process.argv.slice(2);
const listRequested = rawArgs.includes("--list");

// --list mode: print a JSON array describing every test found in the SOURCE
// tree (mapped to its compiled dist path), then exit without running anything.
if (listRequested) {
  // Unit tests are named by file base name only.
  const unitTests = collectFiles(sourceUnitDir, ".test.ts").map((file) => {
    const relSource = path.relative(sourceTestsDir, file).replaceAll("\\", "/");
    const distPath = `${repoRoot}/packages/server-v4/dist/tests/${relSource.replace(/\.test\.ts$/, ".test.js")}`;
    const name = path.basename(file, ".test.ts");
    return {
      path: path.relative(repoRoot, distPath).replaceAll("\\", "/"),
      name,
      safe_name: toSafeName(name),
    };
  });
  // Integration tests are named by their path relative to the integration dir.
  const integrationTests = collectFiles(sourceIntegrationDir, ".test.ts").map(
    (file) => {
      const relSource = path
        .relative(sourceTestsDir, file)
        .replaceAll("\\", "/");
      const distPath = `${repoRoot}/packages/server-v4/dist/tests/${relSource.replace(/\.test\.ts$/, ".test.js")}`;
      const rel = path
        .relative(sourceIntegrationDir, file)
        .replaceAll("\\", "/")
        .replace(/\.test\.ts$/, "");
      return {
        path: path.relative(repoRoot, distPath).replaceAll("\\", "/"),
        name: rel,
        safe_name: toSafeName(rel),
      };
    },
  );
  console.log(JSON.stringify([...unitTests, ...integrationTests]));
  process.exit(0);
}

// Separate test paths from extra node --test arguments, then drop any reporter
// overrides: this script always supplies its own reporter flags.
const { paths, extra } = splitArgs(rawArgs);
const { filtered: extraArgs, removed: removedReporterOverride } =
  stripNodeReporterArgs(extra);
if (removedReporterOverride) {
  console.warn(
    "Ignoring node --test reporter overrides to preserve console + JUnit output.",
  );
}

// The compiled tests must exist before anything can run.
if (!fs.existsSync(allTestsDir)) {
  console.error(
    "Missing packages/server-v4/dist/tests. Run pnpm run build first.",
  );
  process.exit(1);
}

// Which server the integration tests talk to; defaults to the SEA binary.
const serverTarget = (
  process.env.STAGEHAND_SERVER_TARGET ?? "sea"
).toLowerCase();
const explicitBaseUrl = process.env.STAGEHAND_BASE_URL;
const baseUrl = explicitBaseUrl ?? "http://stagehand-api.localhost:3107";

// A remote target has no local default, so the URL must be given explicitly.
if (serverTarget === "remote" && !explicitBaseUrl) {
  console.error("Missing STAGEHAND_BASE_URL for remote server target.");
  process.exit(1);
}

if (
  serverTarget === "local" &&
  !fs.existsSync(`${repoRoot}/packages/server-v4/dist/server.js`)
) {
  console.error(
    "Missing packages/server-v4/dist/server.js. Run pnpm run build first.",
  );
  process.exit(1);
}

// Derive the port from the base URL, falling back to the protocol default.
const parsedBaseUrl = new URL(baseUrl);
const port =
  parsedBaseUrl.port || (parsedBaseUrl.protocol === "https:" ? "443" : "80");

// These variables are inherited by the spawned server and test processes.
process.env.PORT = port;
process.env.STAGEHAND_API_URL = baseUrl;
process.env.BB_ENV = process.env.BB_ENV ?? "local";

// Append --enable-source-maps to any NODE_OPTIONS already set.
const baseNodeOptions = "--enable-source-maps";
const nodeOptions = [process.env.NODE_OPTIONS, baseNodeOptions]
  .filter(Boolean)
  .join(" ");

// Explicit paths from the command line, or every compiled unit + integration test.
const allPaths =
  paths.length > 0
    ? paths.map(resolveRepoRelative)
    : [
        ...collectFiles(unitDir, ".test.js"),
        ...collectFiles(integrationDir, ".test.js"),
      ];

// Classify by location; paths outside both directories are in neither list.
const unitPaths = allPaths.filter((p) =>
  p.replaceAll("\\", "/").includes("/packages/server-v4/dist/tests/unit/"),
);
const integrationPaths = allPaths.filter((p) =>
  p
    .replaceAll("\\", "/")
    .includes("/packages/server-v4/dist/tests/integration/"),
);

// When exactly one test is selected, coverage goes to a per-test directory;
// otherwise everything shares "server".
// NOTE(review): unlike unitPaths/integrationPaths above, these prefix checks do
// not normalize backslashes in singlePath — confirm behaviour on Windows.
const singlePath = allPaths.length === 1 ? allPaths[0] : null;
const coverageSuffix =
  singlePath &&
  singlePath.startsWith(`${repoRoot}/packages/server-v4/dist/tests/unit/`)
    ? `server-unit/${path.basename(singlePath).replace(/\.test\.js$/, "")}`
    : singlePath &&
        singlePath.startsWith(
          `${repoRoot}/packages/server-v4/dist/tests/integration/`,
        )
      ? `server-integration/${path
          .relative(integrationDir, singlePath)
          .replace(/\.test\.js$/, "")
          .replaceAll("\\", "/")}`
      : "server";

// NODE_V8_COVERAGE overrides the coverage root; test and server processes
// write to separate subdirectories.
const coverageRoot = resolveRepoRelative(
  process.env.NODE_V8_COVERAGE ?? `${repoRoot}/coverage/${coverageSuffix}`,
);
const testsCoverage = `${coverageRoot}/tests`;
const serverCoverage = `${coverageRoot}/server`;
fs.mkdirSync(testsCoverage, { recursive: true });
fs.mkdirSync(serverCoverage, { recursive: true });

// Reporter configuration: one reporter for the console, one written to a file.
const consoleReporter = process.env.NODE_TEST_CONSOLE_REPORTER ?? "spec";
const defaultReporter = process.env.NODE_TEST_REPORTER ?? "junit";
const envDestination = process.env.NODE_TEST_REPORTER_DESTINATION
  ? resolveRepoRelative(process.env.NODE_TEST_REPORTER_DESTINATION)
  : null;

/**
 * Builds the `node --test` reporter flags for a run and makes sure the report
 * file's directory exists.
 *
 * The file destination is NODE_TEST_REPORTER_DESTINATION when set, otherwise
 * ctrf/server-unit|server-integration/<testName>.xml, or all.xml when no test
 * name is given.
 *
 * @returns The reporter flags plus the resolved report file path.
 */
const reporterArgsFor = (kind: "unit" | "integration", testName?: string) => {
  const defaultDestination = () => {
    const group = kind === "unit" ? "server-unit" : "server-integration";
    const fileName = testName ? `${testName}.xml` : "all.xml";
    return `${repoRoot}/ctrf/${group}/${fileName}`;
  };

  const destination = envDestination ?? defaultDestination();
  ensureParentDir(destination);

  // Reporters and destinations pair up by position: console -> stdout, file -> destination.
  const args = [
    `--test-reporter=${consoleReporter}`,
    `--test-reporter=${defaultReporter}`,
    "--test-reporter-destination=stdout",
    `--test-reporter-destination=${destination}`,
  ];
  return { args, destination };
};

/**
 * Runs `node --test` synchronously on the given files with the extra and
 * reporter arguments, writing V8 coverage to the tests coverage directory.
 *
 * @returns The spawnSync result of the test process.
 */
const runNodeTests = (files: string[], reporterArgs: string[]) => {
  const nodeArgs = ["--test", ...extraArgs, ...reporterArgs, ...files];
  const env = {
    ...process.env,
    NODE_OPTIONS: nodeOptions,
    NODE_V8_COVERAGE: testsCoverage,
  };
  return spawnSync(process.execPath, nodeArgs, { stdio: "inherit", env });
};

/**
 * Polls `url` until it answers with a 2xx status or the timeout elapses.
 *
 * Each attempt is aborted after 2 seconds, and failed attempts are retried
 * once per second.
 *
 * @param url       URL to probe with GET requests.
 * @param timeoutMs Total time to keep trying, in milliseconds.
 * @returns true as soon as a request succeeds, false when the timeout elapses
 *          first.
 */
const waitForServer = async (url: string, timeoutMs = 30_000) => {
  const start = Date.now();
  while (Date.now() - start < timeoutMs) {
    const controller = new AbortController();
    const timer = setTimeout(() => controller.abort(), 2_000);
    try {
      const res = await fetch(url, { signal: controller.signal });
      if (res.ok) return true;
    } catch {
      // Connection refused, aborted, etc.: retry below.
    } finally {
      // Always release the abort timer, including when fetch rejects, so
      // failed attempts do not leave pending timers behind.
      clearTimeout(timer);
    }
    await new Promise((resolve) => setTimeout(resolve, 1_000));
  }
  return false;
};

/**
 * Starts the server under test according to `serverTarget`.
 *
 * - "remote": nothing is started; returns null.
 * - "local": runs dist/server.js with the current Node binary.
 * - anything else: runs the SEA binary from dist/sea, exiting the process with
 *   status 1 if it does not exist.
 *
 * @returns The spawned child process, or null for the remote target.
 */
const startServer = async () => {
  if (serverTarget === "remote") return null;

  if (serverTarget === "local") {
    const serverScript = `${repoRoot}/packages/server-v4/dist/server.js`;
    return spawn(process.execPath, [serverScript], {
      stdio: "inherit",
      env: {
        ...process.env,
        NODE_ENV: "development",
        NODE_OPTIONS: nodeOptions,
        NODE_V8_COVERAGE: serverCoverage,
      },
    });
  }

  // SEA target: SEA_BINARY_NAME overrides the host-derived default file name.
  const exeSuffix = process.platform === "win32" ? ".exe" : "";
  const defaultName = `stagehand-server-v4-${process.platform}-${process.arch}${exeSuffix}`;
  const binaryFile = process.env.SEA_BINARY_NAME ?? defaultName;
  const seaBinary = `${repoRoot}/packages/server-v4/dist/sea/${binaryFile}`;

  if (!fs.existsSync(seaBinary)) {
    console.error(`SEA binary not found at ${seaBinary}`);
    process.exit(1);
  }

  const seaCacheDir =
    process.env.STAGEHAND_SEA_CACHE_DIR ?? `${repoRoot}/.stagehand-sea`;
  return spawn(seaBinary, ["--node-options=--no-lazy --enable-source-maps"], {
    stdio: "inherit",
    env: {
      ...process.env,
      NODE_ENV: "production",
      NODE_V8_COVERAGE: serverCoverage,
      STAGEHAND_SEA_CACHE_DIR: seaCacheDir,
    },
  });
};

// Orchestration: unit tests first, then (only if they passed) integration
// tests against a freshly started server; finally stop the server and exit
// with the last recorded status.
let serverProc: ReturnType<typeof spawn> | null = null;
let status = 0;

if (unitPaths.length > 0) {
  // A single selected test gets its own report file; otherwise "all.xml".
  const unitName =
    unitPaths.length === 1 ? toTestName(unitPaths[0], unitDir) : undefined;
  const reporter = reporterArgsFor("unit", unitName);
  const result = runNodeTests(unitPaths, reporter.args);
  // A null exit status (e.g. killed by a signal) counts as failure.
  status = result.status ?? 1;
  writeCtrfFromJunit(reporter.destination, "node-test");
}

if (status === 0 && integrationPaths.length > 0) {
  serverProc = await startServer();
  const ready = await waitForServer(`${process.env.STAGEHAND_API_URL}/healthz`);
  if (!ready) {
    console.error("Server failed to start within 30 seconds.");
    status = 1;
  } else {
    const integrationName =
      integrationPaths.length === 1
        ? toTestName(integrationPaths[0], integrationDir)
        : undefined;
    const reporter = reporterArgsFor("integration", integrationName);
    const result = runNodeTests(integrationPaths, reporter.args);
    status = result.status ?? 1;
    writeCtrfFromJunit(reporter.destination, "node-test");
  }
}

if (serverProc) {
  // Ask the server to stop, then wait for its exit for at most 10 seconds.
  serverProc.kill("SIGTERM");
  await new Promise<void>((resolve) => {
    if (serverProc?.exitCode !== null) return resolve();
    const timer = setTimeout(resolve, 10_000);
    serverProc?.once("exit", () => {
      clearTimeout(timer);
      resolve();
    });
  });
  // NOTE(review): unconditional 5s pause after shutdown — presumably to let
  // the server's coverage output finish writing; confirm it is still needed.
  await new Promise((resolve) => setTimeout(resolve, 5_000));
}

process.exit(status);


================================================
FILE: packages/server-v4/src/routes/healthcheck.ts
================================================
import type { RouteOptions } from "fastify";
import { z } from "zod/v4";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

/**
 * Schema of the 200 response body: a strict object carrying string `status`
 * and `timestamp` fields.
 */
const healthcheckResponseSchema = z
  .object({
    status: z.string(),
    timestamp: z.string(),
  })
  .strict();

/**
 * Route definition for `GET /healthz`.
 *
 * The handler takes no input and answers with `status: "ok"` plus the current
 * time as an ISO-8601 string.
 */
const healthcheckRoute: RouteOptions = {
  method: "GET",
  url: "/healthz",
  logLevel: "silent",
  schema: {
    hide: true, // Hide from OpenAPI spec - utility endpoint
    response: { 200: healthcheckResponseSchema },
  } satisfies FastifyZodOpenApiSchema,
  handler: async () => {
    const timestamp = new Date().toISOString();
    return { status: "ok", timestamp };
  },
};

export default healthcheckRoute;


================================================
FILE: packages/server-v4/src/routes/readiness.ts
================================================
import type { RouteOptions } from "fastify";
import { StatusCodes } from "http-status-codes";
import { z } from "zod/v4";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

// Module-level readiness flag. It starts out false and is only changed through
// the setters below.
let isReady = false;

// Single write path for the readiness flag, shared by both public setters.
const updateReadiness = (next: boolean): void => {
  isReady = next;
};

/**
 * Read the current readiness flag.
 * @returns `true` once `setReady` has been called and `setUnready` has not
 * been called since; `false` otherwise.
 */
export const getIsReady = (): boolean => isReady;

/**
 * Flip the readiness flag on, marking the server as ready to accept requests.
 */
export const setReady = (): void => updateReadiness(true);

/**
 * Flip the readiness flag off, marking the server as not ready.
 * Used during graceful shutdown to stop accepting new requests.
 */
export const setUnready = (): void => updateReadiness(false);

/**
 * Schema attached to `GET /readyz`: both the 200 and the 503 response bodies
 * are plain strings.
 */
const readinessRouteSchema = {
  hide: true, // Hide from OpenAPI spec - utility endpoint
  response: {
    200: z.string(),
    503: z.string(),
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Route definition for `GET /readyz`.
 *
 * Replies 200 `"Ready"` while the module-level `isReady` flag is set, and
 * 503 `"Service Unavailable"` otherwise.
 */
const readinessRoute: RouteOptions = {
  method: "GET",
  url: "/readyz",
  logLevel: "silent",
  schema: readinessRouteSchema,
  handler: async (_request, reply) =>
    isReady
      ? reply.code(StatusCodes.OK).send("Ready")
      : reply.code(StatusCodes.SERVICE_UNAVAILABLE).send("Service Unavailable"),
};

export default readinessRoute;


================================================
FILE: packages/server-v4/src/routes/v4/browsersession/_id/end.ts
================================================
import type { RouteHandlerMethod, RouteOptions } from "fastify";
import { StatusCodes } from "http-status-codes";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  BrowserSessionEndRequestSchema,
  BrowserSessionHeadersSchema,
  BrowserSessionIdParamsSchema,
  BrowserSessionResponseSchema,
  type BrowserSessionIdParams,
} from "../../../../schemas/v4/browserSession.js";
import { buildBrowserSession } from "../shared.js";

/**
 * Handler for ending a browser session.
 *
 * Echoes the `id` path parameter back inside a fixed, stubbed session record
 * with status `"ended"`, parsed through `BrowserSessionResponseSchema` before
 * it is sent with a 200 status.
 */
const endBrowserSessionHandler: RouteHandlerMethod = async (request, reply) => {
  const routeParams = request.params as BrowserSessionIdParams;

  const browserSession = buildBrowserSession({
    id: routeParams.id,
    env: "LOCAL",
    status: "ended",
    modelName: "stub/model",
    cdpUrl: "ws://stub.invalid/devtools/browser/stub",
    available: false,
  });

  const payload = BrowserSessionResponseSchema.parse({
    success: true,
    data: { browserSession },
  });

  return reply.status(StatusCodes.OK).send(payload);
};

/**
 * Schema attached to `POST /browsersession/:id/end`: headers, path params,
 * request body and the 200 response.
 */
const endBrowserSessionRouteSchema = {
  operationId: "BrowserSessionEnd",
  summary: "End a browser session",
  headers: BrowserSessionHeadersSchema,
  params: BrowserSessionIdParamsSchema,
  body: BrowserSessionEndRequestSchema,
  response: {
    200: BrowserSessionResponseSchema,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Route definition for `POST /browsersession/:id/end`, served by
 * `endBrowserSessionHandler`.
 */
const endBrowserSessionRoute: RouteOptions = {
  method: "POST",
  url: "/browsersession/:id/end",
  schema: endBrowserSessionRouteSchema,
  handler: endBrowserSessionHandler,
};

export default endBrowserSessionRoute;


================================================
FILE: packages/server-v4/src/routes/v4/browsersession/_id/index.ts
================================================
import type { RouteHandlerMethod, RouteOptions } from "fastify";
import { StatusCodes } from "http-status-codes";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  BrowserSessionHeadersSchema,
  BrowserSessionIdParamsSchema,
  BrowserSessionResponseSchema,
  type BrowserSessionIdParams,
} from "../../../../schemas/v4/browserSession.js";
import { buildBrowserSession } from "../shared.js";

/**
 * Handler for reading a browser session's status.
 *
 * Echoes the `id` path parameter back inside a fixed, stubbed session record
 * with status `"running"`, parsed through `BrowserSessionResponseSchema`
 * before it is sent with a 200 status.
 */
const getBrowserSessionHandler: RouteHandlerMethod = async (request, reply) => {
  const routeParams = request.params as BrowserSessionIdParams;

  const browserSession = buildBrowserSession({
    id: routeParams.id,
    env: "LOCAL",
    status: "running",
    modelName: "stub/model",
    cdpUrl: "ws://stub.invalid/devtools/browser/stub",
    available: false,
  });

  const payload = BrowserSessionResponseSchema.parse({
    success: true,
    data: { browserSession },
  });

  return reply.status(StatusCodes.OK).send(payload);
};

/**
 * Schema attached to `GET /browsersession/:id`: headers, path params and the
 * 200 response.
 */
const getBrowserSessionRouteSchema = {
  operationId: "BrowserSessionStatus",
  summary: "Get browser session status",
  headers: BrowserSessionHeadersSchema,
  params: BrowserSessionIdParamsSchema,
  response: {
    200: BrowserSessionResponseSchema,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Route definition for `GET /browsersession/:id`, served by
 * `getBrowserSessionHandler`.
 */
const getBrowserSessionRoute: RouteOptions = {
  method: "GET",
  url: "/browsersession/:id",
  schema: getBrowserSessionRouteSchema,
  handler: getBrowserSessionHandler,
};

export default getBrowserSessionRoute;


================================================
FILE: packages/server-v4/src/routes/v4/browsersession/action/_actionId.ts
================================================
import type { RouteOptions } from "fastify";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  BrowserSessionActionDetailsQuerySchema,
  BrowserSessionActionDetailsResponseSchema,
  BrowserSessionActionIdParamsSchema,
  BrowserSessionHeadersSchema,
} from "../../../../schemas/v4/browserSession.js";
import {
  browserSessionActionDetailsHandler,
  browserSessionActionErrorResponses,
} from "../shared.js";

/**
 * Schema attached to `GET /browsersession/action/:actionId`: headers, path
 * params, query string, the 200 response and the shared action error
 * responses.
 */
const browserSessionActionDetailsRouteSchema = {
  operationId: "BrowserSessionActionDetails",
  summary: "browserSession.action",
  headers: BrowserSessionHeadersSchema,
  params: BrowserSessionActionIdParamsSchema,
  querystring: BrowserSessionActionDetailsQuerySchema,
  response: {
    200: BrowserSessionActionDetailsResponseSchema,
    ...browserSessionActionErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Route definition for `GET /browsersession/action/:actionId`, served by the
 * shared `browserSessionActionDetailsHandler`.
 */
const browserSessionActionDetailsRoute: RouteOptions = {
  method: "GET",
  url: "/browsersession/action/:actionId",
  schema: browserSessionActionDetailsRouteSchema,
  handler: browserSessionActionDetailsHandler,
};

export default browserSessionActionDetailsRoute;


================================================
FILE: packages/server-v4/src/routes/v4/browsersession/action/index.ts
================================================
import type { RouteOptions } from "fastify";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  BrowserSessionActionListQuerySchema,
  BrowserSessionActionListResponseSchema,
  BrowserSessionHeadersSchema,
} from "../../../../schemas/v4/browserSession.js";
import {
  browserSessionActionErrorResponses,
  browserSessionActionListHandler,
} from "../shared.js";

/**
 * Schema attached to `GET /browsersession/action`: headers, query string, the
 * 200 response and the shared action error responses.
 */
const browserSessionActionListRouteSchema = {
  operationId: "BrowserSessionActionList",
  summary: "browserSession.actions",
  headers: BrowserSessionHeadersSchema,
  querystring: BrowserSessionActionListQuerySchema,
  response: {
    200: BrowserSessionActionListResponseSchema,
    ...browserSessionActionErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Route definition for `GET /browsersession/action`, served by the shared
 * `browserSessionActionListHandler`.
 */
const browserSessionActionListRoute: RouteOptions = {
  method: "GET",
  url: "/browsersession/action",
  schema: browserSessionActionListRouteSchema,
  handler: browserSessionActionListHandler,
};

export default browserSessionActionListRoute;


================================================
FILE: packages/server-v4/src/routes/v4/browsersession/activePage.ts
================================================
import type { RouteOptions } from "fastify";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  BrowserSessionActivePageActionSchema,
  BrowserSessionOptionalPageResultSchema,
  BrowserSessionActivePageRequestSchema,
  BrowserSessionActivePageResponseSchema,
  BrowserSessionHeadersSchema,
} from "../../../schemas/v4/browserSession.js";
import {
  browserSessionActionErrorResponses,
  buildStubBrowserSessionPage,
  createBrowserSessionActionHandler,
} from "./shared.js";

/**
 * Schema attached to `POST /browsersession/activePage`: headers, request body,
 * the 200 response and the shared action error responses.
 */
const activePageRouteSchema = {
  operationId: "BrowserSessionActivePage",
  summary: "browserSession.activePage",
  headers: BrowserSessionHeadersSchema,
  body: BrowserSessionActivePageRequestSchema,
  response: {
    200: BrowserSessionActivePageResponseSchema,
    ...browserSessionActionErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Route definition for `POST /browsersession/activePage`.
 *
 * The handler is produced by `createBrowserSessionActionHandler` for the
 * `"activePage"` method. Its `execute` callback builds a page with
 * `buildStubBrowserSessionPage(sessionId)` and returns that page's id together
 * with the page parsed through `BrowserSessionOptionalPageResultSchema`.
 */
const activePageRoute: RouteOptions = {
  method: "POST",
  url: "/browsersession/activePage",
  schema: activePageRouteSchema,
  handler: createBrowserSessionActionHandler({
    method: "activePage",
    actionSchema: BrowserSessionActivePageActionSchema,
    execute: async ({ sessionId }) => {
      const stubPage = buildStubBrowserSessionPage(sessionId);
      const result = BrowserSessionOptionalPageResultSchema.parse({
        page: stubPage,
      });
      return { pageId: stubPage.pageId, result };
    },
  }),
};

export default activePageRoute;


================================================
FILE: packages/server-v4/src/routes/v4/browsersession/addCookies.ts
================================================
import type { RouteOptions } from "fastify";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  BrowserSessionAddCookiesActionSchema,
  BrowserSessionAddCookiesResultSchema,
  BrowserSessionAddCookiesRequestSchema,
  BrowserSessionAddCookiesResponseSchema,
  BrowserSessionHeadersSchema,
} from "../../../schemas/v4/browserSession.js";
import {
  browserSessionActionErrorResponses,
  createBrowserSessionActionHandler,
} from "./shared.js";

/**
 * Schema attached to `POST /browsersession/addCookies`: headers, request body,
 * the 200 response and the shared action error responses.
 */
const addCookiesRouteSchema = {
  operationId: "BrowserSessionAddCookies",
  summary: "browserSession.addCookies",
  headers: BrowserSessionHeadersSchema,
  body: BrowserSessionAddCookiesRequestSchema,
  response: {
    200: BrowserSessionAddCookiesResponseSchema,
    ...browserSessionActionErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Route definition for `POST /browsersession/addCookies`.
 *
 * The handler is produced by `createBrowserSessionActionHandler` for the
 * `"addCookies"` method. Its `execute` callback reports the number of cookies
 * supplied in `params.cookies` as `added`.
 */
const addCookiesRoute: RouteOptions = {
  method: "POST",
  url: "/browsersession/addCookies",
  schema: addCookiesRouteSchema,
  handler: createBrowserSessionActionHandler({
    method: "addCookies",
    actionSchema: BrowserSessionAddCookiesActionSchema,
    execute: async ({ params }) => {
      const added = params.cookies.length;
      return {
        result: BrowserSessionAddCookiesResultSchema.parse({ added }),
      };
    },
  }),
};

export default addCookiesRoute;


================================================
FILE: packages/server-v4/src/routes/v4/browsersession/addInitScript.ts
================================================
import type { RouteOptions } from "fastify";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  BrowserSessionAddInitScriptActionSchema,
  BrowserSessionAddInitScriptResultSchema,
  BrowserSessionAddInitScriptRequestSchema,
  BrowserSessionAddInitScriptResponseSchema,
  BrowserSessionHeadersSchema,
} from "../../../schemas/v4/browserSession.js";
import {
  browserSessionActionErrorResponses,
  createBrowserSessionActionHandler,
} from "./shared.js";

/**
 * Schema attached to `POST /browsersession/addInitScript`: headers, request
 * body, the 200 response and the shared action error responses.
 */
const addInitScriptRouteSchema = {
  operationId: "BrowserSessionAddInitScript",
  summary: "browserSession.addInitScript",
  headers: BrowserSessionHeadersSchema,
  body: BrowserSessionAddInitScriptRequestSchema,
  response: {
    200: BrowserSessionAddInitScriptResponseSchema,
    ...browserSessionActionErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Route definition for `POST /browsersession/addInitScript`.
 *
 * The handler is produced by `createBrowserSessionActionHandler` for the
 * `"addInitScript"` method. Its `execute` callback ignores its input and
 * always reports `added: true`.
 */
const addInitScriptRoute: RouteOptions = {
  method: "POST",
  url: "/browsersession/addInitScript",
  schema: addInitScriptRouteSchema,
  handler: createBrowserSessionActionHandler({
    method: "addInitScript",
    actionSchema: BrowserSessionAddInitScriptActionSchema,
    execute: async () => ({
      result: BrowserSessionAddInitScriptResultSchema.parse({ added: true }),
    }),
  }),
};

export default addInitScriptRoute;


================================================
FILE: packages/server-v4/src/routes/v4/browsersession/awaitActivePage.ts
================================================
import type { RouteOptions } from "fastify";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  BrowserSessionAwaitActivePageActionSchema,
  BrowserSessionPageResultSchema,
  BrowserSessionAwaitActivePageRequestSchema,
  BrowserSessionAwaitActivePageResponseSchema,
  BrowserSessionHeadersSchema,
} from "../../../schemas/v4/browserSession.js";
import {
  browserSessionActionErrorResponses,
  buildStubBrowserSessionPage,
  createBrowserSessionActionHandler,
} from "./shared.js";

/**
 * Schema attached to `POST /browsersession/awaitActivePage`: headers, request
 * body, the 200 response and the shared action error responses.
 */
const awaitActivePageRouteSchema = {
  operationId: "BrowserSessionAwaitActivePage",
  summary: "browserSession.awaitActivePage",
  headers: BrowserSessionHeadersSchema,
  body: BrowserSessionAwaitActivePageRequestSchema,
  response: {
    200: BrowserSessionAwaitActivePageResponseSchema,
    ...browserSessionActionErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Route definition for `POST /browsersession/awaitActivePage`.
 *
 * The handler is produced by `createBrowserSessionActionHandler` for the
 * `"awaitActivePage"` method. Its `execute` callback builds a page with
 * `buildStubBrowserSessionPage(sessionId)` and returns that page's id together
 * with the page parsed through `BrowserSessionPageResultSchema`.
 */
const awaitActivePageRoute: RouteOptions = {
  method: "POST",
  url: "/browsersession/awaitActivePage",
  schema: awaitActivePageRouteSchema,
  handler: createBrowserSessionActionHandler({
    method: "awaitActivePage",
    actionSchema: BrowserSessionAwaitActivePageActionSchema,
    execute: async ({ sessionId }) => {
      const stubPage = buildStubBrowserSessionPage(sessionId);
      const result = BrowserSessionPageResultSchema.parse({ page: stubPage });
      return { pageId: stubPage.pageId, result };
    },
  }),
};

export default awaitActivePageRoute;


================================================
FILE: packages/server-v4/src/routes/v4/browsersession/browserbaseDebugURL.ts
================================================
import type { RouteOptions } from "fastify";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  BrowserSessionBrowserbaseDebugURLActionSchema,
  BrowserSessionBrowserbaseDebugURLResultSchema,
  BrowserSessionBrowserbaseDebugURLRequestSchema,
  BrowserSessionBrowserbaseDebugURLResponseSchema,
  BrowserSessionHeadersSchema,
} from "../../../schemas/v4/browserSession.js";
import {
  browserSessionActionErrorResponses,
  createBrowserSessionActionHandler,
} from "./shared.js";

/**
 * Schema attached to `POST /browsersession/browserbaseDebugURL`: headers,
 * request body, the 200 response and the shared action error responses.
 */
const browserbaseDebugURLRouteSchema = {
  operationId: "BrowserSessionBrowserbaseDebugURL",
  summary: "browserSession.browserbaseDebugURL",
  headers: BrowserSessionHeadersSchema,
  body: BrowserSessionBrowserbaseDebugURLRequestSchema,
  response: {
    200: BrowserSessionBrowserbaseDebugURLResponseSchema,
    ...browserSessionActionErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Route definition for `POST /browsersession/browserbaseDebugURL`.
 *
 * The handler is produced by `createBrowserSessionActionHandler` for the
 * `"browserbaseDebugURL"` method. Its `execute` callback ignores its input and
 * always returns a fixed placeholder URL.
 */
const browserbaseDebugURLRoute: RouteOptions = {
  method: "POST",
  url: "/browsersession/browserbaseDebugURL",
  schema: browserbaseDebugURLRouteSchema,
  handler: createBrowserSessionActionHandler({
    method: "browserbaseDebugURL",
    actionSchema: BrowserSessionBrowserbaseDebugURLActionSchema,
    execute: async () => ({
      result: BrowserSessionBrowserbaseDebugURLResultSchema.parse({
        browserbaseDebugURL: "https://stub.invalid/debug",
      }),
    }),
  }),
};

export default browserbaseDebugURLRoute;


================================================
FILE: packages/server-v4/src/routes/v4/browsersession/browserbaseSessionID.ts
================================================
import type { RouteOptions } from "fastify";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  BrowserSessionBrowserbaseSessionIDActionSchema,
  BrowserSessionBrowserbaseSessionIDResultSchema,
  BrowserSessionBrowserbaseSessionIDRequestSchema,
  BrowserSessionBrowserbaseSessionIDResponseSchema,
  BrowserSessionHeadersSchema,
} from "../../../schemas/v4/browserSession.js";
import {
  browserSessionActionErrorResponses,
  createBrowserSessionActionHandler,
} from "./shared.js";

/**
 * Schema attached to `POST /browsersession/browserbaseSessionID`: headers,
 * request body, the 200 response and the shared action error responses.
 */
const browserbaseSessionIDRouteSchema = {
  operationId: "BrowserSessionBrowserbaseSessionID",
  summary: "browserSession.browserbaseSessionID",
  headers: BrowserSessionHeadersSchema,
  body: BrowserSessionBrowserbaseSessionIDRequestSchema,
  response: {
    200: BrowserSessionBrowserbaseSessionIDResponseSchema,
    ...browserSessionActionErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Route definition for `POST /browsersession/browserbaseSessionID`.
 *
 * The handler is produced by `createBrowserSessionActionHandler` for the
 * `"browserbaseSessionID"` method. Its `execute` callback ignores its input
 * and always returns a fixed placeholder session id.
 */
const browserbaseSessionIDRoute: RouteOptions = {
  method: "POST",
  url: "/browsersession/browserbaseSessionID",
  schema: browserbaseSessionIDRouteSchema,
  handler: createBrowserSessionActionHandler({
    method: "browserbaseSessionID",
    actionSchema: BrowserSessionBrowserbaseSessionIDActionSchema,
    execute: async () => ({
      result: BrowserSessionBrowserbaseSessionIDResultSchema.parse({
        browserbaseSessionID: "bb_session_stub",
      }),
    }),
  }),
};

export default browserbaseSessionIDRoute;


================================================
FILE: packages/server-v4/src/routes/v4/browsersession/browserbaseSessionURL.ts
================================================
import type { RouteOptions } from "fastify";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  BrowserSessionBrowserbaseSessionURLActionSchema,
  BrowserSessionBrowserbaseSessionURLResultSchema,
  BrowserSessionBrowserbaseSessionURLRequestSchema,
  BrowserSessionBrowserbaseSessionURLResponseSchema,
  BrowserSessionHeadersSchema,
} from "../../../schemas/v4/browserSession.js";
import {
  browserSessionActionErrorResponses,
  createBrowserSessionActionHandler,
} from "./shared.js";

/**
 * Schema attached to `POST /browsersession/browserbaseSessionURL`: headers,
 * request body, the 200 response and the shared action error responses.
 */
const browserbaseSessionURLRouteSchema = {
  operationId: "BrowserSessionBrowserbaseSessionURL",
  summary: "browserSession.browserbaseSessionURL",
  headers: BrowserSessionHeadersSchema,
  body: BrowserSessionBrowserbaseSessionURLRequestSchema,
  response: {
    200: BrowserSessionBrowserbaseSessionURLResponseSchema,
    ...browserSessionActionErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Route definition for `POST /browsersession/browserbaseSessionURL`.
 *
 * The handler is produced by `createBrowserSessionActionHandler` for the
 * `"browserbaseSessionURL"` method. Its `execute` callback ignores its input
 * and always returns a fixed placeholder session URL.
 */
const browserbaseSessionURLRoute: RouteOptions = {
  method: "POST",
  url: "/browsersession/browserbaseSessionURL",
  schema: browserbaseSessionURLRouteSchema,
  handler: createBrowserSessionActionHandler({
    method: "browserbaseSessionURL",
    actionSchema: BrowserSessionBrowserbaseSessionURLActionSchema,
    execute: async () => ({
      result: BrowserSessionBrowserbaseSessionURLResultSchema.parse({
        browserbaseSessionURL: "https://browserbase.com/sessions/stub",
      }),
    }),
  }),
};

export default browserbaseSessionURLRoute;


================================================
FILE: packages/server-v4/src/routes/v4/browsersession/clearCookies.ts
================================================
import type { RouteOptions } from "fastify";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  BrowserSessionClearCookiesActionSchema,
  BrowserSessionClearCookiesResultSchema,
  BrowserSessionClearCookiesRequestSchema,
  BrowserSessionClearCookiesResponseSchema,
  BrowserSessionHeadersSchema,
} from "../../../schemas/v4/browserSession.js";
import {
  browserSessionActionErrorResponses,
  createBrowserSessionActionHandler,
} from "./shared.js";

/**
 * Schema attached to `POST /browsersession/clearCookies`: headers, request
 * body, the 200 response and the shared action error responses.
 */
const clearCookiesRouteSchema = {
  operationId: "BrowserSessionClearCookies",
  summary: "browserSession.clearCookies",
  headers: BrowserSessionHeadersSchema,
  body: BrowserSessionClearCookiesRequestSchema,
  response: {
    200: BrowserSessionClearCookiesResponseSchema,
    ...browserSessionActionErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Route definition for `POST /browsersession/clearCookies`.
 *
 * The handler is produced by `createBrowserSessionActionHandler` for the
 * `"clearCookies"` method. Its `execute` callback ignores its input and always
 * reports `cleared: true`.
 */
const clearCookiesRoute: RouteOptions = {
  method: "POST",
  url: "/browsersession/clearCookies",
  schema: clearCookiesRouteSchema,
  handler: createBrowserSessionActionHandler({
    method: "clearCookies",
    actionSchema: BrowserSessionClearCookiesActionSchema,
    execute: async () => ({
      result: BrowserSessionClearCookiesResultSchema.parse({ cleared: true }),
    }),
  }),
};

export default clearCookiesRoute;


================================================
FILE: packages/server-v4/src/routes/v4/browsersession/configuredViewport.ts
================================================
import type { RouteOptions } from "fastify";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  BrowserSessionConfiguredViewportActionSchema,
  BrowserSessionConfiguredViewportResultSchema,
  BrowserSessionConfiguredViewportRequestSchema,
  BrowserSessionConfiguredViewportResponseSchema,
  BrowserSessionHeadersSchema,
} from "../../../schemas/v4/browserSession.js";
import {
  buildStubViewport,
  browserSessionActionErrorResponses,
  createBrowserSessionActionHandler,
} from "./shared.js";

/**
 * Schema attached to `POST /browsersession/configuredViewport`: headers,
 * request body, the 200 response and the shared action error responses.
 */
const configuredViewportRouteSchema = {
  operationId: "BrowserSessionConfiguredViewport",
  summary: "browserSession.configuredViewport",
  headers: BrowserSessionHeadersSchema,
  body: BrowserSessionConfiguredViewportRequestSchema,
  response: {
    200: BrowserSessionConfiguredViewportResponseSchema,
    ...browserSessionActionErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Route definition for `POST /browsersession/configuredViewport`.
 *
 * The handler is produced by `createBrowserSessionActionHandler` for the
 * `"configuredViewport"` method. Its `execute` callback ignores its input and
 * returns whatever `buildStubViewport()` yields, parsed through
 * `BrowserSessionConfiguredViewportResultSchema`.
 */
const configuredViewportRoute: RouteOptions = {
  method: "POST",
  url: "/browsersession/configuredViewport",
  schema: configuredViewportRouteSchema,
  handler: createBrowserSessionActionHandler({
    method: "configuredViewport",
    actionSchema: BrowserSessionConfiguredViewportActionSchema,
    execute: async () => {
      const stubViewport = buildStubViewport();
      return {
        result: BrowserSessionConfiguredViewportResultSchema.parse(stubViewport),
      };
    },
  }),
};

export default configuredViewportRoute;


================================================
FILE: packages/server-v4/src/routes/v4/browsersession/connectURL.ts
================================================
import type { RouteOptions } from "fastify";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  BrowserSessionConnectURLActionSchema,
  BrowserSessionConnectURLResultSchema,
  BrowserSessionConnectURLRequestSchema,
  BrowserSessionConnectURLResponseSchema,
  BrowserSessionHeadersSchema,
} from "../../../schemas/v4/browserSession.js";
import {
  browserSessionActionErrorResponses,
  createBrowserSessionActionHandler,
} from "./shared.js";

/**
 * Schema attached to `POST /browsersession/connectURL`: headers, request body,
 * the 200 response and the shared action error responses.
 */
const connectURLRouteSchema = {
  operationId: "BrowserSessionConnectURL",
  summary: "browserSession.connectURL",
  headers: BrowserSessionHeadersSchema,
  body: BrowserSessionConnectURLRequestSchema,
  response: {
    200: BrowserSessionConnectURLResponseSchema,
    ...browserSessionActionErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Route definition for `POST /browsersession/connectURL`.
 *
 * The handler is produced by `createBrowserSessionActionHandler` for the
 * `"connectURL"` method. Its `execute` callback ignores its input and always
 * returns a fixed placeholder connect URL.
 */
const connectURLRoute: RouteOptions = {
  method: "POST",
  url: "/browsersession/connectURL",
  schema: connectURLRouteSchema,
  handler: createBrowserSessionActionHandler({
    method: "connectURL",
    actionSchema: BrowserSessionConnectURLActionSchema,
    execute: async () => ({
      result: BrowserSessionConnectURLResultSchema.parse({
        connectURL: "ws://stub.invalid/connect",
      }),
    }),
  }),
};

export default connectURLRoute;


================================================
FILE: packages/server-v4/src/routes/v4/browsersession/cookies.ts
================================================
import type { RouteOptions } from "fastify";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  BrowserSessionCookiesActionSchema,
  BrowserSessionCookiesResultSchema,
  BrowserSessionCookiesRequestSchema,
  BrowserSessionCookiesResponseSchema,
  BrowserSessionHeadersSchema,
} from "../../../schemas/v4/browserSession.js";
import {
  buildStubBrowserSessionCookie,
  browserSessionActionErrorResponses,
  createBrowserSessionActionHandler,
} from "./shared.js";

/**
 * Schema attached to `POST /browsersession/cookies`: headers, request body,
 * the 200 response and the shared action error responses.
 */
const cookiesRouteSchema = {
  operationId: "BrowserSessionCookies",
  summary: "browserSession.cookies",
  headers: BrowserSessionHeadersSchema,
  body: BrowserSessionCookiesRequestSchema,
  response: {
    200: BrowserSessionCookiesResponseSchema,
    ...browserSessionActionErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Route definition for `POST /browsersession/cookies`.
 *
 * The handler is produced by `createBrowserSessionActionHandler` for the
 * `"cookies"` method. Its `execute` callback ignores its input and returns a
 * one-element cookie list built by `buildStubBrowserSessionCookie()`.
 */
const cookiesRoute: RouteOptions = {
  method: "POST",
  url: "/browsersession/cookies",
  schema: cookiesRouteSchema,
  handler: createBrowserSessionActionHandler({
    method: "cookies",
    actionSchema: BrowserSessionCookiesActionSchema,
    execute: async () => {
      const cookies = [buildStubBrowserSessionCookie()];
      return {
        result: BrowserSessionCookiesResultSchema.parse({ cookies }),
      };
    },
  }),
};

export default cookiesRoute;


================================================
FILE: packages/server-v4/src/routes/v4/browsersession/getFullFrameTreeByMainFrameId.ts
================================================
import type { RouteOptions } from "fastify";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  BrowserSessionGetFullFrameTreeByMainFrameIdActionSchema,
  BrowserSessionFrameTreeResultSchema,
  BrowserSessionGetFullFrameTreeByMainFrameIdRequestSchema,
  BrowserSessionGetFullFrameTreeByMainFrameIdResponseSchema,
  BrowserSessionHeadersSchema,
} from "../../../schemas/v4/browserSession.js";
import {
  browserSessionActionErrorResponses,
  createBrowserSessionActionHandler,
} from "./shared.js";

/**
 * Schema attached to `POST /browsersession/getFullFrameTreeByMainFrameId`:
 * headers, request body, the 200 response and the shared action error
 * responses.
 */
const getFullFrameTreeByMainFrameIdRouteSchema = {
  operationId: "BrowserSessionGetFullFrameTreeByMainFrameId",
  summary: "browserSession.getFullFrameTreeByMainFrameId",
  headers: BrowserSessionHeadersSchema,
  body: BrowserSessionGetFullFrameTreeByMainFrameIdRequestSchema,
  response: {
    200: BrowserSessionGetFullFrameTreeByMainFrameIdResponseSchema,
    ...browserSessionActionErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Route definition for `POST /browsersession/getFullFrameTreeByMainFrameId`.
 *
 * The handler is produced by `createBrowserSessionActionHandler` for the
 * `"getFullFrameTreeByMainFrameId"` method. Its `execute` callback returns a
 * fixed page id and a frame tree that echoes `params.mainFrameId` with an
 * empty `children` list.
 */
const getFullFrameTreeByMainFrameIdRoute: RouteOptions = {
  method: "POST",
  url: "/browsersession/getFullFrameTreeByMainFrameId",
  schema: getFullFrameTreeByMainFrameIdRouteSchema,
  handler: createBrowserSessionActionHandler({
    method: "getFullFrameTreeByMainFrameId",
    actionSchema: BrowserSessionGetFullFrameTreeByMainFrameIdActionSchema,
    execute: async ({ params }) => {
      const frameTree = { mainFrameId: params.mainFrameId, children: [] };
      return {
        pageId: "page_stub",
        result: BrowserSessionFrameTreeResultSchema.parse({ frameTree }),
      };
    },
  }),
};

export default getFullFrameTreeByMainFrameIdRoute;


================================================
FILE: packages/server-v4/src/routes/v4/browsersession/index.ts
================================================
import type { RouteHandlerMethod, RouteOptions } from "fastify";
import { StatusCodes } from "http-status-codes";
import { type FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  BrowserSessionCreateRequestSchema,
  BrowserSessionErrorResponseSchema,
  BrowserSessionHeadersSchema,
  BrowserSessionResponseSchema,
  type BrowserSessionCreateRequest,
} from "../../../schemas/v4/browserSession.js";
import { buildBrowserSession } from "./shared.js";

/**
 * Handler for creating a browser session.
 *
 * Builds a stubbed session record (fixed id `"session_stub"`, status
 * `"running"`) that echoes the options supplied in the request body, parses it
 * through `BrowserSessionResponseSchema` and sends it with a 200 status.
 */
const createBrowserSessionHandler: RouteHandlerMethod = async (
  request,
  reply,
) => {
  const body = request.body as BrowserSessionCreateRequest;

  // Placeholder CDP endpoint used whenever the request does not provide one.
  const stubCdpUrl = "ws://stub.invalid/devtools/browser/stub";

  // Anything other than an explicit "BROWSERBASE" is treated as "LOCAL".
  const env = body.env === "BROWSERBASE" ? "BROWSERBASE" : "LOCAL";

  // These fields are only read when the key is present on the body.
  const cdpUrl = "cdpUrl" in body ? body.cdpUrl : undefined;
  const browserbaseSessionId =
    "browserbaseSessionId" in body ? body.browserbaseSessionId : undefined;
  const browserbaseSessionCreateParams =
    "browserbaseSessionCreateParams" in body
      ? body.browserbaseSessionCreateParams
      : undefined;
  const localBrowserLaunchOptions =
    "localBrowserLaunchOptions" in body
      ? body.localBrowserLaunchOptions
      : undefined;

  // A caller-supplied CDP URL is honoured only for LOCAL sessions.
  const resolvedCdpUrl =
    env !== "LOCAL" ? stubCdpUrl : (cdpUrl ?? stubCdpUrl);

  const browserSession = buildBrowserSession({
    id: "session_stub",
    env,
    status: "running",
    modelName: body.modelName,
    cdpUrl: resolvedCdpUrl,
    available: false,
    browserbaseSessionId,
    browserbaseSessionCreateParams,
    localBrowserLaunchOptions,
    domSettleTimeoutMs: body.domSettleTimeoutMs,
    verbose: body.verbose,
    systemPrompt: body.systemPrompt,
    selfHeal: body.selfHeal,
    waitForCaptchaSolves: body.waitForCaptchaSolves,
    experimental: body.experimental,
    actTimeoutMs: body.actTimeoutMs,
  });

  const payload = BrowserSessionResponseSchema.parse({
    success: true,
    data: { browserSession },
  });

  return reply.status(StatusCodes.OK).send(payload);
};

/**
 * Schema attached to `POST /browsersession`: headers, request body, the 200
 * response, and a shared error schema for the 400, 401 and 500 responses.
 */
const createBrowserSessionRouteSchema = {
  operationId: "BrowserSessionCreate",
  summary: "Create a browser session",
  headers: BrowserSessionHeadersSchema,
  body: BrowserSessionCreateRequestSchema,
  response: {
    200: BrowserSessionResponseSchema,
    400: BrowserSessionErrorResponseSchema,
    401: BrowserSessionErrorResponseSchema,
    500: BrowserSessionErrorResponseSchema,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Route definition for `POST /browsersession`, served by
 * `createBrowserSessionHandler`.
 */
const createBrowserSessionRoute: RouteOptions = {
  method: "POST",
  url: "/browsersession",
  schema: createBrowserSessionRouteSchema,
  handler: createBrowserSessionHandler,
};

export default createBrowserSessionRoute;


================================================
FILE: packages/server-v4/src/routes/v4/browsersession/newPage.ts
================================================
import type { RouteOptions } from "fastify";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  BrowserSessionHeadersSchema,
  BrowserSessionNewPageActionSchema,
  BrowserSessionPageResultSchema,
  BrowserSessionNewPageRequestSchema,
  BrowserSessionNewPageResponseSchema,
} from "../../../schemas/v4/browserSession.js";
import {
  browserSessionActionErrorResponses,
  buildStubBrowserSessionPage,
  createBrowserSessionActionHandler,
} from "./shared.js";

/**
 * Schema attached to `POST /browsersession/newPage`: headers, request body,
 * the 200 response and the shared action error responses.
 */
const newPageRouteSchema = {
  operationId: "BrowserSessionNewPage",
  summary: "browserSession.newPage",
  headers: BrowserSessionHeadersSchema,
  body: BrowserSessionNewPageRequestSchema,
  response: {
    200: BrowserSessionNewPageResponseSchema,
    ...browserSessionActionErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Route definition for `POST /browsersession/newPage`.
 *
 * The handler is produced by `createBrowserSessionActionHandler` for the
 * `"newPage"` method. Its `execute` callback builds a page with
 * `buildStubBrowserSessionPage`, passing `params.url` through as the `url`
 * option, and returns that page's id together with the page parsed through
 * `BrowserSessionPageResultSchema`.
 */
const newPageRoute: RouteOptions = {
  method: "POST",
  url: "/browsersession/newPage",
  schema: newPageRouteSchema,
  handler: createBrowserSessionActionHandler({
    method: "newPage",
    actionSchema: BrowserSessionNewPageActionSchema,
    execute: async ({ sessionId, params }) => {
      const stubPage = buildStubBrowserSessionPage(sessionId, {
        url: params.url,
      });
      const result = BrowserSessionPageResultSchema.parse({ page: stubPage });
      return { pageId: stubPage.pageId, result };
    },
  }),
};

export default newPageRoute;


================================================
FILE: packages/server-v4/src/routes/v4/browsersession/pages.ts
================================================
import type { RouteOptions } from "fastify";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  BrowserSessionHeadersSchema,
  BrowserSessionPagesActionSchema,
  BrowserSessionPagesResultSchema,
  BrowserSessionPagesRequestSchema,
  BrowserSessionPagesResponseSchema,
} from "../../../schemas/v4/browserSession.js";
import {
  buildStubBrowserSessionPage,
  browserSessionActionErrorResponses,
  createBrowserSessionActionHandler,
} from "./shared.js";

/**
 * Schema attached to `POST /browsersession/pages`: headers, request body, the
 * 200 response and the shared action error responses.
 */
const pagesRouteSchema = {
  operationId: "BrowserSessionPages",
  summary: "browserSession.pages",
  headers: BrowserSessionHeadersSchema,
  body: BrowserSessionPagesRequestSchema,
  response: {
    200: BrowserSessionPagesResponseSchema,
    ...browserSessionActionErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Route definition for `POST /browsersession/pages`.
 *
 * The handler is produced by `createBrowserSessionActionHandler` for the
 * `"pages"` method. Its `execute` callback returns a one-element page list
 * built by `buildStubBrowserSessionPage(sessionId)`.
 */
const pagesRoute: RouteOptions = {
  method: "POST",
  url: "/browsersession/pages",
  schema: pagesRouteSchema,
  handler: createBrowserSessionActionHandler({
    method: "pages",
    actionSchema: BrowserSessionPagesActionSchema,
    execute: async ({ sessionId }) => {
      const pages = [buildStubBrowserSessionPage(sessionId)];
      return {
        result: BrowserSessionPagesResultSchema.parse({ pages }),
      };
    },
  }),
};

export default pagesRoute;


================================================
FILE: packages/server-v4/src/routes/v4/browsersession/resolvePageByMainFrameId.ts
================================================
import type { RouteOptions } from "fastify";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  BrowserSessionHeadersSchema,
  BrowserSessionResolvePageByMainFrameIdActionSchema,
  BrowserSessionOptionalPageResultSchema,
  BrowserSessionResolvePageByMainFrameIdRequestSchema,
  BrowserSessionResolvePageByMainFrameIdResponseSchema,
} from "../../../schemas/v4/browserSession.js";
import {
  browserSessionActionErrorResponses,
  buildStubBrowserSessionPage,
  createBrowserSessionActionHandler,
} from "./shared.js";

/** Schemas for `POST /browsersession/resolvePageByMainFrameId`. */
const resolvePageByMainFrameIdRouteSchema = {
  operationId: "BrowserSessionResolvePageByMainFrameId",
  summary: "browserSession.resolvePageByMainFrameId",
  headers: BrowserSessionHeadersSchema,
  body: BrowserSessionResolvePageByMainFrameIdRequestSchema,
  response: {
    200: BrowserSessionResolvePageByMainFrameIdResponseSchema,
    ...browserSessionActionErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Route definition for `browserSession.resolvePageByMainFrameId`.
 *
 * The execute callback reads only the session id (the request params are not
 * consulted) and returns the stub page together with that page's id.
 */
const resolvePageByMainFrameIdRoute: RouteOptions = {
  method: "POST",
  url: "/browsersession/resolvePageByMainFrameId",
  schema: resolvePageByMainFrameIdRouteSchema,
  handler: createBrowserSessionActionHandler({
    method: "resolvePageByMainFrameId",
    actionSchema: BrowserSessionResolvePageByMainFrameIdActionSchema,
    execute: async (ctx) => {
      const stubPage = buildStubBrowserSessionPage(ctx.sessionId);
      const result = BrowserSessionOptionalPageResultSchema.parse({
        page: stubPage,
      });
      return { pageId: stubPage.pageId, result };
    },
  }),
};

export default resolvePageByMainFrameIdRoute;


================================================
FILE: packages/server-v4/src/routes/v4/browsersession/routes.ts
================================================
import type { FastifyPluginCallback, RouteOptions } from "fastify";

import browserSessionActionDetailsRoute from "./action/_actionId.js";
import browserSessionActionListRoute from "./action/index.js";
import activePageRoute from "./activePage.js";
import addCookiesRoute from "./addCookies.js";
import addInitScriptRoute from "./addInitScript.js";
import awaitActivePageRoute from "./awaitActivePage.js";
import browserbaseDebugURLRoute from "./browserbaseDebugURL.js";
import browserbaseSessionIDRoute from "./browserbaseSessionID.js";
import browserbaseSessionURLRoute from "./browserbaseSessionURL.js";
import clearCookiesRoute from "./clearCookies.js";
import configuredViewportRoute from "./configuredViewport.js";
import connectURLRoute from "./connectURL.js";
import cookiesRoute from "./cookies.js";
import endBrowserSessionRoute from "./_id/end.js";
import getBrowserSessionRoute from "./_id/index.js";
import getFullFrameTreeByMainFrameIdRoute from "./getFullFrameTreeByMainFrameId.js";
import createBrowserSessionRoute from "./index.js";
import newPageRoute from "./newPage.js";
import pagesRoute from "./pages.js";
import resolvePageByMainFrameIdRoute from "./resolvePageByMainFrameId.js";
import setExtraHTTPHeadersRoute from "./setExtraHTTPHeaders.js";
import { buildBrowserSessionErrorResponse } from "../../../schemas/v4/browserSession.js";
import { normalizePluginError, withTag } from "../pluginUtils.js";

/**
 * Every browserSession route definition imported by this module, before
 * tagging. `browserSessionRoutes` is derived from this list with `map`, so the
 * order here is the order in which the plugin registers the routes.
 */
const rawBrowserSessionRoutes: RouteOptions[] = [
  createBrowserSessionRoute,
  getBrowserSessionRoute,
  endBrowserSessionRoute,
  addInitScriptRoute,
  setExtraHTTPHeadersRoute,
  pagesRoute,
  activePageRoute,
  awaitActivePageRoute,
  resolvePageByMainFrameIdRoute,
  getFullFrameTreeByMainFrameIdRoute,
  newPageRoute,
  cookiesRoute,
  addCookiesRoute,
  clearCookiesRoute,
  connectURLRoute,
  configuredViewportRoute,
  browserbaseSessionIDRoute,
  browserbaseSessionURLRoute,
  browserbaseDebugURLRoute,
  browserSessionActionListRoute,
  browserSessionActionDetailsRoute,
];

/**
 * The browserSession routes, each passed through `withTag` with the
 * `"browserSession"` tag. Same length and order as `rawBrowserSessionRoutes`.
 */
export const browserSessionRoutes: RouteOptions[] = Array.from(
  rawBrowserSessionRoutes,
  (untagged) => withTag(untagged, "browserSession"),
);

/**
 * Fastify plugin that installs the browserSession error handler and registers
 * every entry of `browserSessionRoutes` on the given instance.
 *
 * The error handler normalizes the thrown error with `normalizePluginError`
 * and replies with the body built by `buildBrowserSessionErrorResponse`, using
 * the normalized status code as the HTTP status.
 */
export const browserSessionRoutesPlugin: FastifyPluginCallback = (
  instance,
  _opts,
  done,
) => {
  instance.setErrorHandler((error, _request, reply) => {
    const failure = normalizePluginError(error);
    // Set the status first, then build and send the error body.
    const response = reply.status(failure.statusCode);

    return response.send(
      buildBrowserSessionErrorResponse({
        error: failure.errorMessage,
        statusCode: failure.statusCode,
        stack: failure.stack,
      }),
    );
  });

  browserSessionRoutes.forEach((route) => {
    instance.route(route);
  });

  done();
};


================================================
FILE: packages/server-v4/src/routes/v4/browsersession/setExtraHTTPHeaders.ts
================================================
import type { RouteOptions } from "fastify";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  BrowserSessionHeadersSchema,
  BrowserSessionSetExtraHTTPHeadersActionSchema,
  BrowserSessionSetExtraHTTPHeadersResultSchema,
  BrowserSessionSetExtraHTTPHeadersRequestSchema,
  BrowserSessionSetExtraHTTPHeadersResponseSchema,
} from "../../../schemas/v4/browserSession.js";
import {
  browserSessionActionErrorResponses,
  createBrowserSessionActionHandler,
} from "./shared.js";

/** Schemas for `POST /browsersession/setExtraHTTPHeaders`. */
const setExtraHTTPHeadersRouteSchema = {
  operationId: "BrowserSessionSetExtraHTTPHeaders",
  summary: "browserSession.setExtraHTTPHeaders",
  headers: BrowserSessionHeadersSchema,
  body: BrowserSessionSetExtraHTTPHeadersRequestSchema,
  response: {
    200: BrowserSessionSetExtraHTTPHeadersResponseSchema,
    ...browserSessionActionErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Route definition for `browserSession.setExtraHTTPHeaders`.
 *
 * The execute callback echoes the requested `headers` back as the result
 * after parsing them with the result schema.
 */
const setExtraHTTPHeadersRoute: RouteOptions = {
  method: "POST",
  url: "/browsersession/setExtraHTTPHeaders",
  schema: setExtraHTTPHeadersRouteSchema,
  handler: createBrowserSessionActionHandler({
    method: "setExtraHTTPHeaders",
    actionSchema: BrowserSessionSetExtraHTTPHeadersActionSchema,
    execute: async (ctx) => {
      const result = BrowserSessionSetExtraHTTPHeadersResultSchema.parse({
        headers: ctx.params.headers,
      });
      return { result };
    },
  }),
};

export default setExtraHTTPHeadersRoute;


================================================
FILE: packages/server-v4/src/routes/v4/browsersession/shared.ts
================================================
import { randomUUID } from "node:crypto";

import type { RouteHandlerMethod } from "fastify";
import { StatusCodes } from "http-status-codes";
import { z } from "zod/v4";

import {
  type BrowserSession,
  type BrowserSessionAction,
  BrowserSessionPagesActionSchema,
  type BrowserSessionActionDetailsQuery,
  type BrowserSessionActionMethod,
  type BrowserSessionPage,
  BrowserSessionSchema,
  BrowserSessionV4ErrorResponseSchema,
} from "../../../schemas/v4/browserSession.js";

/**
 * Builds a `BrowserSession` from the given fields and validates it with
 * `BrowserSessionSchema.parse`.
 *
 * Only the fields named in the parameter type are forwarded to the schema.
 * When `cdpUrl` is `null` or `undefined`, the placeholder
 * `ws://stub.invalid/devtools/browser/stub` is used instead.
 *
 * @param input - Session fields; optional ones are passed through as given.
 * @returns The value returned by `BrowserSessionSchema.parse`.
 */
export function buildBrowserSession(input: {
  id: string;
  env: BrowserSession["env"];
  status: "running" | "ended";
  available: boolean;
  modelName: string;
  cdpUrl?: string | null;
  browserbaseSessionId?: string;
  browserbaseSessionCreateParams?: BrowserSession["browserbaseSessionCreateParams"];
  localBrowserLaunchOptions?: BrowserSession["localBrowserLaunchOptions"];
  domSettleTimeoutMs?: number;
  verbose?: BrowserSession["verbose"];
  systemPrompt?: string;
  selfHeal?: boolean;
  waitForCaptchaSolves?: boolean;
  experimental?: boolean;
  actTimeoutMs?: number;
}): BrowserSession {
  const {
    id,
    env,
    status,
    available,
    modelName,
    cdpUrl,
    browserbaseSessionId,
    browserbaseSessionCreateParams,
    localBrowserLaunchOptions,
    domSettleTimeoutMs,
    verbose,
    systemPrompt,
    selfHeal,
    waitForCaptchaSolves,
    experimental,
    actTimeoutMs,
  } = input;

  const candidate = {
    id,
    env,
    status,
    modelName,
    cdpUrl: cdpUrl ?? "ws://stub.invalid/devtools/browser/stub",
    available,
    browserbaseSessionId,
    browserbaseSessionCreateParams,
    localBrowserLaunchOptions,
    domSettleTimeoutMs,
    verbose,
    systemPrompt,
    selfHeal,
    waitForCaptchaSolves,
    experimental,
    actTimeoutMs,
  };

  return BrowserSessionSchema.parse(candidate);
}

/**
 * Response-schema entries for the error statuses of browserSession action
 * routes. Every listed status (400, 401, 404, 408, 422, 500) maps to the same
 * `BrowserSessionV4ErrorResponseSchema`. Intended to be spread into a route's
 * `response` map next to its 200 entry.
 */
export const browserSessionActionErrorResponses = {
  400: BrowserSessionV4ErrorResponseSchema,
  401: BrowserSessionV4ErrorResponseSchema,
  404: BrowserSessionV4ErrorResponseSchema,
  408: BrowserSessionV4ErrorResponseSchema,
  422: BrowserSessionV4ErrorResponseSchema,
  500: BrowserSessionV4ErrorResponseSchema,
};

/**
 * Shape that `createBrowserSessionActionHandler` casts `request.body` to:
 * the target session id plus the action-specific params.
 */
type BrowserSessionRequestBody<TAction extends BrowserSessionAction> = {
  sessionId: string;
  params: TAction["params"];
};

/**
 * Argument handed to an action's `execute` callback.
 *
 * `request` is the first parameter type of Fastify's `RouteHandlerMethod`.
 * `sessionStore` is typed `unknown`; `createBrowserSessionActionHandler` in
 * this file always passes `undefined` for it.
 */
type BrowserSessionActionHandlerContext<TAction extends BrowserSessionAction> =
  {
    params: TAction["params"];
    request: Parameters<RouteHandlerMethod>[0];
    sessionId: string;
    sessionStore: unknown;
  };

/**
 * Value an `execute` callback resolves to: the action result and, optionally,
 * a page id. When `pageId` is omitted, `createBrowserSessionActionHandler`
 * falls back to a string `pageId` found on the request params, if any.
 */
type BrowserSessionActionExecutionResult<TAction extends BrowserSessionAction> =
  {
    result: TAction["result"];
    pageId?: string;
  };

/**
 * Converts a page-like object exposing accessor methods into a plain
 * `BrowserSessionPage` record.
 *
 * The target id is read once and used for both `pageId` and `targetId`.
 *
 * @param page - Object providing `targetId()`, `mainFrameId()` and `url()`.
 * @returns A record with `pageId`, `targetId`, `mainFrameId` and `url`.
 */
export function buildBrowserSessionPage(page: {
  mainFrameId(): string;
  targetId(): string;
  url(): string;
}): BrowserSessionPage {
  const id = page.targetId();
  const mainFrameId = page.mainFrameId();
  const url = page.url();

  return { pageId: id, targetId: id, mainFrameId, url };
}

/**
 * Produces a placeholder `BrowserSessionPage`.
 *
 * @param sessionId - Interpolated into the default URL
 *   `https://stub.invalid/<sessionId>`.
 * @param input - Optional overrides. A nullish `pageId` falls back to
 *   `"page_stub"`; a nullish `url` falls back to the default URL.
 * @returns A page whose `targetId` equals its `pageId` and whose
 *   `mainFrameId` is always `"frame_stub"`.
 */
export function buildStubBrowserSessionPage(
  sessionId: string,
  input?: { pageId?: string; url?: string },
): BrowserSessionPage {
  const stubId = input?.pageId ?? "page_stub";
  const stubUrl = input?.url ?? `https://stub.invalid/${sessionId}`;

  const page: BrowserSessionPage = {
    pageId: stubId,
    targetId: stubId,
    mainFrameId: "frame_stub",
    url: stubUrl,
  };
  return page;
}

/**
 * Returns a fresh placeholder cookie object on every call.
 *
 * The values are fixed: name `stub_cookie`, value `stub_value`, domain
 * `stub.invalid`, path `/`, `expires` 0, not HTTP-only, secure, and
 * `sameSite` `"Lax"`.
 */
export function buildStubBrowserSessionCookie() {
  const cookie = {
    name: "stub_cookie",
    value: "stub_value",
    domain: "stub.invalid",
    path: "/",
    expires: 0,
    httpOnly: false,
    secure: true,
    sameSite: "Lax" as const,
  };

  return cookie;
}

/**
 * Returns a fresh placeholder viewport: 1280 wide, 720 high, with a
 * `deviceScaleFactor` of 1.
 */
export function buildStubViewport() {
  const viewport = { width: 1280, height: 720, deviceScaleFactor: 1 };
  return viewport;
}

/**
 * Extracts a string `pageId` from an arbitrary params value.
 *
 * @param params - Any value; only non-null objects are inspected.
 * @returns The `pageId` property when it is present (via `in`) and is a
 *   string, otherwise `undefined`.
 */
function getInitialPageId(params: unknown): string | undefined {
  if (typeof params !== "object" || params === null) {
    return undefined;
  }

  if (!("pageId" in params)) {
    return undefined;
  }

  const candidate = (params as { pageId?: unknown }).pageId;
  return typeof candidate === "string" ? candidate : undefined;
}

/**
 * Converts a serialized matcher into a `string` or `RegExp`.
 *
 * @param value - A plain string, or an object carrying a regular-expression
 *   `source` and optional `flags`.
 * @returns `undefined` for any falsy input (including the empty string), the
 *   string itself for string input, otherwise
 *   `new RegExp(value.source, value.flags)`.
 */
export function toStringOrRegExp(
  value?:
    | string
    | {
        source: string;
        flags?: string;
      },
): string | RegExp | undefined {
  if (!value) {
    return undefined;
  }

  return typeof value === "string"
    ? value
    : new RegExp(value.source, value.flags);
}

/**
 * Creates the Fastify handler shared by browserSession action routes.
 *
 * For each request the handler:
 *  1. reads `params` and `sessionId` from the request body,
 *  2. awaits `options.execute` (with `sessionStore` set to `undefined`),
 *  3. builds a "completed" action record with a random UUID, parses it with
 *     `options.actionSchema`, and
 *  4. replies 200 with `{ success: true, error: null, action }`.
 *
 * One timestamp, taken after `execute` resolves, is used for `createdAt`,
 * `updatedAt` and `completedAt`. The action's `pageId` is the one returned by
 * `execute`, or else a string `pageId` found on the params.
 *
 * @param options.actionSchema - Schema used to parse the action record.
 * @param options.execute - Produces the action result (and optional page id).
 * @param options.method - Method name stored on the action record.
 * @returns A Fastify route handler.
 */
export function createBrowserSessionActionHandler<
  TAction extends BrowserSessionAction,
>(options: {
  actionSchema: z.ZodType<TAction>;
  execute: (
    ctx: BrowserSessionActionHandlerContext<TAction>,
  ) => Promise<BrowserSessionActionExecutionResult<TAction>>;
  method: BrowserSessionActionMethod;
}): RouteHandlerMethod {
  const { actionSchema, method } = options;

  return async (request, reply) => {
    const body = request.body as BrowserSessionRequestBody<TAction>;
    const { params, sessionId } = body;

    const outcome = await options.execute({
      params,
      request,
      sessionId,
      sessionStore: undefined,
    });

    const timestamp = new Date().toISOString();
    const pageId = outcome.pageId ?? getInitialPageId(params);

    const action = actionSchema.parse({
      id: randomUUID(),
      method,
      status: "completed",
      sessionId,
      pageId,
      createdAt: timestamp,
      updatedAt: timestamp,
      completedAt: timestamp,
      error: null,
      params,
      result: outcome.result,
    });

    const payload = { success: true, error: null, action };
    return reply.status(StatusCodes.OK).send(payload);
  };
}

/**
 * Handler for fetching one browserSession action by id.
 *
 * It always answers 200 with a synthesized, completed `pages` action: the id
 * comes from the `actionId` route param, the session id from the query
 * string, and the result holds one stub page for that session.
 */
export const browserSessionActionDetailsHandler: RouteHandlerMethod = async (
  request,
  reply,
) => {
  const routeParams = request.params as { actionId: string };
  const query = request.query as BrowserSessionActionDetailsQuery;
  const { sessionId } = query;

  const timestamp = new Date().toISOString();
  const stubPages = [buildStubBrowserSessionPage(sessionId)];

  const action = BrowserSessionPagesActionSchema.parse({
    id: routeParams.actionId,
    method: "pages",
    status: "completed",
    sessionId,
    createdAt: timestamp,
    updatedAt: timestamp,
    completedAt: timestamp,
    error: null,
    params: {},
    result: { pages: stubPages },
  });

  const payload = { success: true, error: null, action };
  return reply.status(StatusCodes.OK).send(payload);
};

/**
 * Handler for listing browserSession actions.
 *
 * It always answers 200 with a one-element `actions` array containing a
 * synthesized, completed `pages` action (random UUID id) for the session id
 * taken from the query string.
 */
export const browserSessionActionListHandler: RouteHandlerMethod = async (
  request,
  reply,
) => {
  const query = request.query as BrowserSessionActionDetailsQuery;
  const { sessionId } = query;
  const timestamp = new Date().toISOString();

  const stubAction = BrowserSessionPagesActionSchema.parse({
    id: randomUUID(),
    method: "pages",
    status: "completed",
    sessionId,
    createdAt: timestamp,
    updatedAt: timestamp,
    completedAt: timestamp,
    error: null,
    params: {},
    result: {
      pages: [buildStubBrowserSessionPage(sessionId)],
    },
  });

  return reply.status(StatusCodes.OK).send({
    success: true,
    error: null,
    actions: [stubAction],
  });
};


================================================
FILE: packages/server-v4/src/routes/v4/page/action/_actionId.ts
================================================
import type { RouteOptions } from "fastify";
import { Api } from "@browserbasehq/stagehand";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  PageActionDetailsQuerySchema,
  PageActionDetailsResponseSchema,
  PageActionIdParamsSchema,
} from "../../../../schemas/v4/page.js";
import { pageActionDetailsHandler, pageErrorResponses } from "../shared.js";

/** Header, path-param, query and response schemas for `GET /page/action/:actionId`. */
const pageActionDetailsRouteSchema = {
  operationId: "PageActionDetails",
  summary: "page.actionById",
  headers: Api.SessionHeadersSchema,
  params: PageActionIdParamsSchema,
  querystring: PageActionDetailsQuerySchema,
  response: {
    200: PageActionDetailsResponseSchema,
    ...pageErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/** Route definition for `page.actionById`, served by `pageActionDetailsHandler`. */
const pageActionDetailsRoute: RouteOptions = {
  method: "GET",
  url: "/page/action/:actionId",
  schema: pageActionDetailsRouteSchema,
  handler: pageActionDetailsHandler,
};

export default pageActionDetailsRoute;


================================================
FILE: packages/server-v4/src/routes/v4/page/action/index.ts
================================================
import type { RouteOptions } from "fastify";
import { Api } from "@browserbasehq/stagehand";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  PageActionListQuerySchema,
  PageActionListResponseSchema,
} from "../../../../schemas/v4/page.js";
import { pageActionListHandler, pageErrorResponses } from "../shared.js";

/** Header, query and response schemas for `GET /page/action`. */
const pageActionListRouteSchema = {
  operationId: "PageActionList",
  summary: "page.action",
  headers: Api.SessionHeadersSchema,
  querystring: PageActionListQuerySchema,
  response: {
    200: PageActionListResponseSchema,
    ...pageErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/** Route definition for `page.action`, served by `pageActionListHandler`. */
const pageActionListRoute: RouteOptions = {
  method: "GET",
  url: "/page/action",
  schema: pageActionListRouteSchema,
  handler: pageActionListHandler,
};

export default pageActionListRoute;


================================================
FILE: packages/server-v4/src/routes/v4/page/addInitScript.ts
================================================
import type { RouteOptions } from "fastify";
import { Api } from "@browserbasehq/stagehand";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  PageAddInitScriptActionSchema,
  PageAddInitScriptResultSchema,
  PageAddInitScriptRequestSchema,
  PageAddInitScriptResponseSchema,
} from "../../../schemas/v4/page.js";
import { createPageActionHandler, pageErrorResponses } from "./shared.js";

/** Header, body and response schemas for `POST /page/addInitScript`. */
const addInitScriptRouteSchema = {
  operationId: "PageAddInitScript",
  summary: "page.addInitScript",
  headers: Api.SessionHeadersSchema,
  body: PageAddInitScriptRequestSchema,
  response: {
    200: PageAddInitScriptResponseSchema,
    ...pageErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Route definition for `page.addInitScript`.
 *
 * The execute callback ignores its input and reports `{ added: true }`.
 */
const addInitScriptRoute: RouteOptions = {
  method: "POST",
  url: "/page/addInitScript",
  schema: addInitScriptRouteSchema,
  handler: createPageActionHandler({
    method: "addInitScript",
    actionSchema: PageAddInitScriptActionSchema,
    execute: async () => PageAddInitScriptResultSchema.parse({ added: true }),
  }),
};

export default addInitScriptRoute;


================================================
FILE: packages/server-v4/src/routes/v4/page/asProtocolFrameTree.ts
================================================
import type { RouteOptions } from "fastify";
import { Api } from "@browserbasehq/stagehand";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  PageAsProtocolFrameTreeActionSchema,
  PageFrameTreeResultSchema,
  PageAsProtocolFrameTreeRequestSchema,
  PageAsProtocolFrameTreeResponseSchema,
} from "../../../schemas/v4/page.js";
import { createPageActionHandler, pageErrorResponses } from "./shared.js";

/** Header, query and response schemas for `GET /page/asProtocolFrameTree`. */
const asProtocolFrameTreeRouteSchema = {
  operationId: "PageAsProtocolFrameTree",
  summary: "page.asProtocolFrameTree",
  headers: Api.SessionHeadersSchema,
  querystring: PageAsProtocolFrameTreeRequestSchema,
  response: {
    200: PageAsProtocolFrameTreeResponseSchema,
    ...pageErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Route definition for `page.asProtocolFrameTree`.
 *
 * The execute callback returns a frame tree that echoes the requested
 * `rootMainFrameId` and has no children.
 */
const asProtocolFrameTreeRoute: RouteOptions = {
  method: "GET",
  url: "/page/asProtocolFrameTree",
  schema: asProtocolFrameTreeRouteSchema,
  handler: createPageActionHandler({
    method: "asProtocolFrameTree",
    actionSchema: PageAsProtocolFrameTreeActionSchema,
    execute: async ({ params }) => {
      const frameTree = {
        rootMainFrameId: params.rootMainFrameId,
        children: [],
      };
      return PageFrameTreeResultSchema.parse({ frameTree });
    },
  }),
};

export default asProtocolFrameTreeRoute;


================================================
FILE: packages/server-v4/src/routes/v4/page/click.ts
================================================
import type { RouteOptions } from "fastify";
import { Api } from "@browserbasehq/stagehand";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  PageClickActionSchema,
  PageClickRequestSchema,
  PageClickResponseSchema,
  PageXPathResultSchema,
} from "../../../schemas/v4/page.js";
import { createPageActionHandler, pageErrorResponses } from "./shared.js";

/** Header, body and response schemas for `POST /page/click`. */
const clickRouteSchema = {
  operationId: "PageClick",
  summary: "page.click",
  headers: Api.SessionHeadersSchema,
  body: PageClickRequestSchema,
  response: {
    200: PageClickResponseSchema,
    ...pageErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Route definition for `page.click`.
 *
 * The execute callback echoes the selector's `xpath` when the selector has
 * one, and otherwise answers with the placeholder `xpath=//stub-click`.
 */
const clickRoute: RouteOptions = {
  method: "POST",
  url: "/page/click",
  schema: clickRouteSchema,
  handler: createPageActionHandler({
    method: "click",
    actionSchema: PageClickActionSchema,
    execute: async ({ params }) => {
      const target = params.selector;
      const xpath = "xpath" in target ? target.xpath : "xpath=//stub-click";
      return PageXPathResultSchema.parse({ xpath });
    },
  }),
};

export default clickRoute;


================================================
FILE: packages/server-v4/src/routes/v4/page/close.ts
================================================
import type { RouteOptions } from "fastify";
import { Api } from "@browserbasehq/stagehand";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  PageCloseActionSchema,
  PageCloseResultSchema,
  PageCloseRequestSchema,
  PageCloseResponseSchema,
} from "../../../schemas/v4/page.js";
import { createPageActionHandler, pageErrorResponses } from "./shared.js";

/** Header, body and response schemas for `POST /page/close`. */
const closeRouteSchema = {
  operationId: "PageClose",
  summary: "page.close",
  headers: Api.SessionHeadersSchema,
  body: PageCloseRequestSchema,
  response: {
    200: PageCloseResponseSchema,
    ...pageErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Route definition for `page.close`.
 *
 * The execute callback ignores its input and reports `{ closed: true }`.
 */
const closeRoute: RouteOptions = {
  method: "POST",
  url: "/page/close",
  schema: closeRouteSchema,
  handler: createPageActionHandler({
    method: "close",
    actionSchema: PageCloseActionSchema,
    execute: async () => PageCloseResultSchema.parse({ closed: true }),
  }),
};

export default closeRoute;


================================================
FILE: packages/server-v4/src/routes/v4/page/dragAndDrop.ts
================================================
import type { RouteOptions } from "fastify";
import { Api } from "@browserbasehq/stagehand";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  PageDragAndDropActionSchema,
  PageDragAndDropResultSchema,
  PageDragAndDropRequestSchema,
  PageDragAndDropResponseSchema,
} from "../../../schemas/v4/page.js";
import { createPageActionHandler, pageErrorResponses } from "./shared.js";

/** Header, body and response schemas for `POST /page/dragAndDrop`. */
const dragAndDropRouteSchema = {
  operationId: "PageDragAndDrop",
  summary: "page.dragAndDrop",
  headers: Api.SessionHeadersSchema,
  body: PageDragAndDropRequestSchema,
  response: {
    200: PageDragAndDropResponseSchema,
    ...pageErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Route definition for `page.dragAndDrop`.
 *
 * The execute callback echoes the `xpath` of the `from` and `to` selectors
 * when present, falling back to `xpath=//stub-from` and `xpath=//stub-to`.
 */
const dragAndDropRoute: RouteOptions = {
  method: "POST",
  url: "/page/dragAndDrop",
  schema: dragAndDropRouteSchema,
  handler: createPageActionHandler({
    method: "dragAndDrop",
    actionSchema: PageDragAndDropActionSchema,
    execute: async ({ params }) => {
      const source = params.from;
      const destination = params.to;
      const fromXpath = "xpath" in source ? source.xpath : "xpath=//stub-from";
      const toXpath =
        "xpath" in destination ? destination.xpath : "xpath=//stub-to";
      return PageDragAndDropResultSchema.parse({ fromXpath, toXpath });
    },
  }),
};

export default dragAndDropRoute;


================================================
FILE: packages/server-v4/src/routes/v4/page/enableCursorOverlay.ts
================================================
import type { RouteOptions } from "fastify";
import { Api } from "@browserbasehq/stagehand";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  PageEnableCursorOverlayActionSchema,
  PageEnableCursorOverlayResultSchema,
  PageEnableCursorOverlayRequestSchema,
  PageEnableCursorOverlayResponseSchema,
} from "../../../schemas/v4/page.js";
import { createPageActionHandler, pageErrorResponses } from "./shared.js";

/** Header, body and response schemas for `POST /page/enableCursorOverlay`. */
const enableCursorOverlayRouteSchema = {
  operationId: "PageEnableCursorOverlay",
  summary: "page.enableCursorOverlay",
  headers: Api.SessionHeadersSchema,
  body: PageEnableCursorOverlayRequestSchema,
  response: {
    200: PageEnableCursorOverlayResponseSchema,
    ...pageErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Route definition for `page.enableCursorOverlay`.
 *
 * The execute callback ignores its input and reports `{ enabled: true }`.
 */
const enableCursorOverlayRoute: RouteOptions = {
  method: "POST",
  url: "/page/enableCursorOverlay",
  schema: enableCursorOverlayRouteSchema,
  handler: createPageActionHandler({
    method: "enableCursorOverlay",
    actionSchema: PageEnableCursorOverlayActionSchema,
    execute: async () =>
      PageEnableCursorOverlayResultSchema.parse({ enabled: true }),
  }),
};

export default enableCursorOverlayRoute;


================================================
FILE: packages/server-v4/src/routes/v4/page/evaluate.ts
================================================
import type { RouteOptions } from "fastify";
import { Api } from "@browserbasehq/stagehand";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  PageEvaluateActionSchema,
  PageEvaluateResultSchema,
  PageEvaluateRequestSchema,
  PageEvaluateResponseSchema,
} from "../../../schemas/v4/page.js";
import { createPageActionHandler, pageErrorResponses } from "./shared.js";

/** Header, body and response schemas for `POST /page/evaluate`. */
const evaluateRouteSchema = {
  operationId: "PageEvaluate",
  summary: "page.evaluate",
  headers: Api.SessionHeadersSchema,
  body: PageEvaluateRequestSchema,
  response: {
    200: PageEvaluateResponseSchema,
    ...pageErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Route definition for `page.evaluate`.
 *
 * The execute callback does not run the expression: its `value` echoes the
 * requested `expression` and `arg` (a nullish `arg` becomes `null`).
 */
const evaluateRoute: RouteOptions = {
  method: "POST",
  url: "/page/evaluate",
  schema: evaluateRouteSchema,
  handler: createPageActionHandler({
    method: "evaluate",
    actionSchema: PageEvaluateActionSchema,
    execute: async ({ params }) => {
      const value = {
        expression: params.expression,
        arg: params.arg ?? null,
      };
      return PageEvaluateResultSchema.parse({ value });
    },
  }),
};

export default evaluateRoute;


================================================
FILE: packages/server-v4/src/routes/v4/page/frames.ts
================================================
import type { RouteOptions } from "fastify";
import { Api } from "@browserbasehq/stagehand";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  PageFramesActionSchema,
  PageFramesResultSchema,
  PageFramesRequestSchema,
  PageFramesResponseSchema,
} from "../../../schemas/v4/page.js";
import {
  buildStubPageFrame,
  createPageActionHandler,
  getPageId,
  pageErrorResponses,
} from "./shared.js";

/** Header, query and response schemas for `GET /page/frames`. */
const framesRouteSchema = {
  operationId: "PageFrames",
  summary: "page.frames",
  headers: Api.SessionHeadersSchema,
  querystring: PageFramesRequestSchema,
  response: {
    200: PageFramesResponseSchema,
    ...pageErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Route definition for `page.frames`.
 *
 * The execute callback returns a one-element frame list built by
 * `buildStubPageFrame` from the page id that `getPageId` derives from the
 * params.
 */
const framesRoute: RouteOptions = {
  method: "GET",
  url: "/page/frames",
  schema: framesRouteSchema,
  handler: createPageActionHandler({
    method: "frames",
    actionSchema: PageFramesActionSchema,
    execute: async ({ params }) => {
      const stubFrame = buildStubPageFrame(getPageId(params));
      return PageFramesResultSchema.parse({ frames: [stubFrame] });
    },
  }),
};

export default framesRoute;


================================================
FILE: packages/server-v4/src/routes/v4/page/getFullFrameTree.ts
================================================
import type { RouteOptions } from "fastify";
import { Api } from "@browserbasehq/stagehand";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  PageGetFullFrameTreeActionSchema,
  PageFrameTreeResultSchema,
  PageGetFullFrameTreeRequestSchema,
  PageGetFullFrameTreeResponseSchema,
} from "../../../schemas/v4/page.js";
import {
  createPageActionHandler,
  getPageId,
  pageErrorResponses,
} from "./shared.js";

/** Header, query and response schemas for `GET /page/getFullFrameTree`. */
const getFullFrameTreeRouteSchema = {
  operationId: "PageGetFullFrameTree",
  summary: "page.getFullFrameTree",
  headers: Api.SessionHeadersSchema,
  querystring: PageGetFullFrameTreeRequestSchema,
  response: {
    200: PageGetFullFrameTreeResponseSchema,
    ...pageErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Route definition for `page.getFullFrameTree`.
 *
 * The execute callback returns a frame tree carrying the page id that
 * `getPageId` derives from the params, with no children.
 */
const getFullFrameTreeRoute: RouteOptions = {
  method: "GET",
  url: "/page/getFullFrameTree",
  schema: getFullFrameTreeRouteSchema,
  handler: createPageActionHandler({
    method: "getFullFrameTree",
    actionSchema: PageGetFullFrameTreeActionSchema,
    execute: async ({ params }) => {
      const frameTree = {
        pageId: getPageId(params),
        children: [],
      };
      return PageFrameTreeResultSchema.parse({ frameTree });
    },
  }),
};

export default getFullFrameTreeRoute;


================================================
FILE: packages/server-v4/src/routes/v4/page/getOrdinal.ts
================================================
import type { RouteOptions } from "fastify";
import { Api } from "@browserbasehq/stagehand";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  PageGetOrdinalActionSchema,
  PageGetOrdinalResultSchema,
  PageGetOrdinalRequestSchema,
  PageGetOrdinalResponseSchema,
} from "../../../schemas/v4/page.js";
import { createPageActionHandler, pageErrorResponses } from "./shared.js";

/** Header, query and response schemas for `GET /page/getOrdinal`. */
const getOrdinalRouteSchema = {
  operationId: "PageGetOrdinal",
  summary: "page.getOrdinal",
  headers: Api.SessionHeadersSchema,
  querystring: PageGetOrdinalRequestSchema,
  response: {
    200: PageGetOrdinalResponseSchema,
    ...pageErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Route definition for `page.getOrdinal`.
 *
 * The execute callback echoes the requested `frameId` and always reports
 * ordinal 0.
 */
const getOrdinalRoute: RouteOptions = {
  method: "GET",
  url: "/page/getOrdinal",
  schema: getOrdinalRouteSchema,
  handler: createPageActionHandler({
    method: "getOrdinal",
    actionSchema: PageGetOrdinalActionSchema,
    execute: async ({ params }) => {
      const stubResult = { frameId: params.frameId, ordinal: 0 };
      return PageGetOrdinalResultSchema.parse(stubResult);
    },
  }),
};

export default getOrdinalRoute;


================================================
FILE: packages/server-v4/src/routes/v4/page/goBack.ts
================================================
import type { RouteOptions } from "fastify";
import { Api } from "@browserbasehq/stagehand";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  PageGoBackActionSchema,
  PageNavigationResultSchema,
  PageGoBackRequestSchema,
  PageGoBackResponseSchema,
} from "../../../schemas/v4/page.js";
import {
  buildStubNavigationResult,
  createPageActionHandler,
  getPageId,
  pageErrorResponses,
} from "./shared.js";

/** Header, body and response schemas for `POST /page/goBack`. */
const goBackRouteSchema = {
  operationId: "PageGoBack",
  summary: "page.goBack",
  headers: Api.SessionHeadersSchema,
  body: PageGoBackRequestSchema,
  response: {
    200: PageGoBackResponseSchema,
    ...pageErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Route definition for `page.goBack`.
 *
 * The execute callback returns the value of `buildStubNavigationResult` for
 * the URL `https://stub.invalid/<pageId>`, where the page id comes from
 * `getPageId(params)`.
 */
const goBackRoute: RouteOptions = {
  method: "POST",
  url: "/page/goBack",
  schema: goBackRouteSchema,
  handler: createPageActionHandler({
    method: "goBack",
    actionSchema: PageGoBackActionSchema,
    execute: async ({ params }) => {
      const stubUrl = `https://stub.invalid/${getPageId(params)}`;
      const navigation = buildStubNavigationResult(stubUrl);
      return PageNavigationResultSchema.parse(navigation);
    },
  }),
};

export default goBackRoute;


================================================
FILE: packages/server-v4/src/routes/v4/page/goForward.ts
================================================
import type { RouteOptions } from "fastify";
import { Api } from "@browserbasehq/stagehand";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  PageGoForwardActionSchema,
  PageNavigationResultSchema,
  PageGoForwardRequestSchema,
  PageGoForwardResponseSchema,
} from "../../../schemas/v4/page.js";
import {
  buildStubNavigationResult,
  createPageActionHandler,
  getPageId,
  pageErrorResponses,
} from "./shared.js";

/** Header, body and response schemas for `POST /page/goForward`. */
const goForwardRouteSchema = {
  operationId: "PageGoForward",
  summary: "page.goForward",
  headers: Api.SessionHeadersSchema,
  body: PageGoForwardRequestSchema,
  response: {
    200: PageGoForwardResponseSchema,
    ...pageErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Route definition for `page.goForward`.
 *
 * The execute callback returns the value of `buildStubNavigationResult` for
 * the URL `https://stub.invalid/<pageId>`, where the page id comes from
 * `getPageId(params)`.
 */
const goForwardRoute: RouteOptions = {
  method: "POST",
  url: "/page/goForward",
  schema: goForwardRouteSchema,
  handler: createPageActionHandler({
    method: "goForward",
    actionSchema: PageGoForwardActionSchema,
    execute: async ({ params }) => {
      const stubUrl = `https://stub.invalid/${getPageId(params)}`;
      const navigation = buildStubNavigationResult(stubUrl);
      return PageNavigationResultSchema.parse(navigation);
    },
  }),
};

export default goForwardRoute;


================================================
FILE: packages/server-v4/src/routes/v4/page/goto.ts
================================================
import type { RouteOptions } from "fastify";
import { Api } from "@browserbasehq/stagehand";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  PageGotoActionSchema,
  PageNavigationResultSchema,
  PageGotoRequestSchema,
  PageGotoResponseSchema,
} from "../../../schemas/v4/page.js";
import {
  buildStubNavigationResult,
  createPageActionHandler,
  pageErrorResponses,
} from "./shared.js";

/** Header, body and response schemas for `POST /page/goto`. */
const gotoRouteSchema = {
  operationId: "PageGoto",
  summary: "page.goto",
  headers: Api.SessionHeadersSchema,
  body: PageGotoRequestSchema,
  response: {
    200: PageGotoResponseSchema,
    ...pageErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Route definition for `page.goto`.
 *
 * The execute callback returns the value of `buildStubNavigationResult` for
 * the requested `url`.
 */
const gotoRoute: RouteOptions = {
  method: "POST",
  url: "/page/goto",
  schema: gotoRouteSchema,
  handler: createPageActionHandler({
    method: "goto",
    actionSchema: PageGotoActionSchema,
    execute: async ({ params }) => {
      const navigation = buildStubNavigationResult(params.url);
      return PageNavigationResultSchema.parse(navigation);
    },
  }),
};

export default gotoRoute;


================================================
FILE: packages/server-v4/src/routes/v4/page/hover.ts
================================================
import type { RouteOptions } from "fastify";
import { Api } from "@browserbasehq/stagehand";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  PageHoverActionSchema,
  PageHoverRequestSchema,
  PageHoverResponseSchema,
  PageXPathResultSchema,
} from "../../../schemas/v4/page.js";
import { createPageActionHandler, pageErrorResponses } from "./shared.js";

/** Validation/OpenAPI schema for `POST /page/hover`. */
const hoverRouteSchema = {
  operationId: "PageHover",
  summary: "page.hover",
  headers: Api.SessionHeadersSchema,
  body: PageHoverRequestSchema,
  response: {
    200: PageHoverResponseSchema,
    ...pageErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Stub handler for `page.hover`: echoes the selector's xpath when the
 * selector carries one, otherwise answers with a placeholder xpath.
 */
const hoverRouteHandler = createPageActionHandler({
  method: "hover",
  actionSchema: PageHoverActionSchema,
  execute: async ({ params }) => {
    const { selector } = params;
    const xpath = "xpath" in selector ? selector.xpath : "xpath=//stub-hover";
    return PageXPathResultSchema.parse({ xpath });
  },
});

/** Route definition for `POST /page/hover`. */
const hoverRoute: RouteOptions = {
  method: "POST",
  url: "/page/hover",
  schema: hoverRouteSchema,
  handler: hoverRouteHandler,
};

export default hoverRoute;


================================================
FILE: packages/server-v4/src/routes/v4/page/keyPress.ts
================================================
import type { RouteOptions } from "fastify";
import { Api } from "@browserbasehq/stagehand";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  PageKeyPressActionSchema,
  PageKeyPressResultSchema,
  PageKeyPressRequestSchema,
  PageKeyPressResponseSchema,
} from "../../../schemas/v4/page.js";
import { createPageActionHandler, pageErrorResponses } from "./shared.js";

/** Validation/OpenAPI schema for `POST /page/keyPress`. */
const keyPressRouteSchema = {
  operationId: "PageKeyPress",
  summary: "page.keyPress",
  headers: Api.SessionHeadersSchema,
  body: PageKeyPressRequestSchema,
  response: {
    200: PageKeyPressResponseSchema,
    ...pageErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/** Stub handler for `page.keyPress`: echoes the requested key back. */
const keyPressRouteHandler = createPageActionHandler({
  method: "keyPress",
  actionSchema: PageKeyPressActionSchema,
  execute: async ({ params }) =>
    PageKeyPressResultSchema.parse({ key: params.key }),
});

/** Route definition for `POST /page/keyPress`. */
const keyPressRoute: RouteOptions = {
  method: "POST",
  url: "/page/keyPress",
  schema: keyPressRouteSchema,
  handler: keyPressRouteHandler,
};

export default keyPressRoute;


================================================
FILE: packages/server-v4/src/routes/v4/page/listAllFrameIds.ts
================================================
import type { RouteOptions } from "fastify";
import { Api } from "@browserbasehq/stagehand";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  PageListAllFrameIdsActionSchema,
  PageListAllFrameIdsResultSchema,
  PageListAllFrameIdsRequestSchema,
  PageListAllFrameIdsResponseSchema,
} from "../../../schemas/v4/page.js";
import { createPageActionHandler, pageErrorResponses } from "./shared.js";

/** Validation/OpenAPI schema for `GET /page/listAllFrameIds`. */
const listAllFrameIdsRouteSchema = {
  operationId: "PageListAllFrameIds",
  summary: "page.listAllFrameIds",
  headers: Api.SessionHeadersSchema,
  querystring: PageListAllFrameIdsRequestSchema,
  response: {
    200: PageListAllFrameIdsResponseSchema,
    ...pageErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/** Stub handler for `page.listAllFrameIds`: always reports one fixed frame id. */
const listAllFrameIdsRouteHandler = createPageActionHandler({
  method: "listAllFrameIds",
  actionSchema: PageListAllFrameIdsActionSchema,
  execute: async () =>
    PageListAllFrameIdsResultSchema.parse({ frameIds: ["frame_stub"] }),
});

/** Route definition for `GET /page/listAllFrameIds`. */
const listAllFrameIdsRoute: RouteOptions = {
  method: "GET",
  url: "/page/listAllFrameIds",
  schema: listAllFrameIdsRouteSchema,
  handler: listAllFrameIdsRouteHandler,
};

export default listAllFrameIdsRoute;


================================================
FILE: packages/server-v4/src/routes/v4/page/mainFrame.ts
================================================
import type { RouteOptions } from "fastify";
import { Api } from "@browserbasehq/stagehand";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  PageMainFrameActionSchema,
  PageMainFrameResultSchema,
  PageMainFrameRequestSchema,
  PageMainFrameResponseSchema,
} from "../../../schemas/v4/page.js";
import {
  buildStubPageFrame,
  createPageActionHandler,
  getPageId,
  pageErrorResponses,
} from "./shared.js";

/** Validation/OpenAPI schema for `GET /page/mainFrame`. */
const mainFrameRouteSchema = {
  operationId: "PageMainFrame",
  summary: "page.mainFrame",
  headers: Api.SessionHeadersSchema,
  querystring: PageMainFrameRequestSchema,
  response: {
    200: PageMainFrameResponseSchema,
    ...pageErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Stub handler for `page.mainFrame`: returns a placeholder frame bound to the
 * page id resolved from the request params.
 */
const mainFrameRouteHandler = createPageActionHandler({
  method: "mainFrame",
  actionSchema: PageMainFrameActionSchema,
  execute: async ({ params }) => {
    const frame = buildStubPageFrame(getPageId(params));
    return PageMainFrameResultSchema.parse({ frame });
  },
});

/** Route definition for `GET /page/mainFrame`. */
const mainFrameRoute: RouteOptions = {
  method: "GET",
  url: "/page/mainFrame",
  schema: mainFrameRouteSchema,
  handler: mainFrameRouteHandler,
};

export default mainFrameRoute;


================================================
FILE: packages/server-v4/src/routes/v4/page/mainFrameId.ts
================================================
import type { RouteOptions } from "fastify";
import { Api } from "@browserbasehq/stagehand";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  PageMainFrameIdActionSchema,
  PageMainFrameIdResultSchema,
  PageMainFrameIdRequestSchema,
  PageMainFrameIdResponseSchema,
} from "../../../schemas/v4/page.js";
import { createPageActionHandler, pageErrorResponses } from "./shared.js";

/** Validation/OpenAPI schema for `GET /page/mainFrameId`. */
const mainFrameIdRouteSchema = {
  operationId: "PageMainFrameId",
  summary: "page.mainFrameId",
  headers: Api.SessionHeadersSchema,
  querystring: PageMainFrameIdRequestSchema,
  response: {
    200: PageMainFrameIdResponseSchema,
    ...pageErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/** Stub handler for `page.mainFrameId`: always reports the fixed stub frame id. */
const mainFrameIdRouteHandler = createPageActionHandler({
  method: "mainFrameId",
  actionSchema: PageMainFrameIdActionSchema,
  execute: async () =>
    PageMainFrameIdResultSchema.parse({ mainFrameId: "frame_stub" }),
});

/** Route definition for `GET /page/mainFrameId`. */
const mainFrameIdRoute: RouteOptions = {
  method: "GET",
  url: "/page/mainFrameId",
  schema: mainFrameIdRouteSchema,
  handler: mainFrameIdRouteHandler,
};

export default mainFrameIdRoute;


================================================
FILE: packages/server-v4/src/routes/v4/page/reload.ts
================================================
import type { RouteOptions } from "fastify";
import { Api } from "@browserbasehq/stagehand";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  PageReloadActionSchema,
  PageNavigationResultSchema,
  PageReloadRequestSchema,
  PageReloadResponseSchema,
} from "../../../schemas/v4/page.js";
import {
  buildStubNavigationResult,
  createPageActionHandler,
  getPageId,
  pageErrorResponses,
} from "./shared.js";

/** Validation/OpenAPI schema for `POST /page/reload`. */
const reloadRouteSchema = {
  operationId: "PageReload",
  summary: "page.reload",
  headers: Api.SessionHeadersSchema,
  body: PageReloadRequestSchema,
  response: {
    200: PageReloadResponseSchema,
    ...pageErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Stub handler for `page.reload`: reports a successful navigation to a
 * placeholder URL derived from the resolved page id.
 */
const reloadRouteHandler = createPageActionHandler({
  method: "reload",
  actionSchema: PageReloadActionSchema,
  execute: async ({ params }) => {
    const stubUrl = `https://stub.invalid/${getPageId(params)}`;
    return PageNavigationResultSchema.parse(buildStubNavigationResult(stubUrl));
  },
});

/** Route definition for `POST /page/reload`. */
const reloadRoute: RouteOptions = {
  method: "POST",
  url: "/page/reload",
  schema: reloadRouteSchema,
  handler: reloadRouteHandler,
};

export default reloadRoute;


================================================
FILE: packages/server-v4/src/routes/v4/page/routes.ts
================================================
import type { FastifyPluginCallback, RouteOptions } from "fastify";

import addInitScriptRoute from "./addInitScript.js";
import asProtocolFrameTreeRoute from "./asProtocolFrameTree.js";
import pageActionDetailsRoute from "./action/_actionId.js";
import pageActionListRoute from "./action/index.js";
import clickRoute from "./click.js";
import closeRoute from "./close.js";
import dragAndDropRoute from "./dragAndDrop.js";
import enableCursorOverlayRoute from "./enableCursorOverlay.js";
import evaluateRoute from "./evaluate.js";
import framesRoute from "./frames.js";
import getFullFrameTreeRoute from "./getFullFrameTree.js";
import getOrdinalRoute from "./getOrdinal.js";
import goBackRoute from "./goBack.js";
import goForwardRoute from "./goForward.js";
import gotoRoute from "./goto.js";
import hoverRoute from "./hover.js";
import keyPressRoute from "./keyPress.js";
import listAllFrameIdsRoute from "./listAllFrameIds.js";
import mainFrameRoute from "./mainFrame.js";
import mainFrameIdRoute from "./mainFrameId.js";
import screenshotRoute from "./screenshot.js";
import scrollRoute from "./scroll.js";
import sendCDPRoute from "./sendCDP.js";
import setExtraHTTPHeadersRoute from "./setExtraHTTPHeaders.js";
import setViewportSizeRoute from "./setViewportSize.js";
import snapshotRoute from "./snapshot.js";
import targetIdRoute from "./targetId.js";
import titleRoute from "./title.js";
import typeRoute from "./type.js";
import urlRoute from "./url.js";
import waitForLoadStateRoute from "./waitForLoadState.js";
import waitForMainLoadStateRoute from "./waitForMainLoadState.js";
import waitForSelectorRoute from "./waitForSelector.js";
import waitForTimeoutRoute from "./waitForTimeout.js";
import reloadRoute from "./reload.js";
import { buildErrorResponse } from "../../../schemas/v4/page.js";
import { normalizePluginError, withTag } from "../pluginUtils.js";

// Untagged page route definitions. `pageRoutes` maps over this array and the
// plugin registers the result in iteration order, so the order here is the
// order in which routes are registered on the Fastify instance.
const rawPageRoutes: RouteOptions[] = [
  clickRoute,
  hoverRoute,
  scrollRoute,
  dragAndDropRoute,
  typeRoute,
  keyPressRoute,
  gotoRoute,
  reloadRoute,
  goBackRoute,
  goForwardRoute,
  closeRoute,
  enableCursorOverlayRoute,
  addInitScriptRoute,
  targetIdRoute,
  mainFrameIdRoute,
  mainFrameRoute,
  getFullFrameTreeRoute,
  asProtocolFrameTreeRoute,
  listAllFrameIdsRoute,
  getOrdinalRoute,
  titleRoute,
  urlRoute,
  framesRoute,
  setExtraHTTPHeadersRoute,
  waitForMainLoadStateRoute,
  screenshotRoute,
  snapshotRoute,
  setViewportSizeRoute,
  waitForLoadStateRoute,
  waitForSelectorRoute,
  waitForTimeoutRoute,
  evaluateRoute,
  sendCDPRoute,
  pageActionListRoute,
  pageActionDetailsRoute,
];

/** Every page route, each passed through `withTag` with the "page" tag. */
export const pageRoutes: RouteOptions[] = rawPageRoutes.map(
  (untagged): RouteOptions => withTag(untagged, "page"),
);

/**
 * Fastify plugin that mounts all page routes.
 *
 * Installs an error handler that normalizes any thrown error via
 * `normalizePluginError` and replies with the `buildErrorResponse` envelope
 * under the normalized status code, then registers every entry of
 * `pageRoutes` and signals completion through `done`.
 */
export const pageRoutesPlugin: FastifyPluginCallback = (
  instance,
  _opts,
  done,
) => {
  instance.setErrorHandler((error, _request, reply) => {
    const normalized = normalizePluginError(error);

    return reply.status(normalized.statusCode).send(
      buildErrorResponse({
        error: normalized.errorMessage,
        statusCode: normalized.statusCode,
        stack: normalized.stack,
      }),
    );
  });

  pageRoutes.forEach((route) => {
    instance.route(route);
  });

  done();
};


================================================
FILE: packages/server-v4/src/routes/v4/page/screenshot.ts
================================================
import type { RouteOptions } from "fastify";
import { Api } from "@browserbasehq/stagehand";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  PageScreenshotActionSchema,
  PageScreenshotResultSchema,
  PageScreenshotRequestSchema,
  PageScreenshotResponseSchema,
} from "../../../schemas/v4/page.js";
import { createPageActionHandler, pageErrorResponses } from "./shared.js";

/** Validation/OpenAPI schema for `POST /page/screenshot`. */
const screenshotRouteSchema = {
  operationId: "PageScreenshot",
  summary: "page.screenshot",
  headers: Api.SessionHeadersSchema,
  body: PageScreenshotRequestSchema,
  response: {
    200: PageScreenshotResponseSchema,
    ...pageErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Stub handler for `page.screenshot`: returns a fixed base64 payload (the
 * encoding of the text "stub") and a MIME type chosen from `params.type`
 * (JPEG when it is "jpeg", PNG for anything else).
 */
const screenshotRouteHandler = createPageActionHandler({
  method: "screenshot",
  actionSchema: PageScreenshotActionSchema,
  execute: async ({ params }) => {
    const mimeType = params.type === "jpeg" ? "image/jpeg" : "image/png";
    return PageScreenshotResultSchema.parse({
      base64: "c3R1Yg==",
      mimeType,
    });
  },
});

/** Route definition for `POST /page/screenshot`. */
const screenshotRoute: RouteOptions = {
  method: "POST",
  url: "/page/screenshot",
  schema: screenshotRouteSchema,
  handler: screenshotRouteHandler,
};

export default screenshotRoute;


================================================
FILE: packages/server-v4/src/routes/v4/page/scroll.ts
================================================
import type { RouteOptions } from "fastify";
import { Api } from "@browserbasehq/stagehand";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  PageScrollActionSchema,
  PageScrollRequestSchema,
  PageScrollResponseSchema,
  PageXPathResultSchema,
} from "../../../schemas/v4/page.js";
import { createPageActionHandler, pageErrorResponses } from "./shared.js";

/** Validation/OpenAPI schema for `POST /page/scroll`. */
const scrollRouteSchema = {
  operationId: "PageScroll",
  summary: "page.scroll",
  headers: Api.SessionHeadersSchema,
  body: PageScrollRequestSchema,
  response: {
    200: PageScrollResponseSchema,
    ...pageErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Stub handler for `page.scroll`: echoes the selector's xpath when the
 * selector carries one, otherwise answers with a placeholder xpath.
 */
const scrollRouteHandler = createPageActionHandler({
  method: "scroll",
  actionSchema: PageScrollActionSchema,
  execute: async ({ params }) => {
    const { selector } = params;
    const xpath = "xpath" in selector ? selector.xpath : "xpath=//stub-scroll";
    return PageXPathResultSchema.parse({ xpath });
  },
});

/** Route definition for `POST /page/scroll`. */
const scrollRoute: RouteOptions = {
  method: "POST",
  url: "/page/scroll",
  schema: scrollRouteSchema,
  handler: scrollRouteHandler,
};

export default scrollRoute;


================================================
FILE: packages/server-v4/src/routes/v4/page/sendCDP.ts
================================================
import type { RouteOptions } from "fastify";
import { Api } from "@browserbasehq/stagehand";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  PageSendCDPActionSchema,
  PageSendCDPResultSchema,
  PageSendCDPRequestSchema,
  PageSendCDPResponseSchema,
} from "../../../schemas/v4/page.js";
import { createPageActionHandler, pageErrorResponses } from "./shared.js";

/** Validation/OpenAPI schema for `POST /page/sendCDP`. */
const sendCDPRouteSchema = {
  operationId: "PageSendCDP",
  summary: "page.sendCDP",
  headers: Api.SessionHeadersSchema,
  body: PageSendCDPRequestSchema,
  response: {
    200: PageSendCDPResponseSchema,
    ...pageErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Stub handler for `page.sendCDP`: echoes the requested CDP method and its
 * params (or `null` when none were supplied) as the result value.
 */
const sendCDPRouteHandler = createPageActionHandler({
  method: "sendCDP",
  actionSchema: PageSendCDPActionSchema,
  execute: async ({ params }) => {
    const echoedCall = {
      method: params.method,
      params: params.params ?? null,
    };
    return PageSendCDPResultSchema.parse({ value: echoedCall });
  },
});

/** Route definition for `POST /page/sendCDP`. */
const sendCDPRoute: RouteOptions = {
  method: "POST",
  url: "/page/sendCDP",
  schema: sendCDPRouteSchema,
  handler: sendCDPRouteHandler,
};

export default sendCDPRoute;


================================================
FILE: packages/server-v4/src/routes/v4/page/setExtraHTTPHeaders.ts
================================================
import type { RouteOptions } from "fastify";
import { Api } from "@browserbasehq/stagehand";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  PageSetExtraHTTPHeadersActionSchema,
  PageSetExtraHTTPHeadersResultSchema,
  PageSetExtraHTTPHeadersRequestSchema,
  PageSetExtraHTTPHeadersResponseSchema,
} from "../../../schemas/v4/page.js";
import { createPageActionHandler, pageErrorResponses } from "./shared.js";

/** Validation/OpenAPI schema for `POST /page/setExtraHTTPHeaders`. */
const setExtraHTTPHeadersRouteSchema = {
  operationId: "PageSetExtraHTTPHeaders",
  summary: "page.setExtraHTTPHeaders",
  headers: Api.SessionHeadersSchema,
  body: PageSetExtraHTTPHeadersRequestSchema,
  response: {
    200: PageSetExtraHTTPHeadersResponseSchema,
    ...pageErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/** Stub handler for `page.setExtraHTTPHeaders`: echoes the supplied headers. */
const setExtraHTTPHeadersRouteHandler = createPageActionHandler({
  method: "setExtraHTTPHeaders",
  actionSchema: PageSetExtraHTTPHeadersActionSchema,
  execute: async ({ params }) =>
    PageSetExtraHTTPHeadersResultSchema.parse({ headers: params.headers }),
});

/** Route definition for `POST /page/setExtraHTTPHeaders`. */
const setExtraHTTPHeadersRoute: RouteOptions = {
  method: "POST",
  url: "/page/setExtraHTTPHeaders",
  schema: setExtraHTTPHeadersRouteSchema,
  handler: setExtraHTTPHeadersRouteHandler,
};

export default setExtraHTTPHeadersRoute;


================================================
FILE: packages/server-v4/src/routes/v4/page/setViewportSize.ts
================================================
import type { RouteOptions } from "fastify";
import { Api } from "@browserbasehq/stagehand";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  PageSetViewportSizeActionSchema,
  PageSetViewportSizeResultSchema,
  PageSetViewportSizeRequestSchema,
  PageSetViewportSizeResponseSchema,
} from "../../../schemas/v4/page.js";
import { createPageActionHandler, pageErrorResponses } from "./shared.js";

/** Validation/OpenAPI schema for `POST /page/setViewportSize`. */
const setViewportSizeRouteSchema = {
  operationId: "PageSetViewportSize",
  summary: "page.setViewportSize",
  headers: Api.SessionHeadersSchema,
  body: PageSetViewportSizeRequestSchema,
  response: {
    200: PageSetViewportSizeResponseSchema,
    ...pageErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Stub handler for `page.setViewportSize`: echoes the requested width, height
 * and device scale factor back as the result.
 */
const setViewportSizeRouteHandler = createPageActionHandler({
  method: "setViewportSize",
  actionSchema: PageSetViewportSizeActionSchema,
  execute: async ({ params }) => {
    const { width, height, deviceScaleFactor } = params;
    return PageSetViewportSizeResultSchema.parse({
      width,
      height,
      deviceScaleFactor,
    });
  },
});

/** Route definition for `POST /page/setViewportSize`. */
const setViewportSizeRoute: RouteOptions = {
  method: "POST",
  url: "/page/setViewportSize",
  schema: setViewportSizeRouteSchema,
  handler: setViewportSizeRouteHandler,
};

export default setViewportSizeRoute;


================================================
FILE: packages/server-v4/src/routes/v4/page/shared.ts
================================================
import { randomUUID } from "node:crypto";

import type { RouteHandlerMethod } from "fastify";
import { StatusCodes } from "http-status-codes";
import { z } from "zod/v4";

import {
  type PageAction,
  PageTitleActionSchema,
  type PageActionDetailsQuery,
  type PageActionMethod,
  V4ErrorResponseSchema,
} from "../../../schemas/v4/page.js";

/**
 * Error response schemas keyed by HTTP status code. Every listed status uses
 * the same `V4ErrorResponseSchema`; page routes spread this object into their
 * `response` map next to the route-specific 200 schema.
 */
export const pageErrorResponses = {
  400: V4ErrorResponseSchema,
  401: V4ErrorResponseSchema,
  404: V4ErrorResponseSchema,
  408: V4ErrorResponseSchema,
  422: V4ErrorResponseSchema,
  500: V4ErrorResponseSchema,
};

/**
 * Body-style request input: the action parameters are nested under `params`
 * alongside the `sessionId`.
 */
type PageRequestBody<TAction extends PageAction> = {
  sessionId: string;
  params: TAction["params"];
};

/**
 * Query-style request input: the action parameters are flattened into the
 * same object as the optional action `id` and the `sessionId`.
 */
type PageRequestQuery<TAction extends PageAction> = {
  id?: string;
  sessionId: string;
} & TAction["params"];

/**
 * Argument handed to a page action's `execute` callback: the extracted action
 * params, the Fastify request object, and the resolved session id.
 */
type PageActionHandlerContext<TAction extends PageAction> = {
  params: TAction["params"];
  // First parameter type of a Fastify route handler, i.e. the request object.
  request: Parameters<RouteHandlerMethod>[0];
  sessionId: string;
};

// Selectors form a discriminated union (xpath, css, text, or coordinates).
// Only the xpath variant is fully resolved today; the other variants fall
// back to a stub xpath.

/**
 * Ensures an xpath string is in a usable form.
 *
 * @param xpath - Raw xpath expression.
 * @returns The input unchanged when it already starts with `xpath=` or `/`;
 *   otherwise the input prefixed with `xpath=`.
 */
function normalizeXPath(xpath: string): string {
  const acceptedPrefixes = ["xpath=", "/"];
  const alreadyNormalized = acceptedPrefixes.some((prefix) =>
    xpath.startsWith(prefix),
  );

  if (alreadyNormalized) {
    return xpath;
  }

  return `xpath=${xpath}`;
}

/**
 * Resolves the page id for an action from its params.
 *
 * @param params - Arbitrary action params; only inspected, never mutated.
 * @returns `params.pageId` when `params` is a non-null object whose `pageId`
 *   is a string (including the empty string); otherwise the placeholder
 *   `"page_stub"`. The function always yields a string, so the return type is
 *   `string` rather than `string | undefined`.
 */
export function getPageId(params: unknown): string {
  if (typeof params === "object" && params !== null && "pageId" in params) {
    const { pageId } = params as { pageId?: unknown };
    if (typeof pageId === "string") {
      return pageId;
    }
  }

  // No usable page id was supplied; fall back to the stub identifier.
  return "page_stub";
}

/**
 * Builds a placeholder frame descriptor for stubbed responses.
 *
 * @param pageId - Page the frame belongs to; defaults to `"page_stub"`.
 * @returns A frame object with fixed stub frame/session ids, the given page
 *   id, and `isBrowserRemote` set to `false`.
 */
export function buildStubPageFrame(pageId = "page_stub") {
  const stubFrame = {
    frameId: "frame_stub",
    pageId,
    sessionId: "cdp-session_stub",
    isBrowserRemote: false,
  };

  return stubFrame;
}

/**
 * Builds a placeholder "navigation succeeded" result for stubbed responses.
 *
 * @param url - URL to report as both the final page URL and the response
 *   URL; defaults to `"https://stub.invalid"`.
 * @returns An object holding the URL and a 200/"OK" response with no headers.
 */
export function buildStubNavigationResult(url = "https://stub.invalid") {
  const response = {
    url,
    status: 200,
    statusText: "OK",
    ok: true,
    headers: {},
  };

  return { url, response };
}

/**
 * Pulls the action params out of either request shape.
 *
 * Body-style input carries them under `params` and they are returned as-is.
 * Query-style input has them flattened next to `id` and `sessionId`, so a
 * shallow copy is made and those two envelope keys are removed from it; the
 * original input object is left untouched.
 */
function extractPageParams<TAction extends PageAction>(
  input: PageRequestBody<TAction> | PageRequestQuery<TAction>,
): TAction["params"] {
  if ("params" in input) {
    return input.params;
  }

  const flattened = { ...input };
  for (const envelopeKey of ["id", "sessionId"] as const) {
    delete (flattened as { id?: string; sessionId?: string })[envelopeKey];
  }
  return flattened as TAction["params"];
}

/**
 * Builds a Fastify handler for a page action.
 *
 * The returned handler:
 * 1. reads the input from the request body, or from the query string when the
 *    body is null/undefined;
 * 2. resolves the session id (falling back to `"session_stub"`) and extracts
 *    the action params;
 * 3. awaits `options.execute` to obtain the action result;
 * 4. validates a "completed" action record with `options.actionSchema`, using
 *    the caller-supplied `id` when present or a fresh UUID otherwise, and a
 *    single timestamp for created/updated/completed;
 * 5. replies 200 with `{ success: true, error: null, action }`.
 *
 * Errors thrown by `execute` or by schema parsing propagate to the caller.
 */
export function createPageActionHandler<TAction extends PageAction>(options: {
  actionSchema: z.ZodType<TAction>;
  execute: (
    ctx: PageActionHandlerContext<TAction>,
  ) => Promise<TAction["result"]>;
  method: PageActionMethod;
}): RouteHandlerMethod {
  const { actionSchema, method } = options;

  return async (request, reply) => {
    const input = (request.body ?? request.query) as
      | PageRequestBody<TAction>
      | PageRequestQuery<TAction>;
    const sessionId = input.sessionId ?? "session_stub";
    const params = extractPageParams(input);

    const result = await options.execute({ params, request, sessionId });

    // The stub completes instantly, so one timestamp serves every date field.
    const timestamp = new Date().toISOString();
    const requestedId = "id" in input ? input.id : undefined;
    const action = actionSchema.parse({
      id: requestedId ?? randomUUID(),
      method,
      status: "completed",
      sessionId,
      pageId: getPageId(params),
      createdAt: timestamp,
      updatedAt: timestamp,
      completedAt: timestamp,
      error: null,
      params,
      result,
    });

    const payload = { success: true, error: null, action };
    return reply.status(StatusCodes.OK).send(payload);
  };
}

/**
 * Stub handler for fetching a single page action.
 *
 * Ignores any stored state and always answers 200 with a completed `title`
 * action whose id is the `actionId` route param and whose session id comes
 * from the query string.
 */
export const pageActionDetailsHandler: RouteHandlerMethod = async (
  request,
  reply,
) => {
  const routeParams = request.params as { actionId: string };
  const query = request.query as PageActionDetailsQuery;
  const id = routeParams.actionId;
  const sessionId = query.sessionId;
  const timestamp = new Date().toISOString();

  const action = PageTitleActionSchema.parse({
    id,
    method: "title",
    status: "completed",
    sessionId,
    pageId: "page_stub",
    createdAt: timestamp,
    updatedAt: timestamp,
    completedAt: timestamp,
    error: null,
    params: {},
    result: { title: "Stub title" },
  });

  const payload = { success: true, error: null, action };
  return reply.status(StatusCodes.OK).send(payload);
};

/**
 * Stub handler for listing page actions.
 *
 * Always answers 200 with a one-element list holding a completed `title`
 * action that has a freshly generated id and the session id from the query
 * string.
 */
export const pageActionListHandler: RouteHandlerMethod = async (
  request,
  reply,
) => {
  const query = request.query as PageActionDetailsQuery;
  const timestamp = new Date().toISOString();

  const stubAction = PageTitleActionSchema.parse({
    id: randomUUID(),
    method: "title",
    status: "completed",
    sessionId: query.sessionId,
    pageId: "page_stub",
    createdAt: timestamp,
    updatedAt: timestamp,
    completedAt: timestamp,
    error: null,
    params: {},
    result: { title: "Stub title" },
  });

  return reply.status(StatusCodes.OK).send({
    success: true,
    error: null,
    actions: [stubAction] as PageAction[],
  });
};

export { normalizeXPath };


================================================
FILE: packages/server-v4/src/routes/v4/page/snapshot.ts
================================================
import type { RouteOptions } from "fastify";
import { Api } from "@browserbasehq/stagehand";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  PageSnapshotActionSchema,
  PageSnapshotResultSchema,
  PageSnapshotRequestSchema,
  PageSnapshotResponseSchema,
} from "../../../schemas/v4/page.js";
import { createPageActionHandler, pageErrorResponses } from "./shared.js";

/** Validation/OpenAPI schema for `POST /page/snapshot`. */
const snapshotRouteSchema = {
  operationId: "PageSnapshot",
  summary: "page.snapshot",
  headers: Api.SessionHeadersSchema,
  body: PageSnapshotRequestSchema,
  response: {
    200: PageSnapshotResponseSchema,
    ...pageErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Stub handler for `page.snapshot`: always returns the same placeholder tree
 * with single-entry xpath and URL maps.
 */
const snapshotRouteHandler = createPageActionHandler({
  method: "snapshot",
  actionSchema: PageSnapshotActionSchema,
  execute: async () =>
    PageSnapshotResultSchema.parse({
      formattedTree: "stub tree",
      xpathMap: { stub: "//html" },
      urlMap: { stub: "https://stub.invalid" },
    }),
});

/** Route definition for `POST /page/snapshot`. */
const snapshotRoute: RouteOptions = {
  method: "POST",
  url: "/page/snapshot",
  schema: snapshotRouteSchema,
  handler: snapshotRouteHandler,
};

export default snapshotRoute;


================================================
FILE: packages/server-v4/src/routes/v4/page/targetId.ts
================================================
import type { RouteOptions } from "fastify";
import { Api } from "@browserbasehq/stagehand";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  PageTargetIdActionSchema,
  PageTargetIdResultSchema,
  PageTargetIdRequestSchema,
  PageTargetIdResponseSchema,
} from "../../../schemas/v4/page.js";
import {
  createPageActionHandler,
  getPageId,
  pageErrorResponses,
} from "./shared.js";

/** Validation/OpenAPI schema for `GET /page/targetId`. */
const targetIdRouteSchema = {
  operationId: "PageTargetId",
  summary: "page.targetId",
  headers: Api.SessionHeadersSchema,
  querystring: PageTargetIdRequestSchema,
  response: {
    200: PageTargetIdResponseSchema,
    ...pageErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Stub handler for `page.targetId`: reports the resolved page id as the
 * target id.
 */
const targetIdRouteHandler = createPageActionHandler({
  method: "targetId",
  actionSchema: PageTargetIdActionSchema,
  execute: async ({ params }) => {
    const targetId = getPageId(params);
    return PageTargetIdResultSchema.parse({ targetId });
  },
});

/** Route definition for `GET /page/targetId`. */
const targetIdRoute: RouteOptions = {
  method: "GET",
  url: "/page/targetId",
  schema: targetIdRouteSchema,
  handler: targetIdRouteHandler,
};

export default targetIdRoute;


================================================
FILE: packages/server-v4/src/routes/v4/page/title.ts
================================================
import type { RouteOptions } from "fastify";
import { Api } from "@browserbasehq/stagehand";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  PageTitleActionSchema,
  PageTitleResultSchema,
  PageTitleRequestSchema,
  PageTitleResponseSchema,
} from "../../../schemas/v4/page.js";
import { createPageActionHandler, pageErrorResponses } from "./shared.js";

/** Validation/OpenAPI schema for `GET /page/title`. */
const titleRouteSchema = {
  operationId: "PageTitle",
  summary: "page.title",
  headers: Api.SessionHeadersSchema,
  querystring: PageTitleRequestSchema,
  response: {
    200: PageTitleResponseSchema,
    ...pageErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/** Stub handler for `page.title`: always reports the fixed stub title. */
const titleRouteHandler = createPageActionHandler({
  method: "title",
  actionSchema: PageTitleActionSchema,
  execute: async () => PageTitleResultSchema.parse({ title: "Stub title" }),
});

/** Route definition for `GET /page/title`. */
const titleRoute: RouteOptions = {
  method: "GET",
  url: "/page/title",
  schema: titleRouteSchema,
  handler: titleRouteHandler,
};

export default titleRoute;


================================================
FILE: packages/server-v4/src/routes/v4/page/type.ts
================================================
import type { RouteOptions } from "fastify";
import { Api } from "@browserbasehq/stagehand";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  PageTypeActionSchema,
  PageTypeResultSchema,
  PageTypeRequestSchema,
  PageTypeResponseSchema,
} from "../../../schemas/v4/page.js";
import { createPageActionHandler, pageErrorResponses } from "./shared.js";

/** Validation/OpenAPI schema for `POST /page/type`. */
const typeRouteSchema = {
  operationId: "PageType",
  summary: "page.type",
  headers: Api.SessionHeadersSchema,
  body: PageTypeRequestSchema,
  response: {
    200: PageTypeResponseSchema,
    ...pageErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/** Stub handler for `page.type`: echoes the text that was asked to be typed. */
const typeRouteHandler = createPageActionHandler({
  method: "type",
  actionSchema: PageTypeActionSchema,
  execute: async ({ params }) =>
    PageTypeResultSchema.parse({ text: params.text }),
});

/** Route definition for `POST /page/type`. */
const typeRoute: RouteOptions = {
  method: "POST",
  url: "/page/type",
  schema: typeRouteSchema,
  handler: typeRouteHandler,
};

export default typeRoute;


================================================
FILE: packages/server-v4/src/routes/v4/page/url.ts
================================================
import type { RouteOptions } from "fastify";
import { Api } from "@browserbasehq/stagehand";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  PageUrlActionSchema,
  PageUrlResultSchema,
  PageUrlRequestSchema,
  PageUrlResponseSchema,
} from "../../../schemas/v4/page.js";
import {
  createPageActionHandler,
  getPageId,
  pageErrorResponses,
} from "./shared.js";

/** Validation/OpenAPI schema for `GET /page/url`. */
const urlRouteSchema = {
  operationId: "PageUrl",
  summary: "page.url",
  headers: Api.SessionHeadersSchema,
  querystring: PageUrlRequestSchema,
  response: {
    200: PageUrlResponseSchema,
    ...pageErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Stub handler for `page.url`: reports a placeholder URL derived from the
 * resolved page id.
 */
const urlRouteHandler = createPageActionHandler({
  method: "url",
  actionSchema: PageUrlActionSchema,
  execute: async ({ params }) => {
    const url = `https://stub.invalid/${getPageId(params)}`;
    return PageUrlResultSchema.parse({ url });
  },
});

/** Route definition for `GET /page/url`. */
const urlRoute: RouteOptions = {
  method: "GET",
  url: "/page/url",
  schema: urlRouteSchema,
  handler: urlRouteHandler,
};

export default urlRoute;


================================================
FILE: packages/server-v4/src/routes/v4/page/waitForLoadState.ts
================================================
import type { RouteOptions } from "fastify";
import { Api } from "@browserbasehq/stagehand";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  PageWaitForLoadStateActionSchema,
  PageWaitForLoadStateResultSchema,
  PageWaitForLoadStateRequestSchema,
  PageWaitForLoadStateResponseSchema,
} from "../../../schemas/v4/page.js";
import { createPageActionHandler, pageErrorResponses } from "./shared.js";

/** Validation/OpenAPI schema for `POST /page/waitForLoadState`. */
const waitForLoadStateRouteSchema = {
  operationId: "PageWaitForLoadState",
  summary: "page.waitForLoadState",
  headers: Api.SessionHeadersSchema,
  body: PageWaitForLoadStateRequestSchema,
  response: {
    200: PageWaitForLoadStateResponseSchema,
    ...pageErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Stub handler for `page.waitForLoadState`: does not wait; echoes the
 * requested load state back immediately.
 */
const waitForLoadStateRouteHandler = createPageActionHandler({
  method: "waitForLoadState",
  actionSchema: PageWaitForLoadStateActionSchema,
  execute: async ({ params }) =>
    PageWaitForLoadStateResultSchema.parse({ state: params.state }),
});

/** Route definition for `POST /page/waitForLoadState`. */
const waitForLoadStateRoute: RouteOptions = {
  method: "POST",
  url: "/page/waitForLoadState",
  schema: waitForLoadStateRouteSchema,
  handler: waitForLoadStateRouteHandler,
};

export default waitForLoadStateRoute;


================================================
FILE: packages/server-v4/src/routes/v4/page/waitForMainLoadState.ts
================================================
import type { RouteOptions } from "fastify";
import { Api } from "@browserbasehq/stagehand";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  PageWaitForMainLoadStateActionSchema,
  PageWaitForLoadStateResultSchema,
  PageWaitForMainLoadStateRequestSchema,
  PageWaitForMainLoadStateResponseSchema,
} from "../../../schemas/v4/page.js";
import { createPageActionHandler, pageErrorResponses } from "./shared.js";

/** Validation/OpenAPI schema for `POST /page/waitForMainLoadState`. */
const waitForMainLoadStateRouteSchema = {
  operationId: "PageWaitForMainLoadState",
  summary: "page.waitForMainLoadState",
  headers: Api.SessionHeadersSchema,
  body: PageWaitForMainLoadStateRequestSchema,
  response: {
    200: PageWaitForMainLoadStateResponseSchema,
    ...pageErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Stub handler for `page.waitForMainLoadState`: does not wait; echoes the
 * requested load state back immediately. The result is validated with the
 * same result schema that `waitForLoadState` uses.
 */
const waitForMainLoadStateRouteHandler = createPageActionHandler({
  method: "waitForMainLoadState",
  actionSchema: PageWaitForMainLoadStateActionSchema,
  execute: async ({ params }) =>
    PageWaitForLoadStateResultSchema.parse({ state: params.state }),
});

/** Route definition for `POST /page/waitForMainLoadState`. */
const waitForMainLoadStateRoute: RouteOptions = {
  method: "POST",
  url: "/page/waitForMainLoadState",
  schema: waitForMainLoadStateRouteSchema,
  handler: waitForMainLoadStateRouteHandler,
};

export default waitForMainLoadStateRoute;


================================================
FILE: packages/server-v4/src/routes/v4/page/waitForSelector.ts
================================================
import type { RouteOptions } from "fastify";
import { Api } from "@browserbasehq/stagehand";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  PageWaitForSelectorActionSchema,
  PageWaitForSelectorResultSchema,
  PageWaitForSelectorRequestSchema,
  PageWaitForSelectorResponseSchema,
} from "../../../schemas/v4/page.js";
import { createPageActionHandler, pageErrorResponses } from "./shared.js";

/** Validation/OpenAPI schema for `POST /page/waitForSelector`. */
const waitForSelectorRouteSchema = {
  operationId: "PageWaitForSelector",
  summary: "page.waitForSelector",
  headers: Api.SessionHeadersSchema,
  body: PageWaitForSelectorRequestSchema,
  response: {
    200: PageWaitForSelectorResponseSchema,
    ...pageErrorResponses,
  },
} satisfies FastifyZodOpenApiSchema;

/**
 * Stub handler for `page.waitForSelector`: does not wait; echoes the selector
 * and always reports it as matched.
 */
const waitForSelectorRouteHandler = createPageActionHandler({
  method: "waitForSelector",
  actionSchema: PageWaitForSelectorActionSchema,
  execute: async ({ params }) => {
    const { selector } = params;
    return PageWaitForSelectorResultSchema.parse({ selector, matched: true });
  },
});

/** Route definition for `POST /page/waitForSelector`. */
const waitForSelectorRoute: RouteOptions = {
  method: "POST",
  url: "/page/waitForSelector",
  schema: waitForSelectorRouteSchema,
  handler: waitForSelectorRouteHandler,
};

export default waitForSelectorRoute;


================================================
FILE: packages/server-v4/src/routes/v4/page/waitForTimeout.ts
================================================
import type { RouteOptions } from "fastify";
import { Api } from "@browserbasehq/stagehand";
import type { FastifyZodOpenApiSchema } from "fastify-zod-openapi";

import {
  PageWaitForTimeoutActionSchema,
  PageWaitForTimeoutResultSchema,
  PageWaitForTimeoutRequestSchema,
  PageWaitForTimeoutResponseSchema,
} from "../../../schemas/v4/page.js";
import { createPageActionHandler, pageErrorResponses } from "./shared.js";

/**
 * POST /page/waitForTimeout route definition.
 *
 * Request headers, body and the 200 response are validated against the
 * session-header and PageWaitForTimeout schemas; error responses come from
 * the shared `pageErrorResponses` map.
 *
 * NOTE(review): the `execute` callback in this file only echoes the requested
 * `ms` value; whether the actual delay is applied inside
 * `createPageActionHandler` cannot be determined from here — confirm.
 */
const waitForTimeoutRoute: RouteOptions = {
  method: "POST",
  url: "/page/waitForTimeout",
  schema: {
    operationId: "PageWaitForTimeout",
    summary: "page.waitForTimeout",
    headers: Api.SessionHeadersSchema,
    body: PageWaitForTimeoutRequestSchema,
    response: {
      200: PageWaitForTimeoutResponseSchema,
      ...pageErrorResponses,
    },
  } satisfies FastifyZodOpenApiSchema,
  handler: createPageActionHandler({
    method: "waitForTimeout",
    actionSchema: PageWaitForTimeoutActionSchema,
    execute: async ({ params }) => {
      // Validate the result payload before handing it back to the handler.
      const { ms } = params;
      return PageWaitForTimeoutResultSchema.parse({ ms });
    },
  }),
};

export default waitForTimeoutRoute;


================================================
FILE: packages/server-v4/src/routes/v4/pluginUtils.ts
================================================
import type { RouteOptions } from "fastify";
import { ResponseSerializationError } from "fastify-zod-openapi";
import { StatusCodes } from "http-status-codes";

/**
 * A route schema (the non-nullable `schema` of Fastify's `RouteOptions`)
 * widened with an optional `tags` string array, so tags can be read and
 * written without further casts.
 */
type TaggedRouteSchema = NonNullable<RouteOptions["schema"]> & {
  tags?: string[];
};

/** Minimal structural shape of an error that carries a `validation` array. */
type ValidationLikeError = {
  validation: unknown[];
};

/**
 * Type guard: true when `error` is a non-null object exposing a `validation`
 * property (own or inherited) whose value is an array.
 */
function isValidationLikeError(error: unknown): error is ValidationLikeError {
  // Primitives, functions and null can never match.
  if (typeof error !== "object" || error === null) {
    return false;
  }

  if (!("validation" in error)) {
    return false;
  }

  const candidate = (error as { validation?: unknown }).validation;
  return Array.isArray(candidate);
}

/**
 * Extracts an HTTP error status code from an arbitrary thrown value.
 *
 * The `statusCode` property is only honoured when it is an integer in the
 * 400–599 range. Anything else (missing property, non-number, NaN, Infinity,
 * fractional values, codes below 400 or above 599) falls back to
 * 500 Internal Server Error, so the caller never receives a value that is
 * not a valid error status.
 *
 * @param error - The thrown value; may be anything.
 * @returns A 4xx/5xx integer status code.
 */
function getErrorStatusCode(error: unknown): number {
  if (typeof error === "object" && error !== null && "statusCode" in error) {
    const { statusCode } = error as { statusCode?: unknown };

    // `typeof NaN === "number"`, so an integer/range check is required on top
    // of the type check to reject unusable values.
    if (
      typeof statusCode === "number" &&
      Number.isInteger(statusCode) &&
      statusCode >= 400 &&
      statusCode <= 599
    ) {
      return statusCode;
    }
  }

  return StatusCodes.INTERNAL_SERVER_ERROR;
}

/**
 * Returns a copy of `route` whose schema includes `tag` in its `tags` list.
 *
 * - Routes without a schema are returned unchanged (same reference).
 * - If the tag is already present, the existing `tags` array is reused as-is.
 * - Otherwise a new array with `tag` appended is used; the input route and
 *   its schema are never mutated.
 *
 * @param route - The route definition to tag.
 * @param tag - The tag to ensure is present.
 * @returns The original route (no schema) or a shallow copy with updated tags.
 */
export function withTag(route: RouteOptions, tag: string): RouteOptions {
  const currentSchema = route.schema as TaggedRouteSchema | undefined;
  if (!currentSchema) {
    return route;
  }

  const existingTags = currentSchema.tags ?? [];
  const alreadyTagged = existingTags.includes(tag);
  const nextTags = alreadyTagged ? existingTags : [...existingTags, tag];

  const taggedSchema = { ...currentSchema, tags: nextTags };
  return { ...route, schema: taggedSchema };
}

/**
 * Converts any thrown value into a uniform `{ errorMessage, stack, statusCode }`
 * record.
 *
 * Resolution order:
 * 1. Validation-like errors (objects with a `validation` array) map to
 *    400 with a fixed message and no stack.
 * 2. `ResponseSerializationError` maps to 500 with a fixed message and the
 *    error's stack.
 * 3. Everything else uses the error's own message/stack (non-`Error` values
 *    are wrapped via `new Error(String(value))`) and the status code derived
 *    by `getErrorStatusCode` from the original value.
 *
 * @param error - The thrown value; may be anything.
 * @returns The normalized error description.
 */
export function normalizePluginError(error: unknown): {
  errorMessage: string;
  stack: string | null;
  statusCode: number;
} {
  if (isValidationLikeError(error)) {
    const statusCode = StatusCodes.BAD_REQUEST;
    return { errorMessage: "Request validation failed", stack: null, statusCode };
  }

  if (error instanceof ResponseSerializationError) {
    const stack = error.stack ?? null;
    const statusCode = StatusCodes.INTERNAL_SERVER_ERROR;
    return { errorMessage: "Response validation failed", stack, statusCode };
  }

  // Wrap non-Error throwables so message and stack are always available.
  let wrapped: Error;
  if (error instanceof Error) {
    wrapped = error;
  } else {
    wrapped = new Error(String(error));
  }

  const errorMessage = wrapped.message;
  const stack = wrapped.stack ?? null;
  // The status code is read from the original value, not the wrapper.
  const statusCode = getErrorStatusCode(error);

  return { errorMessage, stack, statusCode };
}


================================================
FILE: packages/server-v4/src/schemas/v4/browserSession.ts
================================================
import { z } from "zod/v4";
import { Api } from "@browserbasehq/stagehand";
import {
  ActionIdSchema,
  FrameIdSchema,
  PageHeadersSchema,
  PageIdSchema,
  PageInitScriptSchema,
  RequestIdSchema,
  TimestampSchema,
} from "./page.js";

/** Browser session identifier: any non-empty string. */
export const BrowserSessionIdSchema = z
  .string()
  .min(1)
  .meta({ id: "BrowserSessionId", example: "session_01JXAMPLE" });

/** Environment a browser session runs in: "LOCAL" or "BROWSERBASE". */
export const BrowserSessionEnvSchema = z
  .enum(["LOCAL", "BROWSERBASE"])
  .meta({ id: "BrowserSessionEnv" });

/** Lifecycle status of a browser session: "running" or "ended". */
export const BrowserSessionStatusSchema = z
  .enum(["running", "ended"])
  .meta({ id: "BrowserSessionStatus" });

/** The shared session headers schema, re-registered under its own OpenAPI id. */
export const BrowserSessionHeadersSchema = Api.SessionHeadersSchema.meta({
  id: "BrowserSessionHeaders",
});

/** Error envelope with `success: false` and a message; unknown keys are rejected. */
export const BrowserSessionErrorResponseSchema = z
  .object({
    success: z.literal(false),
    message: z.string(),
  })
  .strict()
  .meta({ id: "BrowserSessionErrorResponse" });

/**
 * Fields shared by every session-create request, regardless of environment.
 * Only `modelName` is required; all tuning options are optional. The object
 * is strict, so unknown keys are rejected.
 */
const BrowserSessionCommonSchema = z
  .object({
    modelName: z.string().meta({
      description: "Model name to use for AI operations",
      example: "openai/gpt-4.1-nano",
    }),
    domSettleTimeoutMs: z.number().optional(),
    // Verbosity is restricted to the literal levels 0, 1 or 2.
    verbose: z.union([z.literal(0), z.literal(1), z.literal(2)]).optional(),
    systemPrompt: z.string().optional(),
    selfHeal: z.boolean().optional(),
    waitForCaptchaSolves: z.boolean().optional(),
    experimental: z.boolean().optional(),
    actTimeoutMs: z.number().optional(),
  })
  .strict();

/**
 * Create-request shape for a LOCAL browser session.
 *
 * Extends the common create fields with the `env: "LOCAL"` discriminator and
 * two optional connection options. A cross-field check requires at least one
 * of `cdpUrl` or `localBrowserLaunchOptions` to be provided (an empty-string
 * `cdpUrl` counts as missing because the check is truthiness-based).
 */
const BrowserSessionLocalCreateSchema = BrowserSessionCommonSchema.extend({
  env: z.literal("LOCAL"),
  cdpUrl: z.string().optional(),
  localBrowserLaunchOptions: Api.LocalBrowserLaunchOptionsSchema.optional(),
})
  .strict()
  .superRefine((value, ctx) => {
    if (!value.cdpUrl && !value.localBrowserLaunchOptions) {
      ctx.addIssue({
        // String literal issue code; `z.ZodIssueCode` is deprecated in Zod 4.
        code: "custom",
        // Attach the issue to one of the two fields so clients get a path.
        path: ["localBrowserLaunchOptions"],
        message:
          "When env is LOCAL, provide either cdpUrl or localBrowserLaunchOptions.",
      });
    }
  })
  .meta({ id: "BrowserSessionLocalCreateRequest" });

/**
 * Create-request shape for a BROWSERBASE browser session: the common create
 * fields plus the `env: "BROWSERBASE"` discriminator, an optional existing
 * Browserbase session id and optional session-create parameters.
 */
const BrowserSessionBrowserbaseCreateSchema = BrowserSessionCommonSchema.extend(
  {
    env: z.literal("BROWSERBASE"),
    browserbaseSessionId: z.string().optional(),
    browserbaseSessionCreateParams:
      Api.BrowserbaseSessionCreateParamsSchema.optional(),
  },
)
  .strict()
  .meta({ id: "BrowserSessionBrowserbaseCreateRequest" });

/**
 * Session-create request body: a union discriminated on `env`, accepting
 * either the LOCAL or the BROWSERBASE variant.
 */
export const BrowserSessionCreateRequestSchema = z
  .discriminatedUnion("env", [
    BrowserSessionLocalCreateSchema,
    BrowserSessionBrowserbaseCreateSchema,
  ])
  .meta({ id: "BrowserSessionCreateRequest" });

/** Parameter object carrying a single browser session `id`. */
export const BrowserSessionIdParamsSchema = z
  .object({
    id: BrowserSessionIdSchema,
  })
  .strict()
  .meta({ id: "BrowserSessionIdParams" });

/** End-session request body: either omitted entirely or an empty object. */
export const BrowserSessionEndRequestSchema = z
  .object({})
  .strict()
  .optional()
  .meta({ id: "BrowserSessionEndRequest" });

/**
 * Representation of a browser session as returned to clients: identity, env,
 * status, model name and availability are required; connection details and
 * the tuning options mirror the optional create-request fields.
 */
export const BrowserSessionSchema = z
  .object({
    id: BrowserSessionIdSchema,
    env: BrowserSessionEnvSchema,
    status: BrowserSessionStatusSchema,
    modelName: z.string(),
    // May be a string, null, or absent.
    cdpUrl: z.string().nullish(),
    available: z.boolean(),
    browserbaseSessionId: z.string().optional(),
    browserbaseSessionCreateParams:
      Api.BrowserbaseSessionCreateParamsSchema.optional(),
    localBrowserLaunchOptions: Api.LocalBrowserLaunchOptionsSchema.optional(),
    domSettleTimeoutMs: z.number().optional(),
    verbose: z.union([z.literal(0), z.literal(1), z.literal(2)]).optional(),
    systemPrompt: z.string().optional(),
    selfHeal: z.boolean().optional(),
    waitForCaptchaSolves: z.boolean().optional(),
    experimental: z.boolean().optional(),
    actTimeoutMs: z.number().optional(),
  })
  .strict()
  .meta({ id: "BrowserSession" });

/** Result payload wrapping a single browser session. */
export const BrowserSessionResultSchema = z
  .object({
    browserSession: BrowserSessionSchema,
  })
  .strict()
  .meta({ id: "BrowserSessionResult" });

/** Success envelope (`success: true`) whose `data` is a session result. */
export const BrowserSessionResponseSchema = z
  .object({
    success: z.literal(true),
    data: BrowserSessionResultSchema,
  })
  .strict()
  .meta({ id: "BrowserSessionResponse" });

/**
 * Names of all browser-session action methods. Each value is used as the
 * `method` literal of exactly one per-method action schema in this file.
 */
export const BrowserSessionActionMethodSchema = z
  .enum([
    "addInitScript",
    "setExtraHTTPHeaders",
    "pages",
    "activePage",
    "awaitActivePage",
    "resolvePageByMainFrameId",
    "getFullFrameTreeByMainFrameId",
    "newPage",
    "cookies",
    "addCookies",
    "clearCookies",
    "connectURL",
    "configuredViewport",
    "browserbaseSessionID",
    "browserbaseSessionURL",
    "browserbaseDebugURL",
    "isBrowserbase",
    "isAdvancedStealth",
    "setViewportSize",
    "close",
  ])
  .meta({ id: "BrowserSessionActionMethod" });

/** Status values an action record can carry. */
export const BrowserSessionActionStatusSchema = z
  .enum(["queued", "running", "completed", "failed", "canceled"])
  .meta({ id: "BrowserSessionActionStatus" });

/**
 * Description of a page within a session: page id, target id, main frame id
 * and URL.
 * NOTE(review): `targetId` is validated with `PageIdSchema` — confirm that
 * target ids are meant to share the page-id format.
 */
export const BrowserSessionPageSchema = z
  .object({
    pageId: PageIdSchema,
    targetId: PageIdSchema,
    mainFrameId: FrameIdSchema,
    url: z.string(),
  })
  .strict()
  .meta({ id: "BrowserSessionPage" });

/** A cookie as returned by the API; every field is required. */
export const BrowserSessionCookieSchema = z
  .object({
    name: z.string(),
    value: z.string(),
    domain: z.string(),
    path: z.string(),
    expires: z.number(),
    httpOnly: z.boolean(),
    secure: z.boolean(),
    sameSite: z.enum(["Strict", "Lax", "None"]),
  })
  .strict()
  .meta({ id: "BrowserSessionCookie" });

/**
 * A cookie as supplied by a client when adding cookies: only `name` and
 * `value` are required, all other attributes (including `url`) are optional.
 */
export const BrowserSessionCookieParamSchema = z
  .object({
    name: z.string(),
    value: z.string(),
    url: z.string().optional(),
    domain: z.string().optional(),
    path: z.string().optional(),
    expires: z.number().optional(),
    httpOnly: z.boolean().optional(),
    secure: z.boolean().optional(),
    sameSite: z.enum(["Strict", "Lax", "None"]).optional(),
  })
  .strict()
  .meta({ id: "BrowserSessionCookieParam" });

/** JSON-serializable regular expression: pattern `source` plus optional `flags`. */
export const BrowserSessionRegexSchema = z
  .object({
    source: z.string(),
    flags: z.string().optional(),
  })
  .strict()
  .meta({ id: "BrowserSessionRegex" });

/** A match pattern given either as a plain string or as a serialized regex. */
export const BrowserSessionStringPatternSchema = z
  .union([z.string(), BrowserSessionRegexSchema])
  .meta({ id: "BrowserSessionStringPattern" });

/** Optional name/domain/path patterns used as options when clearing cookies. */
export const BrowserSessionClearCookiesOptionsSchema = z
  .object({
    name: BrowserSessionStringPatternSchema.optional(),
    domain: BrowserSessionStringPatternSchema.optional(),
    path: BrowserSessionStringPatternSchema.optional(),
  })
  .strict()
  .meta({ id: "BrowserSessionClearCookiesOptions" });

/**
 * Viewport dimensions: positive `width` and `height`, with an optional
 * positive `deviceScaleFactor`. Values are not restricted to integers.
 */
export const BrowserSessionViewportSchema = z
  .object({
    width: z.number().positive(),
    height: z.number().positive(),
    deviceScaleFactor: z.number().positive().optional(),
  })
  .strict()
  .meta({ id: "BrowserSessionViewport" });

/**
 * Base of every action request body: an optional request `id` and the
 * required `sessionId`. Per-method request schemas extend this with `params`.
 */
const BrowserSessionBodySchema = z
  .object({
    id: RequestIdSchema.optional(),
    sessionId: BrowserSessionIdSchema,
  })
  .strict();

/**
 * Fields common to every action record: identity, method, status, owning
 * session, optional page, timestamps and a nullable error string. Per-method
 * action schemas extend this with a literal `method`, `params` and `result`.
 */
const BrowserSessionActionBaseSchema = z
  .object({
    id: ActionIdSchema,
    method: BrowserSessionActionMethodSchema,
    status: BrowserSessionActionStatusSchema,
    sessionId: BrowserSessionIdSchema,
    pageId: PageIdSchema.optional(),
    createdAt: TimestampSchema,
    updatedAt: TimestampSchema,
    completedAt: TimestampSchema.optional(),
    // Always present on the record; null when there is no error text.
    error: z.string().nullable(),
  })
  .strict()
  .meta({ id: "BrowserSessionActionBase" });

/**
 * Builds a request-body schema for one action method.
 *
 * @param id - Identifier attached to the resulting schema via `.meta({ id })`.
 * @param params - Schema for the method-specific `params` field.
 * @returns `BrowserSessionBodySchema` extended with `params`, tagged with `id`.
 */
function createBrowserSessionRequestSchema<T extends z.ZodTypeAny>(
  id: string,
  params: T,
) {
  const requestSchema = BrowserSessionBodySchema.extend({ params });
  return requestSchema.meta({ id });
}

/**
 * Builds the action-record schema for one action method.
 *
 * The base action schema is extended so that `method` is narrowed to the
 * given literal, `params` uses the supplied schema, and `result` is the
 * supplied schema made nullable.
 *
 * @param id - Identifier attached to the resulting schema via `.meta({ id })`.
 * @param method - The method name used as the `method` literal.
 * @param params - Schema for the action's `params`.
 * @param result - Schema for the action's `result` (null is also accepted).
 * @returns The extended action schema, tagged with `id`.
 */
function createBrowserSessionActionSchema<
  TMethod extends BrowserSessionActionMethod,
  TParams extends z.ZodTypeAny,
  TResult extends z.ZodTypeAny,
>(id: string, method: TMethod, params: TParams, result: TResult) {
  const methodLiteral = z.literal(method);
  const nullableResult = result.nullable();

  const actionSchema = BrowserSessionActionBaseSchema.extend({
    method: methodLiteral,
    params,
    result: nullableResult,
  });

  return actionSchema.meta({ id });
}

/**
 * Builds the success-response envelope for one action method.
 *
 * @param id - Identifier attached to the resulting schema via `.meta({ id })`.
 * @param action - Schema of the action record carried in the response.
 * @returns A strict object schema `{ success: true, error: null, action }`,
 *   tagged with `id`.
 */
function createBrowserSessionResponseSchema<T extends z.ZodTypeAny>(
  id: string,
  action: T,
) {
  const envelope = z
    .object({
      success: z.literal(true),
      error: z.null(),
      action,
    })
    .strict();

  return envelope.meta({ id });
}

// ---------------------------------------------------------------------------
// Per-method `params` schemas. Methods that take no arguments use an empty
// strict object, so any supplied key is rejected.
// ---------------------------------------------------------------------------

/** Params for `addInitScript`: the init script to add. */
export const BrowserSessionAddInitScriptParamsSchema = z
  .object({
    script: PageInitScriptSchema,
  })
  .strict()
  .meta({ id: "BrowserSessionAddInitScriptParams" });

/** Params for `setExtraHTTPHeaders`: the headers to set. */
export const BrowserSessionSetExtraHTTPHeadersParamsSchema = z
  .object({
    headers: PageHeadersSchema,
  })
  .strict()
  .meta({ id: "BrowserSessionSetExtraHTTPHeadersParams" });

/** Params for `pages`: none. */
export const BrowserSessionPagesParamsSchema = z
  .object({})
  .strict()
  .meta({ id: "BrowserSessionPagesParams" });

/** Params for `activePage`: none. */
export const BrowserSessionActivePageParamsSchema = z
  .object({})
  .strict()
  .meta({ id: "BrowserSessionActivePageParams" });

/** Params for `awaitActivePage`: optional non-negative integer `timeoutMs`. */
export const BrowserSessionAwaitActivePageParamsSchema = z
  .object({
    timeoutMs: z.number().int().nonnegative().optional(),
  })
  .strict()
  .meta({ id: "BrowserSessionAwaitActivePageParams" });

/** Params for `resolvePageByMainFrameId`: the main frame id to look up. */
export const BrowserSessionResolvePageByMainFrameIdParamsSchema = z
  .object({
    mainFrameId: FrameIdSchema,
  })
  .strict()
  .meta({ id: "BrowserSessionResolvePageByMainFrameIdParams" });

/** Params for `getFullFrameTreeByMainFrameId`: the main frame id to look up. */
export const BrowserSessionGetFullFrameTreeByMainFrameIdParamsSchema = z
  .object({
    mainFrameId: FrameIdSchema,
  })
  .strict()
  .meta({ id: "BrowserSessionGetFullFrameTreeByMainFrameIdParams" });

/** Params for `newPage`: optional `url` string. */
export const BrowserSessionNewPageParamsSchema = z
  .object({
    url: z.string().optional(),
  })
  .strict()
  .meta({ id: "BrowserSessionNewPageParams" });

/** Params for `cookies`: optional `urls`, given as one string or an array. */
export const BrowserSessionCookiesParamsSchema = z
  .object({
    urls: z.union([z.string(), z.array(z.string())]).optional(),
  })
  .strict()
  .meta({ id: "BrowserSessionCookiesParams" });

/** Params for `addCookies`: the list of cookies to add. */
export const BrowserSessionAddCookiesParamsSchema = z
  .object({
    cookies: z.array(BrowserSessionCookieParamSchema),
  })
  .strict()
  .meta({ id: "BrowserSessionAddCookiesParams" });

/** Params for `clearCookies`: the clear-cookies options under a params id. */
export const BrowserSessionClearCookiesParamsSchema =
  BrowserSessionClearCookiesOptionsSchema.meta({
    id: "BrowserSessionClearCookiesParams",
  });

/** Params for `connectURL`: none. */
export const BrowserSessionConnectURLParamsSchema = z
  .object({})
  .strict()
  .meta({ id: "BrowserSessionConnectURLParams" });

/** Params for `configuredViewport`: none. */
export const BrowserSessionConfiguredViewportParamsSchema = z
  .object({})
  .strict()
  .meta({ id: "BrowserSessionConfiguredViewportParams" });

/** Params for `browserbaseSessionID`: none. */
export const BrowserSessionBrowserbaseSessionIDParamsSchema = z
  .object({})
  .strict()
  .meta({ id: "BrowserSessionBrowserbaseSessionIDParams" });

/** Params for `browserbaseSessionURL`: none. */
export const BrowserSessionBrowserbaseSessionURLParamsSchema = z
  .object({})
  .strict()
  .meta({ id: "BrowserSessionBrowserbaseSessionURLParams" });

/** Params for `browserbaseDebugURL`: none. */
export const BrowserSessionBrowserbaseDebugURLParamsSchema = z
  .object({})
  .strict()
  .meta({ id: "BrowserSessionBrowserbaseDebugURLParams" });

/** Params for `isBrowserbase`: none. */
export const BrowserSessionIsBrowserbaseParamsSchema = z
  .object({})
  .strict()
  .meta({ id: "BrowserSessionIsBrowserbaseParams" });

/** Params for `isAdvancedStealth`: none. */
export const BrowserSessionIsAdvancedStealthParamsSchema = z
  .object({})
  .strict()
  .meta({ id: "BrowserSessionIsAdvancedStealthParams" });

/** Params for `setViewportSize`: the viewport schema under a params id. */
export const BrowserSessionSetViewportSizeParamsSchema =
  BrowserSessionViewportSchema.meta({
    id: "BrowserSessionSetViewportSizeParams",
  });

/** Params for `close`: none. */
export const BrowserSessionCloseParamsSchema = z
  .object({})
  .strict()
  .meta({ id: "BrowserSessionCloseParams" });

// ---------------------------------------------------------------------------
// Per-method request-body schemas. Each one is produced by
// createBrowserSessionRequestSchema, i.e. the shared body (optional request
// `id` + `sessionId`) extended with that method's `params` schema and tagged
// with the given schema id.
// ---------------------------------------------------------------------------

export const BrowserSessionAddInitScriptRequestSchema =
  createBrowserSessionRequestSchema(
    "BrowserSessionAddInitScriptRequest",
    BrowserSessionAddInitScriptParamsSchema,
  );

export const BrowserSessionSetExtraHTTPHeadersRequestSchema =
  createBrowserSessionRequestSchema(
    "BrowserSessionSetExtraHTTPHeadersRequest",
    BrowserSessionSetExtraHTTPHeadersParamsSchema,
  );

export const BrowserSessionPagesRequestSchema =
  createBrowserSessionRequestSchema(
    "BrowserSessionPagesRequest",
    BrowserSessionPagesParamsSchema,
  );

export const BrowserSessionActivePageRequestSchema =
  createBrowserSessionRequestSchema(
    "BrowserSessionActivePageRequest",
    BrowserSessionActivePageParamsSchema,
  );

export const BrowserSessionAwaitActivePageRequestSchema =
  createBrowserSessionRequestSchema(
    "BrowserSessionAwaitActivePageRequest",
    BrowserSessionAwaitActivePageParamsSchema,
  );

export const BrowserSessionResolvePageByMainFrameIdRequestSchema =
  createBrowserSessionRequestSchema(
    "BrowserSessionResolvePageByMainFrameIdRequest",
    BrowserSessionResolvePageByMainFrameIdParamsSchema,
  );

export const BrowserSessionGetFullFrameTreeByMainFrameIdRequestSchema =
  createBrowserSessionRequestSchema(
    "BrowserSessionGetFullFrameTreeByMainFrameIdRequest",
    BrowserSessionGetFullFrameTreeByMainFrameIdParamsSchema,
  );

export const BrowserSessionNewPageRequestSchema =
  createBrowserSessionRequestSchema(
    "BrowserSessionNewPageRequest",
    BrowserSessionNewPageParamsSchema,
  );

export const BrowserSessionCookiesRequestSchema =
  createBrowserSessionRequestSchema(
    "BrowserSessionCookiesRequest",
    BrowserSessionCookiesParamsSchema,
  );

export const BrowserSessionAddCookiesRequestSchema =
  createBrowserSessionRequestSchema(
    "BrowserSessionAddCookiesRequest",
    BrowserSessionAddCookiesParamsSchema,
  );

export const BrowserSessionClearCookiesRequestSchema =
  createBrowserSessionRequestSchema(
    "BrowserSessionClearCookiesRequest",
    BrowserSessionClearCookiesParamsSchema,
  );

export const BrowserSessionConnectURLRequestSchema =
  createBrowserSessionRequestSchema(
    "BrowserSessionConnectURLRequest",
    BrowserSessionConnectURLParamsSchema,
  );

export const BrowserSessionConfiguredViewportRequestSchema =
  createBrowserSessionRequestSchema(
    "BrowserSessionConfiguredViewportRequest",
    BrowserSessionConfiguredViewportParamsSchema,
  );

export const BrowserSessionBrowserbaseSessionIDRequestSchema =
  createBrowserSessionRequestSchema(
    "BrowserSessionBrowserbaseSessionIDRequest",
    BrowserSessionBrowserbaseSessionIDParamsSchema,
  );

export const BrowserSessionBrowserbaseSessionURLRequestSchema =
  createBrowserSessionRequestSchema(
    "BrowserSessionBrowserbaseSessionURLRequest",
    BrowserSessionBrowserbaseSessionURLParamsSchema,
  );

export const BrowserSessionBrowserbaseDebugURLRequestSchema =
  createBrowserSessionRequestSchema(
    "BrowserSessionBrowserbaseDebugURLRequest",
    BrowserSessionBrowserbaseDebugURLParamsSchema,
  );

export const BrowserSessionIsBrowserbaseRequestSchema =
  createBrowserSessionRequestSchema(
    "BrowserSessionIsBrowserbaseRequest",
    BrowserSessionIsBrowserbaseParamsSchema,
  );

export const BrowserSessionIsAdvancedStealthRequestSchema =
  createBrowserSessionRequestSchema(
    "BrowserSessionIsAdvancedStealthRequest",
    BrowserSessionIsAdvancedStealthParamsSchema,
  );

export const BrowserSessionSetViewportSizeRequestSchema =
  createBrowserSessionRequestSchema(
    "BrowserSessionSetViewportSizeRequest",
    BrowserSessionSetViewportSizeParamsSchema,
  );

export const BrowserSessionCloseRequestSchema =
  createBrowserSessionRequestSchema(
    "BrowserSessionCloseRequest",
    BrowserSessionCloseParamsSchema,
  );

// ---------------------------------------------------------------------------
// Per-method `result` schemas. All object results are strict.
// ---------------------------------------------------------------------------

/** Result of `addInitScript`: a boolean `added` flag. */
export const BrowserSessionAddInitScriptResultSchema = z
  .object({
    added: z.boolean(),
  })
  .strict()
  .meta({ id: "BrowserSessionAddInitScriptResult" });

/** Result of `setExtraHTTPHeaders`: a `headers` map. */
export const BrowserSessionSetExtraHTTPHeadersResultSchema = z
  .object({
    headers: PageHeadersSchema,
  })
  .strict()
  .meta({ id: "BrowserSessionSetExtraHTTPHeadersResult" });

/** Result of `pages`: an array of page descriptions. */
export const BrowserSessionPagesResultSchema = z
  .object({
    pages: z.array(BrowserSessionPageSchema),
  })
  .strict()
  .meta({ id: "BrowserSessionPagesResult" });

/** Result whose `page` may be null; used by methods that may find no page. */
export const BrowserSessionOptionalPageResultSchema = z
  .object({
    page: BrowserSessionPageSchema.nullable(),
  })
  .strict()
  .meta({ id: "BrowserSessionOptionalPageResult" });

/** Result whose `page` is always present. */
export const BrowserSessionPageResultSchema = z
  .object({
    page: BrowserSessionPageSchema,
  })
  .strict()
  .meta({ id: "BrowserSessionPageResult" });

/** Result carrying a `frameTree` whose structure is not validated (unknown). */
export const BrowserSessionFrameTreeResultSchema = z
  .object({
    frameTree: z.unknown(),
  })
  .strict()
  .meta({ id: "BrowserSessionFrameTreeResult" });

/** Result of `cookies`: an array of cookies. */
export const BrowserSessionCookiesResultSchema = z
  .object({
    cookies: z.array(BrowserSessionCookieSchema),
  })
  .strict()
  .meta({ id: "BrowserSessionCookiesResult" });

/** Result of `addCookies`: `added` as a non-negative integer. */
export const BrowserSessionAddCookiesResultSchema = z
  .object({
    added: z.number().int().nonnegative(),
  })
  .strict()
  .meta({ id: "BrowserSessionAddCookiesResult" });

/** Result of `clearCookies`: a boolean `cleared` flag. */
export const BrowserSessionClearCookiesResultSchema = z
  .object({
    cleared: z.boolean(),
  })
  .strict()
  .meta({ id: "BrowserSessionClearCookiesResult" });

/** Result of `connectURL`: the `connectURL` string. */
export const BrowserSessionConnectURLResultSchema = z
  .object({
    connectURL: z.string(),
  })
  .strict()
  .meta({ id: "BrowserSessionConnectURLResult" });

/** Result of `configuredViewport`: the viewport schema under a result id. */
export const BrowserSessionConfiguredViewportResultSchema =
  BrowserSessionViewportSchema.meta({
    id: "BrowserSessionConfiguredViewportResult",
  });

/** Result of `browserbaseSessionID`: a string or null. */
export const BrowserSessionBrowserbaseSessionIDResultSchema = z
  .object({
    browserbaseSessionID: z.string().nullable(),
  })
  .strict()
  .meta({ id: "BrowserSessionBrowserbaseSessionIDResult" });

/** Result of `browserbaseSessionURL`: a string or null. */
export const BrowserSessionBrowserbaseSessionURLResultSchema = z
  .object({
    browserbaseSessionURL: z.string().nullable(),
  })
  .strict()
  .meta({ id: "BrowserSessionBrowserbaseSessionURLResult" });

/** Result of `browserbaseDebugURL`: a string or null. */
export const BrowserSessionBrowserbaseDebugURLResultSchema = z
  .object({
    browserbaseDebugURL: z.string().nullable(),
  })
  .strict()
  .meta({ id: "BrowserSessionBrowserbaseDebugURLResult" });

/** Result of `isBrowserbase`: a boolean flag. */
export const BrowserSessionIsBrowserbaseResultSchema = z
  .object({
    isBrowserbase: z.boolean(),
  })
  .strict()
  .meta({ id: "BrowserSessionIsBrowserbaseResult" });

/** Result of `isAdvancedStealth`: a boolean flag. */
export const BrowserSessionIsAdvancedStealthResultSchema = z
  .object({
    isAdvancedStealth: z.boolean(),
  })
  .strict()
  .meta({ id: "BrowserSessionIsAdvancedStealthResult" });

/** Result of `setViewportSize`: the viewport schema under a result id. */
export const BrowserSessionSetViewportSizeResultSchema =
  BrowserSessionViewportSchema.meta({
    id: "BrowserSessionSetViewportSizeResult",
  });

/** Result of `close`: a boolean `closed` flag. */
export const BrowserSessionCloseResultSchema = z
  .object({
    closed: z.boolean(),
  })
  .strict()
  .meta({ id: "BrowserSessionCloseResult" });

// ---------------------------------------------------------------------------
// Per-method action-record schemas. Each one is produced by
// createBrowserSessionActionSchema: the base action fields with `method`
// narrowed to the given literal, the method's `params` schema, and the
// method's `result` schema made nullable.
//
// Note that `activePage` and `resolvePageByMainFrameId` use the
// optional-page result (page may be null), while `awaitActivePage` and
// `newPage` use the result in which the page is always present.
// ---------------------------------------------------------------------------

export const BrowserSessionAddInitScriptActionSchema =
  createBrowserSessionActionSchema(
    "BrowserSessionAddInitScriptAction",
    "addInitScript",
    BrowserSessionAddInitScriptParamsSchema,
    BrowserSessionAddInitScriptResultSchema,
  );

export const BrowserSessionSetExtraHTTPHeadersActionSchema =
  createBrowserSessionActionSchema(
    "BrowserSessionSetExtraHTTPHeadersAction",
    "setExtraHTTPHeaders",
    BrowserSessionSetExtraHTTPHeadersParamsSchema,
    BrowserSessionSetExtraHTTPHeadersResultSchema,
  );

export const BrowserSessionPagesActionSchema = createBrowserSessionActionSchema(
  "BrowserSessionPagesAction",
  "pages",
  BrowserSessionPagesParamsSchema,
  BrowserSessionPagesResultSchema,
);

export const BrowserSessionActivePageActionSchema =
  createBrowserSessionActionSchema(
    "BrowserSessionActivePageAction",
    "activePage",
    BrowserSessionActivePageParamsSchema,
    BrowserSessionOptionalPageResultSchema,
  );

export const BrowserSessionAwaitActivePageActionSchema =
  createBrowserSessionActionSchema(
    "BrowserSessionAwaitActivePageAction",
    "awaitActivePage",
    BrowserSessionAwaitActivePageParamsSchema,
    BrowserSessionPageResultSchema,
  );

export const BrowserSessionResolvePageByMainFrameIdActionSchema =
  createBrowserSessionActionSchema(
    "BrowserSessionResolvePageByMainFrameIdAction",
    "resolvePageByMainFrameId",
    BrowserSessionResolvePageByMainFrameIdParamsSchema,
    BrowserSessionOptionalPageResultSchema,
  );

export const BrowserSessionGetFullFrameTreeByMainFrameIdActionSchema =
  createBrowserSessionActionSchema(
    "BrowserSessionGetFullFrameTreeByMainFrameIdAction",
    "getFullFrameTreeByMainFrameId",
    BrowserSessionGetFullFrameTreeByMainFrameIdParamsSchema,
    BrowserSessionFrameTreeResultSchema,
  );

export const BrowserSessionNewPageActionSchema =
  createBrowserSessionActionSchema(
    "BrowserSessionNewPageAction",
    "newPage",
    BrowserSessionNewPageParamsSchema,
    BrowserSessionPageResultSchema,
  );

export const BrowserSessionCookiesActionSchema =
  createBrowserSessionActionSchema(
    "BrowserSessionCookiesAction",
    "cookies",
    BrowserSessionCookiesParamsSchema,
    BrowserSessionCookiesResultSchema,
  );

export const BrowserSessionAddCookiesActionSchema =
  createBrowserSessionActionSchema(
    "BrowserSessionAddCookiesAction",
    "addCookies",
    BrowserSessionAddCookiesParamsSchema,
    BrowserSessionAddCookiesResultSchema,
  );

export const BrowserSessionClearCookiesActionSchema =
  createBrowserSessionActionSchema(
    "BrowserSessionClearCookiesAction",
    "clearCookies",
    BrowserSessionClearCookiesParamsSchema,
    BrowserSessionClearCookiesResultSchema,
  );

export const BrowserSessionConnectURLActionSchema =
  createBrowserSessionActionSchema(
    "BrowserSessionConnectURLAction",
    "connectURL",
    BrowserSessionConnectURLParamsSchema,
    BrowserSessionConnectURLResultSchema,
  );

export const BrowserSessionConfiguredViewportActionSchema =
  createBrowserSessionActionSchema(
    "BrowserSessionConfiguredViewportAction",
    "configuredViewport",
    BrowserSessionConfiguredViewportParamsSchema,
    BrowserSessionConfiguredViewportResultSchema,
  );

export const BrowserSessionBrowserbaseSessionIDActionSchema =
  createBrowserSessionActionSchema(
    "BrowserSessionBrowserbaseSessionIDAction",
    "browserbaseSessionID",
    BrowserSessionBrowserbaseSessionIDParamsSchema,
    BrowserSessionBrowserbaseSessionIDResultSchema,
  );

export const BrowserSessionBrowserbaseSessionURLActionSchema =
  createBrowserSessionActionSchema(
    "BrowserSessionBrowserbaseSessionURLAction",
    "browserbaseSessionURL",
    BrowserSessionBrowserbaseSessionURLParamsSchema,
    BrowserSessionBrowserbaseSessionURLResultSchema,
  );

export const BrowserSessionBrowserbaseDebugURLActionSchema =
  createBrowserSessionActionSchema(
    "BrowserSessionBrowserbaseDebugURLAction",
    "browserbaseDebugURL",
    BrowserSessionBrowserbaseDebugURLParamsSchema,
    BrowserSessionBrowserbaseDebugURLResultSchema,
  );

export const BrowserSessionIsBrowserbaseActionSchema =
  createBrowserSessionActionSchema(
    "BrowserSessionIsBrowserbaseAction",
    "isBrowserbase",
    BrowserSessionIsBrowserbaseParamsSchema,
    BrowserSessionIsBrowserbaseResultSchema,
  );

export const BrowserSessionIsAdvancedStealthActionSchema =
  createBrowserSessionActionSchema(
    "BrowserSessionIsAdvancedStealthAction",
    "isAdvancedStealth",
    BrowserSessionIsAdvancedStealthParamsSchema,
    BrowserSessionIsAdvancedStealthResultSchema,
  );

export const BrowserSessionSetViewportSizeActionSchema =
  createBrowserSessionActionSchema(
    "BrowserSessionSetViewportSizeAction",
    "setViewportSize",
    BrowserSessionSetViewportSizeParamsSchema,
    BrowserSessionSetViewportSizeResultSchema,
  );

export const BrowserSessionCloseActionSchema = createBrowserSessionActionSchema(
  "BrowserSessionCloseAction",
  "close",
  BrowserSessionCloseParamsSchema,
  BrowserSessionCloseResultSchema,
);

/**
 * Any browser-session action record: a plain union of all per-method action
 * schemas.
 * NOTE(review): every member carries a distinct `method` literal, so a
 * discriminated union on "method" may be applicable here — confirm the effect
 * on the generated OpenAPI document before changing.
 */
export const BrowserSessionActionSchema = z
  .union([
    BrowserSessionAddInitScriptActionSchema,
    BrowserSessionSetExtraHTTPHeadersActionSchema,
    BrowserSessionPagesActionSchema,
    BrowserSessionActivePageActionSchema,
    BrowserSessionAwaitActivePageActionSchema,
    BrowserSessionResolvePageByMainFrameIdActionSchema,
    BrowserSessionGetFullFrameTreeByMainFrameIdActionSchema,
    BrowserSessionNewPageActionSchema,
    BrowserSessionCookiesActionSchema,
    BrowserSessionAddCookiesActionSchema,
    BrowserSessionClearCookiesActionSchema,
    BrowserSessionConnectURLActionSchema,
    BrowserSessionConfiguredViewportActionSchema,
    BrowserSessionBrowserbaseSessionIDActionSchema,
    BrowserSessionBrowserbaseSessionURLActionSchema,
    BrowserSessionBrowserbaseDebugURLActionSchema,
    BrowserSessionIsBrowserbaseActionSchema,
    BrowserSessionIsAdvancedStealthActionSchema,
    BrowserSessionSetViewportSizeActionSchema,
    BrowserSessionCloseActionSchema,
  ])
  .meta({ id: "BrowserSessionAction" });

/**
 * Error envelope for v4 action endpoints: `success: false`, an error message,
 * an integer status code, a nullable stack trace and, optionally, the action
 * record associated with the failure.
 */
export const BrowserSessionV4ErrorResponseSchema = z
  .object({
    success: z.literal(false),
    error: z.string(),
    statusCode: z.number().int(),
    stack: z.string().nullable(),
    action: BrowserSessionActionSchema.optional(),
  })
  .strict()
  .meta({ id: "BrowserSessionV4ErrorResponse" });

// ---------------------------------------------------------------------------
// Per-method success-response schemas. Each one is produced by
// createBrowserSessionResponseSchema, i.e. a strict envelope
// `{ success: true, error: null, action }` around that method's action
// schema, tagged with the given schema id.
// ---------------------------------------------------------------------------

export const BrowserSessionAddInitScriptResponseSchema =
  createBrowserSessionResponseSchema(
    "BrowserSessionAddInitScriptResponse",
    BrowserSessionAddInitScriptActionSchema,
  );

export const BrowserSessionSetExtraHTTPHeadersResponseSchema =
  createBrowserSessionResponseSchema(
    "BrowserSessionSetExtraHTTPHeadersResponse",
    BrowserSessionSetExtraHTTPHeadersActionSchema,
  );

export const BrowserSessionPagesResponseSchema =
  createBrowserSessionResponseSchema(
    "BrowserSessionPagesResponse",
    BrowserSessionPagesActionSchema,
  );

export const BrowserSessionActivePageResponseSchema =
  createBrowserSessionResponseSchema(
    "BrowserSessionActivePageResponse",
    BrowserSessionActivePageActionSchema,
  );

export const BrowserSessionAwaitActivePageResponseSchema =
  createBrowserSessionResponseSchema(
    "BrowserSessionAwaitActivePageResponse",
    BrowserSessionAwaitActivePageActionSchema,
  );

export const BrowserSessionResolvePageByMainFrameIdResponseSchema =
  createBrowserSessionResponseSchema(
    "BrowserSessionResolvePageByMainFrameIdResponse",
    BrowserSessionResolvePageByMainFrameIdActionSchema,
  );

export const BrowserSessionGetFullFrameTreeByMainFrameIdResponseSchema =
  createBrowserSessionResponseSchema(
    "BrowserSessionGetFullFrameTreeByMainFrameIdResponse",
    BrowserSessionGetFullFrameTreeByMainFrameIdActionSchema,
  );

export const BrowserSessionNewPageResponseSchema =
  createBrowserSessionResponseSchema(
    "BrowserSessionNewPageResponse",
    BrowserSessionNewPageActionSchema,
  );

export const BrowserSessionCookiesResponseSchema =
  createBrowserSessionResponseSchema(
    "BrowserSessionCookiesResponse",
    BrowserSessionCookiesActionSchema,
  );

export const BrowserSessionAddCookiesResponseSchema =
  createBrowserSessionResponseSchema(
    "BrowserSessionAddCookiesResponse",
    BrowserSessionAddCookiesActionSchema,
  );

export const BrowserSessionClearCookiesResponseSchema =
  createBrowserSessionResponseSchema(
    "BrowserSessionClearCookiesResponse",
    BrowserSessionClearCookiesActionSchema,
  );

export const BrowserSessionConnectURLResponseSchema =
  createBrowserSessionResponseSchema(
    "BrowserSessionConnectURLResponse",
    BrowserSessionConnectURLActionSchema,
  );

export const BrowserSessionConfiguredViewportResponseSchema =
  createBrowserSessionResponseSchema(
    "BrowserSessionConfiguredViewportResponse",
    BrowserSessionConfiguredViewportActionSchema,
  );

export const BrowserSessionBrowserbaseSessionIDResponseSchema =
  createBrowserSessionResponseSchema(
    "BrowserSessionBrowserbaseSessionIDResponse",
    BrowserSessionBrowserbaseSessionIDActionSchema,
  );

export const BrowserSessionBrowserbaseSessionURLResponseSchema =
  createBrowserSessionResponseSchema(
    "BrowserSessionBrowserbaseSessionURLResponse",
    BrowserSessionBrowserbaseSessionURLActionSchema,
  );

export const BrowserSessionBrowserbaseDebugURLResponseSchema =
  createBrowserSessionResponseSchema(
    "BrowserSessionBrowserbaseDebugURLResponse",
    BrowserSessionBrowserbaseDebugURLActionSchema,
  );

export const BrowserSessionIsBrowserbaseResponseSchema =
  createBrowserSessionResponseSchema(
    "BrowserSessionIsBrowserbaseResponse",
    BrowserSessionIsBrowserbaseActionSchema,
  );

export const BrowserSessionIsAdvancedStealthResponseSchema =
  createBrowserSessionResponseSchema(
    "BrowserSessionIsAdvancedStealthResponse",
    BrowserSessionIsAdvancedStealthActionSchema,
  );

export const BrowserSessionSetViewportSizeResponseSchema =
  createBrowserSessionResponseSchema(
    "BrowserSessionSetViewportSizeResponse",
    BrowserSessionSetViewportSizeActionSchema,
  );

export const BrowserSessionCloseResponseSchema =
  createBrowserSessionResponseSchema(
    "BrowserSessionCloseResponse",
    BrowserSessionCloseActionSchema,
  );

// Params object carrying only the action id; unknown keys are rejected
// by .strict().
export const BrowserSessionActionIdParamsSchema = z
  .object({
    actionId: ActionIdSchema,
  })
  .strict()
  .meta({ id: "BrowserSessionActionIdParams" });

// Query for fetching one action: an optional request id plus the required
// browser session id.
export const BrowserSessionActionDetailsQuerySchema = z
  .object({
    id: RequestIdSchema.optional(),
    sessionId: BrowserSessionIdSchema,
  })
  .strict()
  .meta({ id: "BrowserSessionActionDetailsQuery" });

// Query for listing actions. Besides the session id it accepts optional
// filters (pageId, method, status) and an optional limit.
export const BrowserSessionActionListQuerySchema = z
  .object({
    id: RequestIdSchema.optional(),
    sessionId: BrowserSessionIdSchema,
    pageId: PageIdSchema.optional(),
    method: BrowserSessionActionMethodSchema.optional(),
    status: BrowserSessionActionStatusSchema.optional(),
    // z.coerce converts the raw input to a number before validation; the
    // result must be a positive integer no larger than 500.
    limit: z.coerce.number().int().positive().max(500).optional(),
  })
  .strict()
  .meta({ id: "BrowserSessionActionListQuery" });

// Success envelope wrapping a single action: `success` is the literal true,
// `error` is always null, and `action` holds the action record.
export const BrowserSessionActionDetailsResponseSchema = z
  .object({
    success: z.literal(true),
    error: z.null(),
    action: BrowserSessionActionSchema,
  })
  .strict()
  .meta({ id: "BrowserSessionActionDetailsResponse" });

// Success envelope wrapping an array of actions (same `success`/`error`
// fields as the details response).
export const BrowserSessionActionListResponseSchema = z
  .object({
    success: z.literal(true),
    error: z.null(),
    actions: z.array(BrowserSessionActionSchema),
  })
  .strict()
  .meta({ id: "BrowserSessionActionListResponse" });

// Registry of every browser-session schema keyed by component name.
// NOTE(review): presumably consumed when generating the OpenAPI document's
// `components.schemas` section — confirm against the generator.
// Entries are grouped in the order: shared/primitive schemas, *Params,
// *Request, *Action, *Response, then the action lookup/list schemas.
export const browserSessionOpenApiComponents = {
  schemas: {
    LocalBrowserLaunchOptions: Api.LocalBrowserLaunchOptionsSchema,
    BrowserbaseSessionCreateParams: Api.BrowserbaseSessionCreateParamsSchema,
    BrowserSessionHeaders: BrowserSessionHeadersSchema,
    BrowserSessionId: BrowserSessionIdSchema,
    BrowserSessionEnv: BrowserSessionEnvSchema,
    BrowserSessionStatus: BrowserSessionStatusSchema,
    BrowserSessionCreateRequest: BrowserSessionCreateRequestSchema,
    BrowserSessionIdParams: BrowserSessionIdParamsSchema,
    BrowserSessionEndRequest: BrowserSessionEndRequestSchema,
    BrowserSession: BrowserSessionSchema,
    BrowserSessionResult: BrowserSessionResultSchema,
    BrowserSessionResponse: BrowserSessionResponseSchema,
    BrowserSessionErrorResponse: BrowserSessionErrorResponseSchema,
    BrowserSessionActionMethod: BrowserSessionActionMethodSchema,
    BrowserSessionActionStatus: BrowserSessionActionStatusSchema,
    BrowserSessionPage: BrowserSessionPageSchema,
    BrowserSessionCookie: BrowserSessionCookieSchema,
    BrowserSessionCookieParam: BrowserSessionCookieParamSchema,
    BrowserSessionRegex: BrowserSessionRegexSchema,
    BrowserSessionStringPattern: BrowserSessionStringPatternSchema,
    BrowserSessionClearCookiesOptions: BrowserSessionClearCookiesOptionsSchema,
    BrowserSessionViewport: BrowserSessionViewportSchema,
    BrowserSessionActionBase: BrowserSessionActionBaseSchema,
    // Per-action params schemas.
    BrowserSessionAddInitScriptParams: BrowserSessionAddInitScriptParamsSchema,
    BrowserSessionSetExtraHTTPHeadersParams:
      BrowserSessionSetExtraHTTPHeadersParamsSchema,
    BrowserSessionPagesParams: BrowserSessionPagesParamsSchema,
    BrowserSessionActivePageParams: BrowserSessionActivePageParamsSchema,
    BrowserSessionAwaitActivePageParams:
      BrowserSessionAwaitActivePageParamsSchema,
    BrowserSessionResolvePageByMainFrameIdParams:
      BrowserSessionResolvePageByMainFrameIdParamsSchema,
    BrowserSessionGetFullFrameTreeByMainFrameIdParams:
      BrowserSessionGetFullFrameTreeByMainFrameIdParamsSchema,
    BrowserSessionNewPageParams: BrowserSessionNewPageParamsSchema,
    BrowserSessionCookiesParams: BrowserSessionCookiesParamsSchema,
    BrowserSessionAddCookiesParams: BrowserSessionAddCookiesParamsSchema,
    BrowserSessionClearCookiesParams: BrowserSessionClearCookiesParamsSchema,
    BrowserSessionConnectURLParams: BrowserSessionConnectURLParamsSchema,
    BrowserSessionConfiguredViewportParams:
      BrowserSessionConfiguredViewportParamsSchema,
    BrowserSessionBrowserbaseSessionIDParams:
      BrowserSessionBrowserbaseSessionIDParamsSchema,
    BrowserSessionBrowserbaseSessionURLParams:
      BrowserSessionBrowserbaseSessionURLParamsSchema,
    BrowserSessionBrowserbaseDebugURLParams:
      BrowserSessionBrowserbaseDebugURLParamsSchema,
    BrowserSessionIsBrowserbaseParams: BrowserSessionIsBrowserbaseParamsSchema,
    BrowserSessionIsAdvancedStealthParams:
      BrowserSessionIsAdvancedStealthParamsSchema,
    BrowserSessionSetViewportSizeParams:
      BrowserSessionSetViewportSizeParamsSchema,
    BrowserSessionCloseParams: BrowserSessionCloseParamsSchema,
    // Per-action request schemas.
    BrowserSessionAddInitScriptRequest:
      BrowserSessionAddInitScriptRequestSchema,
    BrowserSessionSetExtraHTTPHeadersRequest:
      BrowserSessionSetExtraHTTPHeadersRequestSchema,
    BrowserSessionPagesRequest: BrowserSessionPagesRequestSchema,
    BrowserSessionActivePageRequest: BrowserSessionActivePageRequestSchema,
    BrowserSessionAwaitActivePageRequest:
      BrowserSessionAwaitActivePageRequestSchema,
    BrowserSessionResolvePageByMainFrameIdRequest:
      BrowserSessionResolvePageByMainFrameIdRequestSchema,
    BrowserSessionGetFullFrameTreeByMainFrameIdRequest:
      BrowserSessionGetFullFrameTreeByMainFrameIdRequestSchema,
    BrowserSessionNewPageRequest: BrowserSessionNewPageRequestSchema,
    BrowserSessionCookiesRequest: BrowserSessionCookiesRequestSchema,
    BrowserSessionAddCookiesRequest: BrowserSessionAddCookiesRequestSchema,
    BrowserSessionClearCookiesRequest: BrowserSessionClearCookiesRequestSchema,
    BrowserSessionConnectURLRequest: BrowserSessionConnectURLRequestSchema,
    BrowserSessionConfiguredViewportRequest:
      BrowserSessionConfiguredViewportRequestSchema,
    BrowserSessionBrowserbaseSessionIDRequest:
      BrowserSessionBrowserbaseSessionIDRequestSchema,
    BrowserSessionBrowserbaseSessionURLRequest:
      BrowserSessionBrowserbaseSessionURLRequestSchema,
    BrowserSessionBrowserbaseDebugURLRequest:
      BrowserSessionBrowserbaseDebugURLRequestSchema,
    BrowserSessionIsBrowserbaseRequest:
      BrowserSessionIsBrowserbaseRequestSchema,
    BrowserSessionIsAdvancedStealthRequest:
      BrowserSessionIsAdvancedStealthRequestSchema,
    BrowserSessionSetViewportSizeRequest:
      BrowserSessionSetViewportSizeRequestSchema,
    BrowserSessionCloseRequest: BrowserSessionCloseRequestSchema,
    // Per-action action-record schemas, followed by their union and the
    // v4 error envelope.
    BrowserSessionAddInitScriptAction: BrowserSessionAddInitScriptActionSchema,
    BrowserSessionSetExtraHTTPHeadersAction:
      BrowserSessionSetExtraHTTPHeadersActionSchema,
    BrowserSessionPagesAction: BrowserSessionPagesActionSchema,
    BrowserSessionActivePageAction: BrowserSessionActivePageActionSchema,
    BrowserSessionAwaitActivePageAction:
      BrowserSessionAwaitActivePageActionSchema,
    BrowserSessionResolvePageByMainFrameIdAction:
      BrowserSessionResolvePageByMainFrameIdActionSchema,
    BrowserSessionGetFullFrameTreeByMainFrameIdAction:
      BrowserSessionGetFullFrameTreeByMainFrameIdActionSchema,
    BrowserSessionNewPageAction: BrowserSessionNewPageActionSchema,
    BrowserSessionCookiesAction: BrowserSessionCookiesActionSchema,
    BrowserSessionAddCookiesAction: BrowserSessionAddCookiesActionSchema,
    BrowserSessionClearCookiesAction: BrowserSessionClearCookiesActionSchema,
    BrowserSessionConnectURLAction: BrowserSessionConnectURLActionSchema,
    BrowserSessionConfiguredViewportAction:
      BrowserSessionConfiguredViewportActionSchema,
    BrowserSessionBrowserbaseSessionIDAction:
      BrowserSessionBrowserbaseSessionIDActionSchema,
    BrowserSessionBrowserbaseSessionURLAction:
      BrowserSessionBrowserbaseSessionURLActionSchema,
    BrowserSessionBrowserbaseDebugURLAction:
      BrowserSessionBrowserbaseDebugURLActionSchema,
    BrowserSessionIsBrowserbaseAction: BrowserSessionIsBrowserbaseActionSchema,
    BrowserSessionIsAdvancedStealthAction:
      BrowserSessionIsAdvancedStealthActionSchema,
    BrowserSessionSetViewportSizeAction:
      BrowserSessionSetViewportSizeActionSchema,
    BrowserSessionCloseAction: BrowserSessionCloseActionSchema,
    BrowserSessionAction: BrowserSessionActionSchema,
    BrowserSessionV4ErrorResponse: BrowserSessionV4ErrorResponseSchema,
    // Per-action success-response schemas.
    BrowserSessionAddInitScriptResponse:
      BrowserSessionAddInitScriptResponseSchema,
    BrowserSessionSetExtraHTTPHeadersResponse:
      BrowserSessionSetExtraHTTPHeadersResponseSchema,
    BrowserSessionPagesResponse: BrowserSessionPagesResponseSchema,
    BrowserSessionActivePageResponse: BrowserSessionActivePageResponseSchema,
    BrowserSessionAwaitActivePageResponse:
      BrowserSessionAwaitActivePageResponseSchema,
    BrowserSessionResolvePageByMainFrameIdResponse:
      BrowserSessionResolvePageByMainFrameIdResponseSchema,
    BrowserSessionGetFullFrameTreeByMainFrameIdResponse:
      BrowserSessionGetFullFrameTreeByMainFrameIdResponseSchema,
    BrowserSessionNewPageResponse: BrowserSessionNewPageResponseSchema,
    BrowserSessionCookiesResponse: BrowserSessionCookiesResponseSchema,
    BrowserSessionAddCookiesResponse: BrowserSessionAddCookiesResponseSchema,
    BrowserSessionClearCookiesResponse:
      BrowserSessionClearCookiesResponseSchema,
    BrowserSessionConnectURLResponse: BrowserSessionConnectURLResponseSchema,
    BrowserSessionConfiguredViewportResponse:
      BrowserSessionConfiguredViewportResponseSchema,
    BrowserSessionBrowserbaseSessionIDResponse:
      BrowserSessionBrowserbaseSessionIDResponseSchema,
    BrowserSessionBrowserbaseSessionURLResponse:
      BrowserSessionBrowserbaseSessionURLResponseSchema,
    BrowserSessionBrowserbaseDebugURLResponse:
      BrowserSessionBrowserbaseDebugURLResponseSchema,
    BrowserSessionIsBrowserbaseResponse:
      BrowserSessionIsBrowserbaseResponseSchema,
    BrowserSessionIsAdvancedStealthResponse:
      BrowserSessionIsAdvancedStealthResponseSchema,
    BrowserSessionSetViewportSizeResponse:
      BrowserSessionSetViewportSizeResponseSchema,
    BrowserSessionCloseResponse: BrowserSessionCloseResponseSchema,
    // Action lookup / listing schemas.
    BrowserSessionActionIdParams: BrowserSessionActionIdParamsSchema,
    BrowserSessionActionDetailsQuery: BrowserSessionActionDetailsQuerySchema,
    BrowserSessionActionListQuery: BrowserSessionActionListQuerySchema,
    BrowserSessionActionDetailsResponse:
      BrowserSessionActionDetailsResponseSchema,
    BrowserSessionActionListResponse: BrowserSessionActionListResponseSchema,
  },
};

// Static TypeScript types derived from the schemas with z.infer, i.e. the
// parsed (output) shape of each schema.
export type BrowserSessionCreateRequest = z.infer<
  typeof BrowserSessionCreateRequestSchema
>;
export type BrowserSessionIdParams = z.infer<
  typeof BrowserSessionIdParamsSchema
>;
export type BrowserSession = z.infer<typeof BrowserSessionSchema>;
export type BrowserSessionActionMethod = z.infer<
  typeof BrowserSessionActionMethodSchema
>;
export type BrowserSessionAction = z.infer<typeof BrowserSessionActionSchema>;
export type BrowserSessionActionDetailsQuery = z.infer<
  typeof BrowserSessionActionDetailsQuerySchema
>;
export type BrowserSessionActionListQuery = z.infer<
  typeof BrowserSessionActionListQuerySchema
>;
export type BrowserSessionPage = z.infer<typeof BrowserSessionPageSchema>;

/**
 * Assembles a v4 error envelope and validates it against
 * BrowserSessionV4ErrorResponseSchema.
 *
 * @param input.error - Error message placed in the envelope.
 * @param input.statusCode - Status code reported in the envelope.
 * @param input.stack - Optional stack trace; a missing or null value is
 *   emitted as `null`.
 * @param input.action - Optional action record; the `action` key is only
 *   added when a truthy value is supplied.
 * @returns The parsed envelope. `.parse` throws if the assembled payload does
 *   not satisfy the schema.
 */
export function buildBrowserSessionErrorResponse(input: {
  error: string;
  statusCode: number;
  stack?: string | null;
  action?: z.input<typeof BrowserSessionActionSchema>;
}) {
  const { error, statusCode, stack, action } = input;

  const payload: Record<string, unknown> = {
    success: false,
    error,
    statusCode,
    stack: stack ?? null,
  };

  // Leave the key out entirely (rather than setting it to undefined) when no
  // action was provided.
  if (action) {
    payload.action = action;
  }

  return BrowserSessionV4ErrorResponseSchema.parse(payload);
}


================================================
FILE: packages/server-v4/src/schemas/v4/page.ts
================================================
import { z } from "zod/v4";

// Identifier primitives: each is a non-empty string (min length 1) tagged
// with a meta id and an example value.
export const RequestIdSchema = z
  .string()
  .min(1)
  .meta({ id: "RequestId", example: "req_01JXAMPLE" });

export const SessionIdSchema = z
  .string()
  .min(1)
  .meta({ id: "SessionId", example: "session_01JXAMPLE" });

export const PageIdSchema = z
  .string()
  .min(1)
  .meta({ id: "PageId", example: "target_01JXAMPLE" });

export const FrameIdSchema = z
  .string()
  .min(1)
  .meta({ id: "FrameId", example: "frame_01JXAMPLE" });

export const ActionIdSchema = z
  .string()
  .min(1)
  .meta({ id: "ActionId", example: "action_01JXAMPLE" });

export const CDPSessionIdSchema = z
  .string()
  .min(1)
  .meta({ id: "CDPSessionId", example: "cdp-session_01JXAMPLE" });

// Timestamp string validated by zod's datetime() check.
export const TimestampSchema = z
  .string()
  .datetime()
  .meta({ id: "Timestamp", example: "2026-02-03T12:00:00.000Z" });

// String-enum schemas for option values accepted by page actions.

// Mouse button used by pointer actions.
export const MouseButtonSchema = z
  .enum(["left", "right", "middle"])
  .meta({ id: "MouseButton" });

// Load states accepted by navigation and wait-for-load-state params.
export const LoadStateSchema = z
  .enum(["load", "domcontentloaded", "networkidle"])
  .meta({ id: "LoadState" });

// Element states accepted by waitForSelector.
export const WaitForSelectorStateSchema = z
  .enum(["attached", "detached", "visible", "hidden"])
  .meta({ id: "WaitForSelectorState" });

// Requested screenshot image format.
export const ScreenshotTypeSchema = z
  .enum(["png", "jpeg"])
  .meta({ id: "ScreenshotType" });

// MIME type reported in a screenshot result.
export const ScreenshotMimeTypeSchema = z
  .enum(["image/png", "image/jpeg"])
  .meta({ id: "ScreenshotMimeType" });

export const ScreenshotScaleSchema = z
  .enum(["css", "device"])
  .meta({ id: "ScreenshotScale" });

export const ScreenshotAnimationsSchema = z
  .enum(["allow", "disabled"])
  .meta({ id: "ScreenshotAnimations" });

export const ScreenshotCaretSchema = z
  .enum(["hide", "initial"])
  .meta({ id: "ScreenshotCaret" });

// Enumeration of every page action method name. PageActionBaseSchema uses it
// for the `method` field of an action record.
export const PageActionMethodSchema = z
  .enum([
    "click",
    "hover",
    "scroll",
    "dragAndDrop",
    "type",
    "keyPress",
    "enableCursorOverlay",
    "addInitScript",
    "goto",
    "reload",
    "goBack",
    "goForward",
    "targetId",
    "mainFrameId",
    "mainFrame",
    "getFullFrameTree",
    "asProtocolFrameTree",
    "listAllFrameIds",
    "getOrdinal",
    "title",
    "url",
    "screenshot",
    "snapshot",
    "frames",
    "setViewportSize",
    "setExtraHTTPHeaders",
    "waitForLoadState",
    "waitForMainLoadState",
    "waitForSelector",
    "waitForTimeout",
    "evaluate",
    "sendCDP",
    "close",
  ])
  .meta({ id: "PageActionMethod" });

// Lifecycle status values an action record can carry.
export const PageActionStatusSchema = z
  .enum(["queued", "running", "completed", "failed", "canceled"])
  .meta({ id: "PageActionStatus" });

// Selector variants. Each is a strict object, so a value matches a variant
// only if it carries exactly that variant's keys. `idx`, where present, is an
// optional non-negative integer.
// NOTE(review): `idx` presumably picks the n-th match when several elements
// match — confirm against the handler.

// Selects by XPath expression.
export const XPathSelectorSchema = z
  .object({
    xpath: z.string().min(1).meta({ example: "//button[text()='Submit']" }),
    idx: z.number().int().nonnegative().optional().meta({ example: 0 }),
  })
  .strict()
  .meta({ id: "XPathSelector" });

// Selects by CSS selector.
export const CssSelectorSchema = z
  .object({
    css: z.string().min(1).meta({ example: ".btn-submit" }),
    idx: z.number().int().nonnegative().optional().meta({ example: 0 }),
  })
  .strict()
  .meta({ id: "CssSelector" });

// Selects by text.
export const TextSelectorSchema = z
  .object({
    text: z.string().min(1).meta({ example: "Submit" }),
    idx: z.number().int().nonnegative().optional().meta({ example: 0 }),
  })
  .strict()
  .meta({ id: "TextSelector" });

// Selects a point by x/y coordinates instead of an element.
export const CoordinateSelectorSchema = z
  .object({
    x: z.number(),
    y: z.number(),
  })
  .strict()
  .meta({ id: "CoordinateSelector" });

// Full union (all 4 selector types: xpath, css, text, coordinates).
export const SelectorSchema = z
  .union([
    XPathSelectorSchema,
    CssSelectorSchema,
    TextSelectorSchema,
    CoordinateSelectorSchema,
  ])
  .meta({ id: "Selector" });

// Element-only (no coordinates) — used by waitForSelector params/results and
// by the element variant of scroll params.
export const ElementSelectorSchema = z
  .union([XPathSelectorSchema, CssSelectorSchema, TextSelectorSchema])
  .meta({ id: "ElementSelector" });

// Header map: an object with no fixed keys whose every value must be a string
// (enforced via catchall).
export const PageHeadersSchema = z
  .object({})
  .catchall(z.string())
  .meta({ id: "PageHeaders" });

// Init script input: either a non-empty string, or a strict object with
// optional `path` / `content` of which at least one must be present.
export const PageInitScriptSchema = z
  .union([
    z.string().min(1),
    z
      .object({
        path: z.string().min(1).optional(),
        content: z.string().min(1).optional(),
      })
      .strict()
      // Both fields are optional individually, so reject the empty object.
      .refine(
        (value) => value.path !== undefined || value.content !== undefined,
        {
          message: "script must include path or content",
        },
      ),
  ])
  .meta({ id: "PageInitScript" });

// Screenshot clip rectangle. x/y are any numbers; width/height must be
// positive integers.
export const PageClipSchema = z
  .object({
    x: z.number(),
    y: z.number(),
    width: z.number().int().positive(),
    height: z.number().int().positive(),
  })
  .strict()
  .meta({ id: "PageClip" });

// Non-empty error message string.
export const PageErrorSchema = z.string().min(1).meta({ id: "PageError" });

// Error envelope: `success` is the literal false, with an error message,
// integer status code, nullable stack and an optional action record.
export const ValidationErrorResponseSchema = z
  .object({
    success: z.literal(false),
    error: PageErrorSchema,
    statusCode: z.number().int(),
    stack: z.string().nullable(),
    // z.lazy defers the lookup because PageActionSchema is declared later in
    // the module than this schema.
    action: z.lazy(() => PageActionSchema).optional(),
  })
  .strict()
  .meta({ id: "ValidationErrorResponse" });

// Envelope shared by requests built with createPageRequestSchema: optional
// request id plus required session id (params are added under `params`).
const PageBodySchema = z
  .object({
    id: RequestIdSchema.optional(),
    sessionId: SessionIdSchema,
  })
  .strict();

// Same shape as PageBodySchema; used as the base of request schemas that
// merge their params fields at the top level via `.extend(<Params>.shape)`.
const PageQuerySchemaBase = z
  .object({
    id: RequestIdSchema.optional(),
    sessionId: SessionIdSchema,
  })
  .strict();

// Base for every page params schema: an optional pageId and nothing else.
const PageWithPageIdSchema = z
  .object({
    pageId: PageIdSchema.optional(),
  })
  .strict();

// Fields common to every page action record. createPageActionSchema extends
// this with a literal `method`, the action's `params` and a nullable `result`.
const PageActionBaseSchema = z
  .object({
    id: ActionIdSchema,
    method: PageActionMethodSchema,
    status: PageActionStatusSchema,
    sessionId: SessionIdSchema,
    pageId: PageIdSchema.optional(),
    createdAt: TimestampSchema,
    updatedAt: TimestampSchema,
    completedAt: TimestampSchema.optional(),
    error: PageErrorSchema.nullable(),
  })
  .strict()
  .meta({ id: "PageActionBase" });

/**
 * Builds a request schema by adding a `params` field to the shared
 * PageBodySchema envelope and tagging the result with a meta id.
 *
 * @param id - Meta id assigned to the resulting schema.
 * @param params - Schema validating the request's `params` field.
 * @returns PageBodySchema extended with `params`, carrying the given meta id.
 */
function createPageRequestSchema<T extends z.ZodTypeAny>(
  id: string,
  params: T,
) {
  const requestWithParams = PageBodySchema.extend({ params });
  return requestWithParams.meta({ id });
}

/**
 * Builds the schema of one concrete action record from PageActionBaseSchema.
 *
 * @param id - Meta id assigned to the resulting schema.
 * @param method - Method name; the record's `method` field is narrowed to
 *   this literal.
 * @param params - Schema for the record's `params` field.
 * @param result - Schema for the record's `result` field; it is made nullable
 *   so a record may carry `null` instead of a result.
 * @returns The extended action schema carrying the given meta id.
 */
function createPageActionSchema<
  TMethod extends PageActionMethod,
  TParams extends z.ZodTypeAny,
  TResult extends z.ZodTypeAny,
>(id: string, method: TMethod, params: TParams, result: TResult) {
  const actionFields = {
    method: z.literal(method),
    params,
    result: result.nullable(),
  };
  const actionSchema = PageActionBaseSchema.extend(actionFields);
  return actionSchema.meta({ id });
}

/**
 * Builds the success-response envelope for an action.
 *
 * @param id - Meta id assigned to the resulting schema.
 * @param action - Schema for the envelope's `action` field.
 * @returns A strict object schema with `success: true`, `error: null` and the
 *   given `action`, carrying the given meta id.
 */
function createPageResponseSchema<T extends z.ZodTypeAny>(
  id: string,
  action: T,
) {
  const envelopeShape = {
    success: z.literal(true),
    error: z.null(),
    action,
  };
  const envelope = z.object(envelopeShape).strict();
  return envelope.meta({ id });
}

// Params schemas for pointer and keyboard actions. All extend
// PageWithPageIdSchema, so each also accepts an optional `pageId`.

// click: target selector (element or coordinates), optional button and a
// click count of at least 1.
export const PageClickParamsSchema = PageWithPageIdSchema.extend({
  selector: SelectorSchema,
  button: MouseButtonSchema.optional(),
  clickCount: z.number().int().min(1).optional(),
})
  .strict()
  .meta({ id: "PageClickParams" });

// hover: target selector only.
export const PageHoverParamsSchema = PageWithPageIdSchema.extend({
  selector: SelectorSchema,
})
  .strict()
  .meta({ id: "PageHoverParams" });

// scroll (element variant): element selector plus a percentage in [0, 100].
export const PageScrollElementParamsSchema = PageWithPageIdSchema.extend({
  selector: ElementSelectorSchema,
  percentage: z.number().min(0).max(100),
})
  .strict()
  .meta({ id: "PageScrollElementParams" });

// scroll (coordinate variant): coordinate selector plus scroll deltas;
// deltaY is required, deltaX optional.
export const PageScrollCoordinateParamsSchema = PageWithPageIdSchema.extend({
  selector: CoordinateSelectorSchema,
  deltaX: z.number().optional(),
  deltaY: z.number(),
})
  .strict()
  .meta({ id: "PageScrollCoordinateParams" });

// scroll: either the element variant or the coordinate variant.
export const PageScrollParamsSchema = z
  .union([PageScrollElementParamsSchema, PageScrollCoordinateParamsSchema])
  .meta({ id: "PageScrollParams" });

// dragAndDrop: source and destination selectors, optional button, positive
// integer step count and non-negative integer delay.
export const PageDragAndDropParamsSchema = PageWithPageIdSchema.extend({
  from: SelectorSchema,
  to: SelectorSchema,
  button: MouseButtonSchema.optional(),
  steps: z.number().int().positive().optional(),
  delay: z.number().int().min(0).optional(),
})
  .strict()
  .meta({ id: "PageDragAndDropParams" });

// type: text to type (may be empty), optional non-negative integer delay and
// an optional withMistakes flag.
export const PageTypeParamsSchema = PageWithPageIdSchema.extend({
  text: z.string(),
  delay: z.number().int().min(0).optional(),
  withMistakes: z.boolean().optional(),
})
  .strict()
  .meta({ id: "PageTypeParams" });

// keyPress: non-empty key name and optional non-negative integer delay.
export const PageKeyPressParamsSchema = PageWithPageIdSchema.extend({
  key: z.string().min(1),
  delay: z.number().int().min(0).optional(),
})
  .strict()
  .meta({ id: "PageKeyPressParams" });

// Params schemas for navigation actions. All accept an optional `pageId`,
// an optional `waitUntil` load state and an optional non-negative integer
// `timeoutMs`.

// goto: additionally requires a `url` that passes zod's URL check.
export const PageGotoParamsSchema = PageWithPageIdSchema.extend({
  url: z.string().url(),
  waitUntil: LoadStateSchema.optional(),
  timeoutMs: z.number().int().nonnegative().optional(),
})
  .strict()
  .meta({ id: "PageGotoParams" });

// reload: additionally accepts an optional `ignoreCache` flag.
export const PageReloadParamsSchema = PageWithPageIdSchema.extend({
  waitUntil: LoadStateSchema.optional(),
  timeoutMs: z.number().int().nonnegative().optional(),
  ignoreCache: z.boolean().optional(),
})
  .strict()
  .meta({ id: "PageReloadParams" });

export const PageGoBackParamsSchema = PageWithPageIdSchema.extend({
  waitUntil: LoadStateSchema.optional(),
  timeoutMs: z.number().int().nonnegative().optional(),
})
  .strict()
  .meta({ id: "PageGoBackParams" });

export const PageGoForwardParamsSchema = PageWithPageIdSchema.extend({
  waitUntil: LoadStateSchema.optional(),
  timeoutMs: z.number().int().nonnegative().optional(),
})
  .strict()
  .meta({ id: "PageGoForwardParams" });

// Params schemas for overlay, init-script and page/frame introspection
// actions. Schemas created with `PageWithPageIdSchema.meta(...)` accept only
// the optional `pageId`; they differ solely in their meta id.

export const PageEnableCursorOverlayParamsSchema = PageWithPageIdSchema.meta({
  id: "PageEnableCursorOverlayParams",
});

// addInitScript: requires the script (string, or object with path/content).
export const PageAddInitScriptParamsSchema = PageWithPageIdSchema.extend({
  script: PageInitScriptSchema,
})
  .strict()
  .meta({ id: "PageAddInitScriptParams" });

export const PageTargetIdParamsSchema = PageWithPageIdSchema.meta({
  id: "PageTargetIdParams",
});

export const PageMainFrameIdParamsSchema = PageWithPageIdSchema.meta({
  id: "PageMainFrameIdParams",
});

export const PageMainFrameParamsSchema = PageWithPageIdSchema.meta({
  id: "PageMainFrameParams",
});

export const PageGetFullFrameTreeParamsSchema = PageWithPageIdSchema.meta({
  id: "PageGetFullFrameTreeParams",
});

// asProtocolFrameTree: requires the root main frame id.
export const PageAsProtocolFrameTreeParamsSchema = PageWithPageIdSchema.extend({
  rootMainFrameId: FrameIdSchema,
})
  .strict()
  .meta({ id: "PageAsProtocolFrameTreeParams" });

export const PageListAllFrameIdsParamsSchema = PageWithPageIdSchema.meta({
  id: "PageListAllFrameIdsParams",
});

// getOrdinal: requires the frame id whose ordinal is requested.
export const PageGetOrdinalParamsSchema = PageWithPageIdSchema.extend({
  frameId: FrameIdSchema,
})
  .strict()
  .meta({ id: "PageGetOrdinalParams" });

export const PageTitleParamsSchema = PageWithPageIdSchema.meta({
  id: "PageTitleParams",
});

export const PageUrlParamsSchema = PageWithPageIdSchema.meta({
  id: "PageUrlParams",
});

// screenshot params: optional pageId plus optional capture options.
// Beyond the per-field checks, two cross-field rules are enforced:
//   - `quality` may only be supplied together with `type: "jpeg"`
//     (an omitted `type` is rejected as well);
//   - `clip` and a truthy `fullPage` are mutually exclusive.
// Both violations can be reported in the same validation pass.
export const PageScreenshotParamsSchema = PageWithPageIdSchema.extend({
  fullPage: z.boolean().optional(),
  clip: PageClipSchema.optional(),
  type: ScreenshotTypeSchema.optional(),
  // Integer in [0, 100].
  quality: z.number().int().min(0).max(100).optional(),
  scale: ScreenshotScaleSchema.optional(),
  animations: ScreenshotAnimationsSchema.optional(),
  caret: ScreenshotCaretSchema.optional(),
  style: z.string().optional(),
  omitBackground: z.boolean().optional(),
  timeout: z.number().int().nonnegative().optional(),
})
  .strict()
  .superRefine((value, ctx) => {
    // Issue codes are given as string literals: `z.ZodIssueCode` is
    // deprecated in Zod 4 in favour of the raw literal codes.
    if (value.quality !== undefined && value.type !== "jpeg") {
      ctx.addIssue({
        code: "custom",
        path: ["quality"],
        message: "quality is only supported when type is 'jpeg'",
      });
    }

    if (value.clip && value.fullPage) {
      ctx.addIssue({
        code: "custom",
        path: ["clip"],
        message: "clip cannot be used together with fullPage",
      });
    }
  })
  .meta({ id: "PageScreenshotParams" });

// Params schemas for snapshot, viewport, header, wait, evaluate, CDP and
// close actions. All accept an optional `pageId`.

// snapshot: optional includeIframes flag.
export const PageSnapshotParamsSchema = PageWithPageIdSchema.extend({
  includeIframes: z.boolean().optional(),
})
  .strict()
  .meta({ id: "PageSnapshotParams" });

export const PageFramesParamsSchema = PageWithPageIdSchema.meta({
  id: "PageFramesParams",
});

// setViewportSize: positive width/height (not restricted to integers) and an
// optional positive deviceScaleFactor.
export const PageSetViewportSizeParamsSchema = PageWithPageIdSchema.extend({
  width: z.number().positive(),
  height: z.number().positive(),
  deviceScaleFactor: z.number().positive().optional(),
})
  .strict()
  .meta({ id: "PageSetViewportSizeParams" });

// setExtraHTTPHeaders: map of header name to string value.
export const PageSetExtraHTTPHeadersParamsSchema = PageWithPageIdSchema.extend({
  headers: PageHeadersSchema,
})
  .strict()
  .meta({ id: "PageSetExtraHTTPHeadersParams" });

// waitForLoadState: required load state and optional non-negative integer
// timeoutMs.
export const PageWaitForLoadStateParamsSchema = PageWithPageIdSchema.extend({
  state: LoadStateSchema,
  timeoutMs: z.number().int().nonnegative().optional(),
})
  .strict()
  .meta({ id: "PageWaitForLoadStateParams" });

// waitForMainLoadState: same fields as waitForLoadState.
export const PageWaitForMainLoadStateParamsSchema = PageWithPageIdSchema.extend(
  {
    state: LoadStateSchema,
    timeoutMs: z.number().int().nonnegative().optional(),
  },
)
  .strict()
  .meta({ id: "PageWaitForMainLoadStateParams" });

// waitForSelector: element selector, optional target state, optional
// pierceShadow flag. Note the timeout field here is named `timeout`, unlike
// the `timeoutMs` used by the load-state and navigation params.
export const PageWaitForSelectorParamsSchema = PageWithPageIdSchema.extend({
  selector: ElementSelectorSchema,
  state: WaitForSelectorStateSchema.optional(),
  timeout: z.number().int().nonnegative().optional(),
  pierceShadow: z.boolean().optional(),
})
  .strict()
  .meta({ id: "PageWaitForSelectorParams" });

// waitForTimeout: required non-negative integer `ms`.
export const PageWaitForTimeoutParamsSchema = PageWithPageIdSchema.extend({
  ms: z.number().int().nonnegative(),
})
  .strict()
  .meta({ id: "PageWaitForTimeoutParams" });

// evaluate: non-empty expression string and an optional, unvalidated `arg`.
export const PageEvaluateParamsSchema = PageWithPageIdSchema.extend({
  expression: z.string().min(1),
  arg: z.unknown().optional(),
})
  .strict()
  .meta({ id: "PageEvaluateParams" });

// sendCDP: non-empty CDP method name and optional, unvalidated `params`.
export const PageSendCDPParamsSchema = PageWithPageIdSchema.extend({
  method: z.string().min(1),
  params: z.unknown().optional(),
})
  .strict()
  .meta({ id: "PageSendCDPParams" });

export const PageCloseParamsSchema = PageWithPageIdSchema.meta({
  id: "PageCloseParams",
});

// Request schemas built with createPageRequestSchema: the shared envelope
// (optional id, sessionId) plus the action's params nested under `params`.
export const PageClickRequestSchema = createPageRequestSchema(
  "PageClickRequest",
  PageClickParamsSchema,
);

export const PageHoverRequestSchema = createPageRequestSchema(
  "PageHoverRequest",
  PageHoverParamsSchema,
);

export const PageScrollRequestSchema = createPageRequestSchema(
  "PageScrollRequest",
  PageScrollParamsSchema,
);

export const PageDragAndDropRequestSchema = createPageRequestSchema(
  "PageDragAndDropRequest",
  PageDragAndDropParamsSchema,
);

export const PageTypeRequestSchema = createPageRequestSchema(
  "PageTypeRequest",
  PageTypeParamsSchema,
);

export const PageKeyPressRequestSchema = createPageRequestSchema(
  "PageKeyPressRequest",
  PageKeyPressParamsSchema,
);

export const PageGotoRequestSchema = createPageRequestSchema(
  "PageGotoRequest",
  PageGotoParamsSchema,
);

export const PageReloadRequestSchema = createPageRequestSchema(
  "PageReloadRequest",
  PageReloadParamsSchema,
);

export const PageGoBackRequestSchema = createPageRequestSchema(
  "PageGoBackRequest",
  PageGoBackParamsSchema,
);

export const PageGoForwardRequestSchema = createPageRequestSchema(
  "PageGoForwardRequest",
  PageGoForwardParamsSchema,
);

export const PageEnableCursorOverlayRequestSchema = createPageRequestSchema(
  "PageEnableCursorOverlayRequest",
  PageEnableCursorOverlayParamsSchema,
);

export const PageAddInitScriptRequestSchema = createPageRequestSchema(
  "PageAddInitScriptRequest",
  PageAddInitScriptParamsSchema,
);

// Flattened request schemas: instead of nesting params under `params`, these
// merge the params schema's fields into PageQuerySchemaBase (id, sessionId)
// at the top level.
// NOTE(review): presumably these validate URL query strings for read-only
// endpoints — confirm against the route definitions.
export const PageTargetIdRequestSchema = PageQuerySchemaBase.extend(
  PageTargetIdParamsSchema.shape,
).meta({ id: "PageTargetIdRequest" });

export const PageMainFrameIdRequestSchema = PageQuerySchemaBase.extend(
  PageMainFrameIdParamsSchema.shape,
).meta({ id: "PageMainFrameIdRequest" });

export const PageMainFrameRequestSchema = PageQuerySchemaBase.extend(
  PageMainFrameParamsSchema.shape,
).meta({ id: "PageMainFrameRequest" });

export const PageGetFullFrameTreeRequestSchema = PageQuerySchemaBase.extend(
  PageGetFullFrameTreeParamsSchema.shape,
).meta({ id: "PageGetFullFrameTreeRequest" });

export const PageAsProtocolFrameTreeRequestSchema = PageQuerySchemaBase.extend(
  PageAsProtocolFrameTreeParamsSchema.shape,
).meta({ id: "PageAsProtocolFrameTreeRequest" });

export const PageListAllFrameIdsRequestSchema = PageQuerySchemaBase.extend(
  PageListAllFrameIdsParamsSchema.shape,
).meta({ id: "PageListAllFrameIdsRequest" });

export const PageGetOrdinalRequestSchema = PageQuerySchemaBase.extend(
  PageGetOrdinalParamsSchema.shape,
).meta({ id: "PageGetOrdinalRequest" });

export const PageTitleRequestSchema = PageQuerySchemaBase.extend(
  PageTitleParamsSchema.shape,
).meta({ id: "PageTitleRequest" });

export const PageUrlRequestSchema = PageQuerySchemaBase.extend(
  PageUrlParamsSchema.shape,
).meta({ id: "PageUrlRequest" });

// Remaining request schemas. All nest their params under `params` via
// createPageRequestSchema, except PageFramesRequestSchema, which flattens its
// params into PageQuerySchemaBase.
export const PageScreenshotRequestSchema = createPageRequestSchema(
  "PageScreenshotRequest",
  PageScreenshotParamsSchema,
);

export const PageSnapshotRequestSchema = createPageRequestSchema(
  "PageSnapshotRequest",
  PageSnapshotParamsSchema,
);

export const PageFramesRequestSchema = PageQuerySchemaBase.extend(
  PageFramesParamsSchema.shape,
).meta({ id: "PageFramesRequest" });

export const PageSetViewportSizeRequestSchema = createPageRequestSchema(
  "PageSetViewportSizeRequest",
  PageSetViewportSizeParamsSchema,
);

export const PageSetExtraHTTPHeadersRequestSchema = createPageRequestSchema(
  "PageSetExtraHTTPHeadersRequest",
  PageSetExtraHTTPHeadersParamsSchema,
);

export const PageWaitForLoadStateRequestSchema = createPageRequestSchema(
  "PageWaitForLoadStateRequest",
  PageWaitForLoadStateParamsSchema,
);

export const PageWaitForMainLoadStateRequestSchema = createPageRequestSchema(
  "PageWaitForMainLoadStateRequest",
  PageWaitForMainLoadStateParamsSchema,
);

export const PageWaitForSelectorRequestSchema = createPageRequestSchema(
  "PageWaitForSelectorRequest",
  PageWaitForSelectorParamsSchema,
);

export const PageWaitForTimeoutRequestSchema = createPageRequestSchema(
  "PageWaitForTimeoutRequest",
  PageWaitForTimeoutParamsSchema,
);

export const PageEvaluateRequestSchema = createPageRequestSchema(
  "PageEvaluateRequest",
  PageEvaluateParamsSchema,
);

export const PageSendCDPRequestSchema = createPageRequestSchema(
  "PageSendCDPRequest",
  PageSendCDPParamsSchema,
);

export const PageCloseRequestSchema = createPageRequestSchema(
  "PageCloseRequest",
  PageCloseParamsSchema,
);

// Result schemas for interaction and navigation actions. All are strict
// objects.

// Result carrying an optional xpath string.
// NOTE(review): presumably shared by click/hover/scroll — the action schemas
// that use it are outside this excerpt.
export const PageXPathResultSchema = z
  .object({
    xpath: z.string().optional(),
  })
  .strict()
  .meta({ id: "PageXPathResult" });

// dragAndDrop result: optional xpaths for the source and destination.
export const PageDragAndDropResultSchema = z
  .object({
    fromXpath: z.string().optional(),
    toXpath: z.string().optional(),
  })
  .strict()
  .meta({ id: "PageDragAndDropResult" });

export const PageTypeResultSchema = z
  .object({
    text: z.string(),
  })
  .strict()
  .meta({ id: "PageTypeResult" });

export const PageKeyPressResultSchema = z
  .object({
    key: z.string(),
  })
  .strict()
  .meta({ id: "PageKeyPressResult" });

export const PageEnableCursorOverlayResultSchema = z
  .object({
    enabled: z.boolean(),
  })
  .strict()
  .meta({ id: "PageEnableCursorOverlayResult" });

export const PageAddInitScriptResultSchema = z
  .object({
    added: z.boolean(),
  })
  .strict()
  .meta({ id: "PageAddInitScriptResult" });

// Navigation result: a url plus a response summary (url, integer status,
// statusText, ok flag, headers), or `response: null`.
// NOTE(review): presumably shared by goto/reload/goBack/goForward — confirm.
export const PageNavigationResultSchema = z
  .object({
    url: z.string(),
    response: z
      .object({
        url: z.string(),
        status: z.number().int(),
        statusText: z.string(),
        ok: z.boolean(),
        headers: PageHeadersSchema,
      })
      .strict()
      .nullable(),
  })
  .strict()
  .meta({ id: "PageNavigationResult" });

// Result schemas for page/frame introspection actions. All are strict
// objects.

export const PageTargetIdResultSchema = z
  .object({
    targetId: PageIdSchema,
  })
  .strict()
  .meta({ id: "PageTargetIdResult" });

export const PageMainFrameIdResultSchema = z
  .object({
    mainFrameId: FrameIdSchema,
  })
  .strict()
  .meta({ id: "PageMainFrameIdResult" });

// Description of a single frame: its frame id, owning page id, a nullable
// CDP session id and an isBrowserRemote flag.
export const PageFrameSchema = z
  .object({
    frameId: FrameIdSchema,
    pageId: PageIdSchema,
    sessionId: CDPSessionIdSchema.nullable(),
    isBrowserRemote: z.boolean(),
  })
  .strict()
  .meta({ id: "PageFrame" });

export const PageMainFrameResultSchema = z
  .object({
    frame: PageFrameSchema,
  })
  .strict()
  .meta({ id: "PageMainFrameResult" });

// Frame tree result; the tree itself is typed z.unknown() and therefore not
// validated.
export const PageFrameTreeResultSchema = z
  .object({
    frameTree: z.unknown(),
  })
  .strict()
  .meta({ id: "PageFrameTreeResult" });

export const PageListAllFrameIdsResultSchema = z
  .object({
    frameIds: z.array(FrameIdSchema),
  })
  .strict()
  .meta({ id: "PageListAllFrameIdsResult" });

// getOrdinal result: the frame id together with a non-negative integer
// ordinal.
export const PageGetOrdinalResultSchema = z
  .object({
    frameId: FrameIdSchema,
    ordinal: z.number().int().nonnegative(),
  })
  .strict()
  .meta({ id: "PageGetOrdinalResult" });

export const PageTitleResultSchema = z
  .object({
    title: z.string(),
  })
  .strict()
  .meta({ id: "PageTitleResult" });

export const PageUrlResultSchema = z
  .object({
    url: z.string(),
  })
  .strict()
  .meta({ id: "PageUrlResult" });

export const PageScreenshotResultSchema = z
  .object({
    base64: z.string(),
    mimeType: ScreenshotMimeTypeSchema,
  })
  .strict()
  .meta({ id: "PageScreenshotResult" });

export const PageSnapshotResultSchema = z
  .object({
    formattedTree: z.string(),
    xpathMap: z.object({}).catchall(z.string()),
    urlMap: z.object({}).catchall(z.string()),
  })
  .strict()
  .meta({ id: "PageSnapshotResult" });

export const PageSetViewportSizeResultSchema = z
  .object({
    width: z.number().positive(),
    height: z.number().positive(),
    deviceScaleFactor: z.number().positive().optional(),
  })
  .strict()
  .meta({ id: "PageSetViewportSizeResult" });

export const PageFramesResultSchema = z
  .object({
    frames: z.array(PageFrameSchema),
  })
  .strict()
  .meta({ id: "PageFramesResult" });

export const PageSetExtraHTTPHeadersResultSchema = z
  .object({
    headers: PageHeadersSchema,
  })
  .strict()
  .meta({ id: "PageSetExtraHTTPHeadersResult" });

export const PageWaitForLoadStateResultSchema = z
  .object({
    state: LoadStateSchema,
  })
  .strict()
  .meta({ id: "PageWaitForLoadStateResult" });

export const PageWaitForSelectorResultSchema = z
  .object({
    selector: ElementSelectorSchema,
    matched: z.boolean(),
  })
  .strict()
  .meta({ id: "PageWaitForSelectorResult" });

export const PageWaitForTimeoutResultSchema = z
  .object({
    ms: z.number().int().nonnegative(),
  })
  .strict()
  .meta({ id: "PageWaitForTimeoutResult" });

export const PageEvaluateResultSchema = z
  .object({
    value: z.unknown(),
  })
  .strict()
  .meta({ id: "PageEvaluateResult" });

export const PageSendCDPResultSchema = z
  .object({
    value: z.unknown(),
  })
  .strict()
  .meta({ id: "PageSendCDPResult" });

export const PageCloseResultSchema = z
  .object({
    closed: z.boolean(),
  })
  .strict()
  .meta({ id: "PageCloseResult" });

// Per-method action schemas. Every declaration below passes the same four
// arguments to `createPageActionSchema`: the schema id, the method name, the
// params schema and the result schema for that method.
// NOTE(review): `createPageActionSchema` is defined outside this excerpt;
// presumably it combines these with the common action fields — confirm there.

// `click`, `hover` and `scroll` all use `PageXPathResultSchema` as their result.
export const PageClickActionSchema = createPageActionSchema(
  "PageClickAction",
  "click",
  PageClickParamsSchema,
  PageXPathResultSchema,
);

export const PageHoverActionSchema = createPageActionSchema(
  "PageHoverAction",
  "hover",
  PageHoverParamsSchema,
  PageXPathResultSchema,
);

export const PageScrollActionSchema = createPageActionSchema(
  "PageScrollAction",
  "scroll",
  PageScrollParamsSchema,
  PageXPathResultSchema,
);

export const PageDragAndDropActionSchema = createPageActionSchema(
  "PageDragAndDropAction",
  "dragAndDrop",
  PageDragAndDropParamsSchema,
  PageDragAndDropResultSchema,
);

export const PageTypeActionSchema = createPageActionSchema(
  "PageTypeAction",
  "type",
  PageTypeParamsSchema,
  PageTypeResultSchema,
);

export const PageKeyPressActionSchema = createPageActionSchema(
  "PageKeyPressAction",
  "keyPress",
  PageKeyPressParamsSchema,
  PageKeyPressResultSchema,
);

export const PageEnableCursorOverlayActionSchema = createPageActionSchema(
  "PageEnableCursorOverlayAction",
  "enableCursorOverlay",
  PageEnableCursorOverlayParamsSchema,
  PageEnableCursorOverlayResultSchema,
);

export const PageAddInitScriptActionSchema = createPageActionSchema(
  "PageAddInitScriptAction",
  "addInitScript",
  PageAddInitScriptParamsSchema,
  PageAddInitScriptResultSchema,
);

// The four navigation methods share `PageNavigationResultSchema`.
export const PageGotoActionSchema = createPageActionSchema(
  "PageGotoAction",
  "goto",
  PageGotoParamsSchema,
  PageNavigationResultSchema,
);

export const PageReloadActionSchema = createPageActionSchema(
  "PageReloadAction",
  "reload",
  PageReloadParamsSchema,
  PageNavigationResultSchema,
);

export const PageGoBackActionSchema = createPageActionSchema(
  "PageGoBackAction",
  "goBack",
  PageGoBackParamsSchema,
  PageNavigationResultSchema,
);

export const PageGoForwardActionSchema = createPageActionSchema(
  "PageGoForwardAction",
  "goForward",
  PageGoForwardParamsSchema,
  PageNavigationResultSchema,
);

export const PageTargetIdActionSchema = createPageActionSchema(
  "PageTargetIdAction",
  "targetId",
  PageTargetIdParamsSchema,
  PageTargetIdResultSchema,
);

export const PageMainFrameIdActionSchema = createPageActionSchema(
  "PageMainFrameIdAction",
  "mainFrameId",
  PageMainFrameIdParamsSchema,
  PageMainFrameIdResultSchema,
);

export const PageMainFrameActionSchema = createPageActionSchema(
  "PageMainFrameAction",
  "mainFrame",
  PageMainFrameParamsSchema,
  PageMainFrameResultSchema,
);

// Both frame-tree methods share `PageFrameTreeResultSchema`.
export const PageGetFullFrameTreeActionSchema = createPageActionSchema(
  "PageGetFullFrameTreeAction",
  "getFullFrameTree",
  PageGetFullFrameTreeParamsSchema,
  PageFrameTreeResultSchema,
);

export const PageAsProtocolFrameTreeActionSchema = createPageActionSchema(
  "PageAsProtocolFrameTreeAction",
  "asProtocolFrameTree",
  PageAsProtocolFrameTreeParamsSchema,
  PageFrameTreeResultSchema,
);

export const PageListAllFrameIdsActionSchema = createPageActionSchema(
  "PageListAllFrameIdsAction",
  "listAllFrameIds",
  PageListAllFrameIdsParamsSchema,
  PageListAllFrameIdsResultSchema,
);

export const PageGetOrdinalActionSchema = createPageActionSchema(
  "PageGetOrdinalAction",
  "getOrdinal",
  PageGetOrdinalParamsSchema,
  PageGetOrdinalResultSchema,
);

export const PageTitleActionSchema = createPageActionSchema(
  "PageTitleAction",
  "title",
  PageTitleParamsSchema,
  PageTitleResultSchema,
);

export const PageUrlActionSchema = createPageActionSchema(
  "PageUrlAction",
  "url",
  PageUrlParamsSchema,
  PageUrlResultSchema,
);

export const PageScreenshotActionSchema = createPageActionSchema(
  "PageScreenshotAction",
  "screenshot",
  PageScreenshotParamsSchema,
  PageScreenshotResultSchema,
);

export const PageSnapshotActionSchema = createPageActionSchema(
  "PageSnapshotAction",
  "snapshot",
  PageSnapshotParamsSchema,
  PageSnapshotResultSchema,
);

export const PageFramesActionSchema = createPageActionSchema(
  "PageFramesAction",
  "frames",
  PageFramesParamsSchema,
  PageFramesResultSchema,
);

export const PageSetViewportSizeActionSchema = createPageActionSchema(
  "PageSetViewportSizeAction",
  "setViewportSize",
  PageSetViewportSizeParamsSchema,
  PageSetViewportSizeResultSchema,
);

export const PageSetExtraHTTPHeadersActionSchema = createPageActionSchema(
  "PageSetExtraHTTPHeadersAction",
  "setExtraHTTPHeaders",
  PageSetExtraHTTPHeadersParamsSchema,
  PageSetExtraHTTPHeadersResultSchema,
);

// Both load-state waits share `PageWaitForLoadStateResultSchema`.
export const PageWaitForLoadStateActionSchema = createPageActionSchema(
  "PageWaitForLoadStateAction",
  "waitForLoadState",
  PageWaitForLoadStateParamsSchema,
  PageWaitForLoadStateResultSchema,
);

export const PageWaitForMainLoadStateActionSchema = createPageActionSchema(
  "PageWaitForMainLoadStateAction",
  "waitForMainLoadState",
  PageWaitForMainLoadStateParamsSchema,
  PageWaitForLoadStateResultSchema,
);

export const PageWaitForSelectorActionSchema = createPageActionSchema(
  "PageWaitForSelectorAction",
  "waitForSelector",
  PageWaitForSelectorParamsSchema,
  PageWaitForSelectorResultSchema,
);

export const PageWaitForTimeoutActionSchema = createPageActionSchema(
  "PageWaitForTimeoutAction",
  "waitForTimeout",
  PageWaitForTimeoutParamsSchema,
  PageWaitForTimeoutResultSchema,
);

export const PageEvaluateActionSchema = createPageActionSchema(
  "PageEvaluateAction",
  "evaluate",
  PageEvaluateParamsSchema,
  PageEvaluateResultSchema,
);

export const PageSendCDPActionSchema = createPageActionSchema(
  "PageSendCDPAction",
  "sendCDP",
  PageSendCDPParamsSchema,
  PageSendCDPResultSchema,
);

export const PageCloseActionSchema = createPageActionSchema(
  "PageCloseAction",
  "close",
  PageCloseParamsSchema,
  PageCloseResultSchema,
);

/**
 * Union of every per-method page action schema, registered under the id
 * "PageAction". It is the `action` type used by the error, details and list
 * response schemas in this file.
 *
 * This is a plain `z.union`, so members are tried in the order listed here.
 */
export const PageActionSchema = z
  .union([
    PageClickActionSchema,
    PageHoverActionSchema,
    PageScrollActionSchema,
    PageDragAndDropActionSchema,
    PageTypeActionSchema,
    PageKeyPressActionSchema,
    PageEnableCursorOverlayActionSchema,
    PageAddInitScriptActionSchema,
    PageGotoActionSchema,
    PageReloadActionSchema,
    PageGoBackActionSchema,
    PageGoForwardActionSchema,
    PageTargetIdActionSchema,
    PageMainFrameIdActionSchema,
    PageMainFrameActionSchema,
    PageGetFullFrameTreeActionSchema,
    PageAsProtocolFrameTreeActionSchema,
    PageListAllFrameIdsActionSchema,
    PageGetOrdinalActionSchema,
    PageTitleActionSchema,
    PageUrlActionSchema,
    PageScreenshotActionSchema,
    PageSnapshotActionSchema,
    PageFramesActionSchema,
    PageSetViewportSizeActionSchema,
    PageSetExtraHTTPHeadersActionSchema,
    PageWaitForLoadStateActionSchema,
    PageWaitForMainLoadStateActionSchema,
    PageWaitForSelectorActionSchema,
    PageWaitForTimeoutActionSchema,
    PageEvaluateActionSchema,
    PageSendCDPActionSchema,
    PageCloseActionSchema,
  ])
  .meta({ id: "PageAction" });

/**
 * Error envelope: `success` is always `false`, `error` carries the page error,
 * `statusCode` is an integer, `stack` is required but may be `null`, and the
 * related `action` is optional. Unknown keys are rejected (`.strict()`).
 */
export const V4ErrorResponseSchema = z
  .object({
    success: z.literal(false),
    error: PageErrorSchema,
    statusCode: z.number().int(),
    stack: z.string().nullable(),
    action: PageActionSchema.optional(),
  })
  .strict()
  .meta({ id: "V4ErrorResponse" });

// Per-method response schemas. Each one is produced by
// `createPageResponseSchema(<schema id>, <matching action schema>)`.
// NOTE(review): `createPageResponseSchema` is defined outside this excerpt;
// presumably it wraps the action in the success envelope — confirm there.

export const PageClickResponseSchema = createPageResponseSchema(
  "PageClickResponse",
  PageClickActionSchema,
);

export const PageHoverResponseSchema = createPageResponseSchema(
  "PageHoverResponse",
  PageHoverActionSchema,
);

export const PageScrollResponseSchema = createPageResponseSchema(
  "PageScrollResponse",
  PageScrollActionSchema,
);

export const PageDragAndDropResponseSchema = createPageResponseSchema(
  "PageDragAndDropResponse",
  PageDragAndDropActionSchema,
);

export const PageTypeResponseSchema = createPageResponseSchema(
  "PageTypeResponse",
  PageTypeActionSchema,
);

export const PageKeyPressResponseSchema = createPageResponseSchema(
  "PageKeyPressResponse",
  PageKeyPressActionSchema,
);

export const PageEnableCursorOverlayResponseSchema = createPageResponseSchema(
  "PageEnableCursorOverlayResponse",
  PageEnableCursorOverlayActionSchema,
);

export const PageAddInitScriptResponseSchema = createPageResponseSchema(
  "PageAddInitScriptResponse",
  PageAddInitScriptActionSchema,
);

export const PageGotoResponseSchema = createPageResponseSchema(
  "PageGotoResponse",
  PageGotoActionSchema,
);

export const PageReloadResponseSchema = createPageResponseSchema(
  "PageReloadResponse",
  PageReloadActionSchema,
);

export const PageGoBackResponseSchema = createPageResponseSchema(
  "PageGoBackResponse",
  PageGoBackActionSchema,
);

export const PageGoForwardResponseSchema = createPageResponseSchema(
  "PageGoForwardResponse",
  PageGoForwardActionSchema,
);

export const PageTargetIdResponseSchema = createPageResponseSchema(
  "PageTargetIdResponse",
  PageTargetIdActionSchema,
);

export const PageMainFrameIdResponseSchema = createPageResponseSchema(
  "PageMainFrameIdResponse",
  PageMainFrameIdActionSchema,
);

export const PageMainFrameResponseSchema = createPageResponseSchema(
  "PageMainFrameResponse",
  PageMainFrameActionSchema,
);

export const PageGetFullFrameTreeResponseSchema = createPageResponseSchema(
  "PageGetFullFrameTreeResponse",
  PageGetFullFrameTreeActionSchema,
);

export const PageAsProtocolFrameTreeResponseSchema = createPageResponseSchema(
  "PageAsProtocolFrameTreeResponse",
  PageAsProtocolFrameTreeActionSchema,
);

export const PageListAllFrameIdsResponseSchema = createPageResponseSchema(
  "PageListAllFrameIdsResponse",
  PageListAllFrameIdsActionSchema,
);

export const PageGetOrdinalResponseSchema = createPageResponseSchema(
  "PageGetOrdinalResponse",
  PageGetOrdinalActionSchema,
);

export const PageTitleResponseSchema = createPageResponseSchema(
  "PageTitleResponse",
  PageTitleActionSchema,
);

export const PageUrlResponseSchema = createPageResponseSchema(
  "PageUrlResponse",
  PageUrlActionSchema,
);

export const PageScreenshotResponseSchema = createPageResponseSchema(
  "PageScreenshotResponse",
  PageScreenshotActionSchema,
);

export const PageSnapshotResponseSchema = createPageResponseSchema(
  "PageSnapshotResponse",
  PageSnapshotActionSchema,
);

export const PageFramesResponseSchema = createPageResponseSchema(
  "PageFramesResponse",
  PageFramesActionSchema,
);

export const PageSetViewportSizeResponseSchema = createPageResponseSchema(
  "PageSetViewportSizeResponse",
  PageSetViewportSizeActionSchema,
);

export const PageSetExtraHTTPHeadersResponseSchema = createPageResponseSchema(
  "PageSetExtraHTTPHeadersResponse",
  PageSetExtraHTTPHeadersActionSchema,
);

export const PageWaitForLoadStateResponseSchema = createPageResponseSchema(
  "PageWaitForLoadStateResponse",
  PageWaitForLoadStateActionSchema,
);

export const PageWaitForMainLoadStateResponseSchema = createPageResponseSchema(
  "PageWaitForMainLoadStateResponse",
  PageWaitForMainLoadStateActionSchema,
);

export const PageWaitForSelectorResponseSchema = createPageResponseSchema(
  "PageWaitForSelectorResponse",
  PageWaitForSelectorActionSchema,
);

export const PageWaitForTimeoutResponseSchema = createPageResponseSchema(
  "PageWaitForTimeoutResponse",
  PageWaitForTimeoutActionSchema,
);

export const PageEvaluateResponseSchema = createPageResponseSchema(
  "PageEvaluateResponse",
  PageEvaluateActionSchema,
);

export const PageSendCDPResponseSchema = createPageResponseSchema(
  "PageSendCDPResponse",
  PageSendCDPActionSchema,
);

export const PageCloseResponseSchema = createPageResponseSchema(
  "PageCloseResponse",
  PageCloseActionSchema,
);

/**
 * Strict object holding a single `actionId`.
 * NOTE(review): presumably the path params of the action-details route — confirm in the route definition.
 */
export const PageActionIdParamsSchema = z
  .object({
    actionId: ActionIdSchema,
  })
  .strict()
  .meta({ id: "PageActionIdParams" });

/** Query for a single action: a required `sessionId` and an optional request `id`. */
export const PageActionDetailsQuerySchema = z
  .object({
    id: RequestIdSchema.optional(),
    sessionId: SessionIdSchema,
  })
  .strict()
  .meta({ id: "PageActionDetailsQuery" });

/**
 * Query for listing actions. `sessionId` is required; `id`, `pageId`, `method`,
 * `status` and `limit` are optional.
 */
export const PageActionListQuerySchema = z
  .object({
    id: RequestIdSchema.optional(),
    sessionId: SessionIdSchema,
    pageId: PageIdSchema.optional(),
    method: PageActionMethodSchema.optional(),
    status: PageActionStatusSchema.optional(),
    // Coerced to a number before validation, then must be a positive integer of at most 500.
    limit: z.coerce.number().int().positive().max(500).optional(),
  })
  .strict()
  .meta({ id: "PageActionListQuery" });

/** Success envelope carrying one action: `success` is `true`, `error` is `null`. */
export const PageActionDetailsResponseSchema = z
  .object({
    success: z.literal(true),
    error: z.null(),
    action: PageActionSchema,
  })
  .strict()
  .meta({ id: "PageActionDetailsResponse" });

/** Success envelope carrying an array of actions: `success` is `true`, `error` is `null`. */
export const PageActionListResponseSchema = z
  .object({
    success: z.literal(true),
    error: z.null(),
    actions: z.array(PageActionSchema),
  })
  .strict()
  .meta({ id: "PageActionListResponse" });

/**
 * Named page schemas, keyed by component name. Entries are grouped in this
 * order: primitives and enums, selectors and shared objects, error envelopes,
 * `*Params`, `*Request`, `*Action`, `*Response`, then the action-history
 * query/response schemas.
 *
 * NOTE(review): the `*Result` schemas and `PageFrame` are not listed here even
 * though they carry `.meta({ id })` — confirm that omission is intentional.
 */
export const pageOpenApiComponents = {
  schemas: {
    RequestId: RequestIdSchema,
    SessionId: SessionIdSchema,
    PageId: PageIdSchema,
    FrameId: FrameIdSchema,
    ActionId: ActionIdSchema,
    CDPSessionId: CDPSessionIdSchema,
    Timestamp: TimestampSchema,
    MouseButton: MouseButtonSchema,
    LoadState: LoadStateSchema,
    WaitForSelectorState: WaitForSelectorStateSchema,
    ScreenshotType: ScreenshotTypeSchema,
    ScreenshotMimeType: ScreenshotMimeTypeSchema,
    ScreenshotScale: ScreenshotScaleSchema,
    ScreenshotAnimations: ScreenshotAnimationsSchema,
    ScreenshotCaret: ScreenshotCaretSchema,
    PageActionMethod: PageActionMethodSchema,
    PageActionStatus: PageActionStatusSchema,
    XPathSelector: XPathSelectorSchema,
    CssSelector: CssSelectorSchema,
    TextSelector: TextSelectorSchema,
    CoordinateSelector: CoordinateSelectorSchema,
    Selector: SelectorSchema,
    ElementSelector: ElementSelectorSchema,
    PageHeaders: PageHeadersSchema,
    PageInitScript: PageInitScriptSchema,
    PageClip: PageClipSchema,
    PageError: PageErrorSchema,
    ValidationErrorResponse: ValidationErrorResponseSchema,
    V4ErrorResponse: V4ErrorResponseSchema,
    PageActionBase: PageActionBaseSchema,
    PageClickParams: PageClickParamsSchema,
    PageHoverParams: PageHoverParamsSchema,
    PageScrollElementParams: PageScrollElementParamsSchema,
    PageScrollCoordinateParams: PageScrollCoordinateParamsSchema,
    PageScrollParams: PageScrollParamsSchema,
    PageDragAndDropParams: PageDragAndDropParamsSchema,
    PageTypeParams: PageTypeParamsSchema,
    PageKeyPressParams: PageKeyPressParamsSchema,
    PageEnableCursorOverlayParams: PageEnableCursorOverlayParamsSchema,
    PageAddInitScriptParams: PageAddInitScriptParamsSchema,
    PageGotoParams: PageGotoParamsSchema,
    PageReloadParams: PageReloadParamsSchema,
    PageGoBackParams: PageGoBackParamsSchema,
    PageGoForwardParams: PageGoForwardParamsSchema,
    PageTargetIdParams: PageTargetIdParamsSchema,
    PageMainFrameIdParams: PageMainFrameIdParamsSchema,
    PageMainFrameParams: PageMainFrameParamsSchema,
    PageGetFullFrameTreeParams: PageGetFullFrameTreeParamsSchema,
    PageAsProtocolFrameTreeParams: PageAsProtocolFrameTreeParamsSchema,
    PageListAllFrameIdsParams: PageListAllFrameIdsParamsSchema,
    PageGetOrdinalParams: PageGetOrdinalParamsSchema,
    PageTitleParams: PageTitleParamsSchema,
    PageUrlParams: PageUrlParamsSchema,
    PageScreenshotParams: PageScreenshotParamsSchema,
    PageSnapshotParams: PageSnapshotParamsSchema,
    PageFramesParams: PageFramesParamsSchema,
    PageSetViewportSizeParams: PageSetViewportSizeParamsSchema,
    PageSetExtraHTTPHeadersParams: PageSetExtraHTTPHeadersParamsSchema,
    PageWaitForLoadStateParams: PageWaitForLoadStateParamsSchema,
    PageWaitForMainLoadStateParams: PageWaitForMainLoadStateParamsSchema,
    PageWaitForSelectorParams: PageWaitForSelectorParamsSchema,
    PageWaitForTimeoutParams: PageWaitForTimeoutParamsSchema,
    PageEvaluateParams: PageEvaluateParamsSchema,
    PageSendCDPParams: PageSendCDPParamsSchema,
    PageCloseParams: PageCloseParamsSchema,
    PageClickRequest: PageClickRequestSchema,
    PageHoverRequest: PageHoverRequestSchema,
    PageScrollRequest: PageScrollRequestSchema,
    PageDragAndDropRequest: PageDragAndDropRequestSchema,
    PageTypeRequest: PageTypeRequestSchema,
    PageKeyPressRequest: PageKeyPressRequestSchema,
    PageEnableCursorOverlayRequest: PageEnableCursorOverlayRequestSchema,
    PageAddInitScriptRequest: PageAddInitScriptRequestSchema,
    PageGotoRequest: PageGotoRequestSchema,
    PageReloadRequest: PageReloadRequestSchema,
    PageGoBackRequest: PageGoBackRequestSchema,
    PageGoForwardRequest: PageGoForwardRequestSchema,
    PageTargetIdRequest: PageTargetIdRequestSchema,
    PageMainFrameIdRequest: PageMainFrameIdRequestSchema,
    PageMainFrameRequest: PageMainFrameRequestSchema,
    PageGetFullFrameTreeRequest: PageGetFullFrameTreeRequestSchema,
    PageAsProtocolFrameTreeRequest: PageAsProtocolFrameTreeRequestSchema,
    PageListAllFrameIdsRequest: PageListAllFrameIdsRequestSchema,
    PageGetOrdinalRequest: PageGetOrdinalRequestSchema,
    PageTitleRequest: PageTitleRequestSchema,
    PageUrlRequest: PageUrlRequestSchema,
    PageScreenshotRequest: PageScreenshotRequestSchema,
    PageSnapshotRequest: PageSnapshotRequestSchema,
    PageFramesRequest: PageFramesRequestSchema,
    PageSetViewportSizeRequest: PageSetViewportSizeRequestSchema,
    PageSetExtraHTTPHeadersRequest: PageSetExtraHTTPHeadersRequestSchema,
    PageWaitForLoadStateRequest: PageWaitForLoadStateRequestSchema,
    PageWaitForMainLoadStateRequest: PageWaitForMainLoadStateRequestSchema,
    PageWaitForSelectorRequest: PageWaitForSelectorRequestSchema,
    PageWaitForTimeoutRequest: PageWaitForTimeoutRequestSchema,
    PageEvaluateRequest: PageEvaluateRequestSchema,
    PageSendCDPRequest: PageSendCDPRequestSchema,
    PageCloseRequest: PageCloseRequestSchema,
    PageClickAction: PageClickActionSchema,
    PageHoverAction: PageHoverActionSchema,
    PageScrollAction: PageScrollActionSchema,
    PageDragAndDropAction: PageDragAndDropActionSchema,
    PageTypeAction: PageTypeActionSchema,
    PageKeyPressAction: PageKeyPressActionSchema,
    PageEnableCursorOverlayAction: PageEnableCursorOverlayActionSchema,
    PageAddInitScriptAction: PageAddInitScriptActionSchema,
    PageGotoAction: PageGotoActionSchema,
    PageReloadAction: PageReloadActionSchema,
    PageGoBackAction: PageGoBackActionSchema,
    PageGoForwardAction: PageGoForwardActionSchema,
    PageTargetIdAction: PageTargetIdActionSchema,
    PageMainFrameIdAction: PageMainFrameIdActionSchema,
    PageMainFrameAction: PageMainFrameActionSchema,
    PageGetFullFrameTreeAction: PageGetFullFrameTreeActionSchema,
    PageAsProtocolFrameTreeAction: PageAsProtocolFrameTreeActionSchema,
    PageListAllFrameIdsAction: PageListAllFrameIdsActionSchema,
    PageGetOrdinalAction: PageGetOrdinalActionSchema,
    PageTitleAction: PageTitleActionSchema,
    PageUrlAction: PageUrlActionSchema,
    PageScreenshotAction: PageScreenshotActionSchema,
    PageSnapshotAction: PageSnapshotActionSchema,
    PageFramesAction: PageFramesActionSchema,
    PageSetViewportSizeAction: PageSetViewportSizeActionSchema,
    PageSetExtraHTTPHeadersAction: PageSetExtraHTTPHeadersActionSchema,
    PageWaitForLoadStateAction: PageWaitForLoadStateActionSchema,
    PageWaitForMainLoadStateAction: PageWaitForMainLoadStateActionSchema,
    PageWaitForSelectorAction: PageWaitForSelectorActionSchema,
    PageWaitForTimeoutAction: PageWaitForTimeoutActionSchema,
    PageEvaluateAction: PageEvaluateActionSchema,
    PageSendCDPAction: PageSendCDPActionSchema,
    PageCloseAction: PageCloseActionSchema,
    PageAction: PageActionSchema,
    PageClickResponse: PageClickResponseSchema,
    PageHoverResponse: PageHoverResponseSchema,
    PageScrollResponse: PageScrollResponseSchema,
    PageDragAndDropResponse: PageDragAndDropResponseSchema,
    PageTypeResponse: PageTypeResponseSchema,
    PageKeyPressResponse: PageKeyPressResponseSchema,
    PageEnableCursorOverlayResponse: PageEnableCursorOverlayResponseSchema,
    PageAddInitScriptResponse: PageAddInitScriptResponseSchema,
    PageGotoResponse: PageGotoResponseSchema,
    PageReloadResponse: PageReloadResponseSchema,
    PageGoBackResponse: PageGoBackResponseSchema,
    PageGoForwardResponse: PageGoForwardResponseSchema,
    PageTargetIdResponse: PageTargetIdResponseSchema,
    PageMainFrameIdResponse: PageMainFrameIdResponseSchema,
    PageMainFrameResponse: PageMainFrameResponseSchema,
    PageGetFullFrameTreeResponse: PageGetFullFrameTreeResponseSchema,
    PageAsProtocolFrameTreeResponse: PageAsProtocolFrameTreeResponseSchema,
    PageListAllFrameIdsResponse: PageListAllFrameIdsResponseSchema,
    PageGetOrdinalResponse: PageGetOrdinalResponseSchema,
    PageTitleResponse: PageTitleResponseSchema,
    PageUrlResponse: PageUrlResponseSchema,
    PageScreenshotResponse: PageScreenshotResponseSchema,
    PageSnapshotResponse: PageSnapshotResponseSchema,
    PageFramesResponse: PageFramesResponseSchema,
    PageSetViewportSizeResponse: PageSetViewportSizeResponseSchema,
    PageSetExtraHTTPHeadersResponse: PageSetExtraHTTPHeadersResponseSchema,
    PageWaitForLoadStateResponse: PageWaitForLoadStateResponseSchema,
    PageWaitForMainLoadStateResponse: PageWaitForMainLoadStateResponseSchema,
    PageWaitForSelectorResponse: PageWaitForSelectorResponseSchema,
    PageWaitForTimeoutResponse: PageWaitForTimeoutResponseSchema,
    PageEvaluateResponse: PageEvaluateResponseSchema,
    PageSendCDPResponse: PageSendCDPResponseSchema,
    PageCloseResponse: PageCloseResponseSchema,
    PageActionIdParams: PageActionIdParamsSchema,
    PageActionDetailsQuery: PageActionDetailsQuerySchema,
    PageActionListQuery: PageActionListQuerySchema,
    PageActionDetailsResponse: PageActionDetailsResponseSchema,
    PageActionListResponse: PageActionListResponseSchema,
  },
};

// Static types derived from the schemas above via `z.infer` (the parsed/output
// shape), so the TypeScript types cannot drift from the runtime validation.
export type PageActionMethod = z.infer<typeof PageActionMethodSchema>;
export type PageActionStatus = z.infer<typeof PageActionStatusSchema>;
export type PageAction = z.infer<typeof PageActionSchema>;
export type PageActionDetailsQuery = z.infer<
  typeof PageActionDetailsQuerySchema
>;
export type PageActionListQuery = z.infer<typeof PageActionListQuerySchema>;

/**
 * Assembles an error envelope and validates it against `V4ErrorResponseSchema`.
 *
 * @param input.error - Error payload, in the schema's input shape.
 * @param input.statusCode - Status code to report.
 * @param input.stack - Optional stack trace; a missing or `undefined` value is sent as `null`.
 * @param input.action - Optional related action; the `action` key is left out entirely when falsy.
 * @returns The parsed error response.
 * @throws Whatever `V4ErrorResponseSchema.parse` throws when the assembled object is invalid.
 */
export function buildErrorResponse(input: {
  error: z.input<typeof PageErrorSchema>;
  statusCode: number;
  stack?: string | null;
  action?: z.input<typeof PageActionSchema>;
}) {
  const { error, statusCode, stack, action } = input;

  const envelope = {
    success: false,
    error,
    statusCode,
    stack: stack ?? null,
  };

  // The schema is strict and `action` is optional, so the key is only added
  // when there is an action to report.
  return V4ErrorResponseSchema.parse(
    action ? { ...envelope, action } : envelope,
  );
}


================================================
FILE: packages/server-v4/src/sea-entry.ts
================================================
import { __internalMaybeRunShutdownSupervisorFromArgv } from "@browserbasehq/stagehand";

// Entry point for the SEA binary. The process argv is handed to the shutdown
// supervisor hook first; the HTTP server is only loaded when that hook
// reports that it did not take over.
const rawArgs = process.argv.slice(1);

// If the first remaining entry is not a `--flag`, drop it so the list handed
// to the hook starts one position later.
const startsWithFlag = rawArgs[0]?.startsWith("--") ?? false;
const supervisorArgs = startsWithFlag ? rawArgs : rawArgs.slice(1);

const supervisorTookOver =
  __internalMaybeRunShutdownSupervisorFromArgv(supervisorArgs);

// Otherwise, start the stagehand server; a failed import is fatal.
if (!supervisorTookOver) {
  void import("./server.js").catch((err) => {
    console.error("Failed to start server:", err);
    process.exit(1);
  });
}


================================================
FILE: packages/server-v4/src/server.ts
================================================
import fastify from "fastify";
import fastifySwagger from "@fastify/swagger";
import fastifySwaggerUI from "@fastify/swagger-ui";
import {
  fastifyZodOpenApiPlugin,
  fastifyZodOpenApiTransformers,
  serializerCompiler,
  validatorCompiler,
  type FastifyZodOpenApiTypeProvider,
} from "fastify-zod-openapi";
import { StatusCodes } from "http-status-codes";

import { browserSessionOpenApiComponents } from "./schemas/v4/browserSession.js";
import { pageOpenApiComponents } from "./schemas/v4/page.js";
import healthcheckRoute from "./routes/healthcheck.js";
import readinessRoute, { setReady, setUnready } from "./routes/readiness.js";
import { browserSessionRoutesPlugin } from "./routes/v4/browsersession/routes.js";
import { pageRoutesPlugin } from "./routes/v4/page/routes.js";

// Single Fastify instance for this process. Fastify's built-in logger is off
// and `return503OnClosing` is disabled.
const app = fastify({
  return503OnClosing: false,
  logger: false,
});

// Some clients always send `Content-Type: application/json`, even when the
// request has no body at all (0 bytes, e.g. /end). Treat that case as an empty
// object and hand everything else to Fastify's default JSON parser.
const defaultJsonParser = app.getDefaultJsonParser("error", "error");
app.addContentTypeParser<string>(
  "application/json",
  { parseAs: "string" },
  (request, body, done) => {
    const hasNoPayload =
      body === "" || (Buffer.isBuffer(body) && body.length === 0);

    if (!hasNoPayload) {
      void defaultJsonParser(request, body, done);
      return;
    }

    done(null, {});
  },
);

/**
 * Configures the shared Fastify `app` and starts listening.
 *
 * Steps, in order: install the Zod validator/serializer compilers, register the
 * OpenAPI plugin with the browser-session and page component schemas, register
 * Swagger (and Swagger UI in development only), install the error handler,
 * mount the `/v4` route plugins plus the root health/readiness routes, then
 * listen on `0.0.0.0:$PORT` (default 3000) and flag the server as ready.
 *
 * Any failure is logged and terminates the process with exit code 1.
 */
const start = async () => {
  try {
    app.setValidatorCompiler(validatorCompiler);
    app.setSerializerCompiler(serializerCompiler);

    await app.register(fastifyZodOpenApiPlugin, {
      components: {
        schemas: {
          ...browserSessionOpenApiComponents.schemas,
          ...pageOpenApiComponents.schemas,
        },
      },
    });

    await app.register(fastifySwagger, {
      openapi: {
        info: {
          title: "Stagehand API",
          version: "3.0.5",
        },
        openapi: "3.1.0",
        tags: [
          {
            name: "browserSession",
            description: "Browser session lifecycle and browser-scoped actions",
          },
          {
            name: "page",
            description: "Page-scoped actions and action history endpoints",
          },
        ],
      },
      ...fastifyZodOpenApiTransformers,
    });

    // Only register Swagger UI in development - SEA binaries can't load static files
    if (process.env.NODE_ENV === "development") {
      await app.register(fastifySwaggerUI, {
        routePrefix: "/documentation",
      });
    }

    app.setErrorHandler((error, _request, reply) => {
      // Thrown values are not guaranteed to be objects; fall back to an empty
      // record so the property reads below cannot themselves throw.
      const details = (error ?? {}) as {
        validation?: unknown[];
        statusCode?: number;
        isInternal?: boolean;
      };

      const isValidationError = Boolean(details.validation);
      const statusCode = isValidationError
        ? StatusCodes.BAD_REQUEST
        : (details.statusCode ?? StatusCodes.INTERNAL_SERVER_ERROR);
      const errorMessage = isValidationError
        ? "Request validation failed"
        : error instanceof Error
          ? error.message
          : String(error);

      // Hide the real message for plain 500s and for any error that flags
      // itself as internal (an `isInternal` property set to true), so upstream
      // details are not echoed to the client on other 5xx codes either.
      const hideDetails =
        statusCode === Number(StatusCodes.INTERNAL_SERVER_ERROR) ||
        details.isInternal === true;

      reply.status(statusCode).send({
        error: hideDetails ? "Internal Server Error" : errorMessage,
        statusCode,
      });
    });

    const appWithTypes = app.withTypeProvider<FastifyZodOpenApiTypeProvider>();

    await appWithTypes.register(browserSessionRoutesPlugin, { prefix: "/v4" });
    await appWithTypes.register(pageRoutesPlugin, { prefix: "/v4" });

    // Register health and readiness routes at the root level
    appWithTypes.route(healthcheckRoute);
    appWithTypes.route(readinessRoute);
    await app.ready();

    await app.listen({
      host: "0.0.0.0",
      port: parseInt(process.env.PORT ?? "3000", 10),
    });
    // Readiness is only flipped once the socket is actually listening.
    setReady();
  } catch (err) {
    console.error("Failed to start server:", err);
    process.exit(1);
  }
};

/**
 * Shutdown sequence: mark the server unready, close the Fastify app, then exit
 * with code 0.
 */
const shutdown = async (): Promise<void> => {
  setUnready();
  await app.close();
  process.exit(0);
};

// One listener shared by both termination signals: run the shutdown sequence
// and exit with code 1 if it fails.
const onTerminationSignal = (): void => {
  shutdown().catch((err: unknown) => {
    console.error("Failed to shut down cleanly:", err);
    process.exit(1);
  });
};

for (const signal of ["SIGTERM", "SIGINT"] as const) {
  process.on(signal, onTerminationSignal);
}

// Boot the server; `start` handles its own failures, this is the final safety net.
start().catch((err: unknown) => {
  console.error("Failed to start server:", err);
  process.exit(1);
});


================================================
FILE: packages/server-v4/src/types/error.ts
================================================
import { StatusCodes } from "http-status-codes";

/**
 * Base class for the application errors in this file. Carries the HTTP status
 * code to report and an `isInternal` flag.
 */
export class AppError extends Error {
  public readonly statusCode: number;
  public readonly isInternal: boolean;

  /**
   * @param message - Error message.
   * @param statusCode - HTTP status code; defaults to `StatusCodes.INTERNAL_SERVER_ERROR`.
   * @param isInternal - Defaults to `false`. `BrowserbaseSDKError` sets it for 5xx statuses.
   */
  constructor(
    message: string,
    statusCode: number = StatusCodes.INTERNAL_SERVER_ERROR,
    isInternal = false,
  ) {
    super(message);
    // `new.target` is the constructor actually invoked, so subclasses report
    // their own class name without overriding `name` themselves.
    this.name = new.target.name;
    this.statusCode = statusCode;
    this.isInternal = isInternal;
  }
}

/** `StatusCodes.BAD_REQUEST` error with the message `Unknown model: <model>`. */
export class UnknownModelError extends AppError {
  constructor(model: string) {
    super(`Unknown model: ${model}`, StatusCodes.BAD_REQUEST);
  }
}
/** `StatusCodes.BAD_REQUEST` error with the message `Invalid provider: <provider>`. */
export class InvalidProviderError extends AppError {
  constructor(provider: string) {
    super(`Invalid provider: ${provider}`, StatusCodes.BAD_REQUEST);
  }
}

/** `StatusCodes.BAD_REQUEST` error with the message `Invalid model: <model>`. */
export class InvalidModelError extends AppError {
  constructor(model: string) {
    super(`Invalid model: ${model}`, StatusCodes.BAD_REQUEST);
  }
}

/** `StatusCodes.UNAUTHORIZED` error with the fixed message "Unauthorized". */
export class UnauthorizedError extends AppError {
  constructor() {
    super("Unauthorized", StatusCodes.UNAUTHORIZED);
  }
}

/** `StatusCodes.BAD_REQUEST` error naming the required header that was missing. */
export class MissingHeaderError extends AppError {
  constructor(header: string) {
    super(`Missing required header: ${header}`, StatusCodes.BAD_REQUEST);
  }
}

/**
 * Error for an invalid provider API key. Note that it reports
 * `StatusCodes.BAD_REQUEST`, not `StatusCodes.UNAUTHORIZED`.
 */
export class InvalidAPIKeyError extends AppError {
  constructor(provider: string) {
    super(`Invalid API key for provider: ${provider}`, StatusCodes.BAD_REQUEST);
  }
}

/**
 * `StatusCodes.CONFLICT` error for closing a session that is not active. Also
 * thrown from the `BrowserbaseSDKError` constructor when the upstream message
 * contains "is not running".
 */
export class AttemptedCloseOnNonActiveSessionError extends AppError {
  constructor() {
    super(
      "Attempted to close session that is not currently active",
      StatusCodes.CONFLICT,
    );
  }
}

/**
 * Loose view of the error shapes read by `BrowserbaseSDKError`. Every field is
 * optional because the incoming value is an untyped `unknown`.
 */
interface BrowserbaseError {
  status?: number;
  statusCode?: number;
  message?: string;
  response?: {
    status?: number;
    data?: {
      message?: string;
    };
  };
}

/**
 * Normalises an arbitrary thrown value into an `AppError`.
 *
 * - Message: the error's own `message`, else `response.data.message`, else
 *   `defaultMessage`. Only non-empty strings are accepted.
 * - Status: the first non-zero number among `status`, `statusCode` and
 *   `response.status`, else `StatusCodes.BAD_REQUEST`.
 * - Statuses at or above `StatusCodes.INTERNAL_SERVER_ERROR` set `isInternal`.
 *
 * @param error - The caught value; may be `null`, `undefined` or a primitive.
 * @param defaultMessage - Message used when none can be extracted.
 * @throws AttemptedCloseOnNonActiveSessionError - Thrown from the constructor
 *   (instead of constructing this class) when the message contains
 *   "is not running".
 */
export class BrowserbaseSDKError extends AppError {
  constructor(error: unknown, defaultMessage: string) {
    // A caught value can be null, undefined or a primitive. Destructuring
    // null/undefined would throw a TypeError and mask the real failure, so
    // anything that is not an object is treated as carrying no details.
    const browserbaseError: BrowserbaseError =
      typeof error === "object" && error !== null
        ? (error as BrowserbaseError)
        : {};
    const {
      message: errMessage,
      status,
      statusCode: errStatusCode,
      response,
    } = browserbaseError;

    let message = defaultMessage;
    let finalStatusCode = StatusCodes.BAD_REQUEST;

    // Extract message from error. The declared types are not enforced at
    // runtime, so only real strings are accepted; `message.includes` below
    // would throw on anything else.
    const responseMessage = response?.data?.message;
    if (typeof errMessage === "string" && errMessage) {
      message = errMessage;
    } else if (typeof responseMessage === "string" && responseMessage) {
      message = responseMessage;
    }

    // Extract status code from error
    if (status && typeof status === "number") {
      finalStatusCode = status as StatusCodes;
    } else if (errStatusCode && typeof errStatusCode === "number") {
      finalStatusCode = errStatusCode as StatusCodes;
    } else if (response?.status && typeof response.status === "number") {
      finalStatusCode = response.status as StatusCodes;
    }

    // Check for specific session error. Throwing before `super()` means the
    // caller receives the more specific error instead of this class.
    if (message.includes("is not running")) {
      throw new AttemptedCloseOnNonActiveSessionError();
    }

    // Mark 5xx errors as internal to sanitize sensitive details
    const isInternal =
      Number(finalStatusCode) >= Number(StatusCodes.INTERNAL_SERVER_ERROR);

    super(message, finalStatusCode, isInternal);
  }
}


================================================
FILE: packages/server-v4/src/types/fastify.d.ts
================================================
import "fastify";

// Module augmentation: extends Fastify's request type with a `metrics` object.
declare module "fastify" {
  interface FastifyRequest {
    /** Per-request metrics carried on the request object. */
    metrics: {
      /** Request start time as a number — presumably an epoch-ms timestamp; confirm where it is set. */
      startTime: number;
    };
  }
}


================================================
FILE: packages/server-v4/src/types/model.ts
================================================
/**
 * Known provider identifiers, declared `as const` so the literal values can be
 * reused at the type level (see `AISDKProvider`).
 */
export const AISDK_PROVIDERS = [
  "openai",
  "anthropic",
  "google",
  "xai",
  "azure",
  "groq",
  "cerebras",
  "togetherai",
  "mistral",
  "deepseek",
  "perplexity",
  "ollama",
  "vertex",
  "bedrock",
] as const;
/** Union of the string literals listed in `AISDK_PROVIDERS`. */
export type AISDKProvider = (typeof AISDK_PROVIDERS)[number];

/**
 * Closed set of model-name literals accepted under the legacy naming scheme
 * (bare model names without a provider prefix).
 */
export type LegacyModel =
  | "gpt-4o"
  | "gpt-4o-mini"
  | "gpt-4o-2024-08-06"
  | "gpt-4o-2024-05-13"
  | "cerebras-llama-3.3-70b"
  | "cerebras-llama-3.1-8b"
  | "o1-mini"
  | "o1-preview"
  | "o3-mini"
  | "gpt-4.5-preview"
  | "groq-llama-3.3-70b-specdec"
  | "groq-llama-3.3-70b-versatile"
  | "gemini-1.5-flash"
  | "gemini-1.5-pro"
  | "gemini-1.5-flash-8b"
  | "gemini-2.0-flash-lite"
  | "gemini-2.0-flash"
  | "gemini-2.5-pro-preview-03-25"
  | "gemini-2.5-flash-preview-04-17";

/** Provider identifiers recognised under the legacy scheme. */
export type LegacyProvider = "openai" | "anthropic" | "google";


================================================
FILE: packages/server-v4/src/types/rrweb.ts
================================================
/**
 * Recursive tree node: each node has a numeric `id`, a `type`, and optionally
 * a tag name, attributes, text content and child nodes.
 * NOTE(review): presumably mirrors rrweb's serialized DOM node shape — confirm.
 */
export interface Node {
  type: string;
  tagName?: string;
  attributes?: Record<string, string>;
  /** Nested children, forming the tree. */
  childNodes?: Node[];
  textContent?: string;
  id: number;
}

/** A recorded event together with the action (and optionally session) it belongs to. */
export interface Event {
  type: number;
  /*
  The data object has a different shape for each event type, but it is only
  accessed when it follows this structure, so it is typed this way for
  simplicity. Do not assume `data.node` exists for every event type.
  */
  data: { node: Node };
  sessionId?: string;
  timestamp: Date;
  actionId: string;
}


================================================
FILE: packages/server-v4/test/integration/utils.ts
================================================
import fs from "node:fs";
import path from "node:path";
import { chromium } from "playwright";

// =============================================================================
// HTTP Status Codes
// =============================================================================

// Numeric HTTP status codes shared by the integration tests so assertions
// can use names instead of bare numbers.
export const HTTP_OK = 200;
export const HTTP_BAD_REQUEST = 400;
export const HTTP_NOT_FOUND = 404;
export const HTTP_GONE = 410;
export const HTTP_UNPROCESSABLE_ENTITY = 422;
export const HTTP_INTERNAL_SERVER_ERROR = 500;

// =============================================================================
// Timing Constants
// =============================================================================

/**
 * Wait duration in milliseconds (2 seconds).
 * NOTE(review): presumably the pause tests take after closing a session — usage is not shown in this file.
 */
export const SESSION_CLOSE_WAIT_MS = 2000;

// =============================================================================
// Environment Variables
// =============================================================================

// Snapshot of the relevant environment variables, read once at module load.
// Each value is `string | undefined`; later changes to process.env are not reflected.
export const {
  STAGEHAND_API_URL,
  OPENAI_API_KEY,
  GEMINI_API_KEY,
  ANTHROPIC_API_KEY,
} = process.env;

// =============================================================================
// Utility Functions
// =============================================================================

/**
 * Returns `value` when it is a non-empty string, otherwise fails loudly.
 *
 * @param name - Environment variable name, used only in the error message.
 * @param value - The value read for that variable (may be undefined or empty).
 * @returns The same `value`, now guaranteed to be a non-empty string.
 * @throws Error when `value` is undefined or an empty string.
 */
export function requireEnv(name: string, value: string | undefined): string {
  if (value) {
    return value;
  }
  throw new Error(`Missing required environment variable: ${name}`);
}

/**
 * Resolves the base URL of the server under test.
 *
 * @returns `STAGEHAND_API_URL` when it is set (even to an empty string),
 *   otherwise the local default `http://127.0.0.1:3107`.
 */
export function getBaseUrl(): string {
  const configuredUrl = STAGEHAND_API_URL;
  if (configuredUrl !== undefined && configuredUrl !== null) {
    return configuredUrl;
  }
  return "http://127.0.0.1:3107";
}

// =============================================================================
// Header Generators
// =============================================================================

/**
 * Builds the JSON request headers sent by the integration tests.
 *
 * @param sdkVersion - Value for the `x-sdk-version` header.
 * @param language - Value for the `x-language` header (defaults to "typescript").
 * @returns Header map; `x-model-api-key` is `OPENAI_API_KEY` when set,
 *   otherwise the placeholder "test-model-api-key".
 */
export function getHeaders(
  sdkVersion: string,
  language: string = "typescript",
): Record<string, string> {
  const modelApiKey = OPENAI_API_KEY ?? "test-model-api-key";

  const result: Record<string, string> = {
    "Content-Type": "application/json",
  };
  result["x-model-api-key"] = modelApiKey;
  result["x-language"] = language;
  result["x-sdk-version"] = sdkVersion;
  return result;
}

// =============================================================================
// Session Management
// =============================================================================

/** Response envelope expected from `POST /v4/browsersession`. */
export interface StartSessionResponse {
  success: boolean;
  /** Optional message accompanying the response. */
  message?: string;
  /** Optional payload describing the browser session. */
  data?: {
    browserSession: {
      id: string;
      /** CDP endpoint for the session's browser. */
      cdpUrl: string;
      available: boolean;
    };
  };
}

// Fixed pause (ms) applied after a session is created, before it is handed to a test.
const SESSION_READY_DELAY_MS = 250;

// Connect timeout (ms) for local browser launches. Overridable through
// STAGEHAND_TEST_LOCAL_CONNECT_TIMEOUT_MS; anything that is not a finite,
// strictly positive number falls back to 60 seconds.
const LOCAL_CONNECT_TIMEOUT_MS = ((rawTimeout: string | undefined): number => {
  const candidate = Number(rawTimeout);
  if (!Number.isFinite(candidate) || candidate <= 0) {
    return 60_000;
  }
  return candidate;
})(process.env.STAGEHAND_TEST_LOCAL_CONNECT_TIMEOUT_MS);

/** Identifier and CDP endpoint of a created browser session. */
export interface SessionInfo {
  sessionId: string;
  cdpUrl: string;
}

/**
 * Builds the request-body fragment that asks the server for a LOCAL headless
 * browser session.
 *
 * The Chrome executable is taken from `CHROME_PATH` when that variable is set
 * (and must then exist on disk), otherwise from Playwright's bundled Chromium.
 * `--no-sandbox` is added only when the `CI` environment variable is set.
 *
 * @throws Error when `CHROME_PATH` points at a missing file, or when no
 *   executable can be located at all.
 */
function createLocalBrowserBody() {
  const locateChrome = (): string => {
    const fromEnv = process.env.CHROME_PATH;
    if (fromEnv) {
      // An explicit path is authoritative: never silently fall back from it.
      if (!fs.existsSync(fromEnv)) {
        throw new Error(`CHROME_PATH does not exist: ${fromEnv}`);
      }
      return fromEnv;
    }

    const bundled = chromium.executablePath();
    if (!bundled || !fs.existsSync(bundled)) {
      throw new Error(
        "Unable to locate a Chrome executable. Set CHROME_PATH in the test environment.",
      );
    }
    return bundled;
  };

  const executablePath = locateChrome();
  const args = process.env.CI ? ["--no-sandbox"] : undefined;

  return {
    env: "LOCAL",
    localBrowserLaunchOptions: {
      headless: true,
      executablePath,
      args,
      connectTimeoutMs: LOCAL_CONNECT_TIMEOUT_MS,
    },
  };
}

// Shared LOCAL launch body, built once at module load. Because it is evaluated
// on import, importing this module throws if no Chrome executable can be resolved.
export const LOCAL_BROWSER_BODY = createLocalBrowserBody();

/**
 * Produces a multi-line, human-readable report about the local browser launch
 * configuration, for inclusion in session-creation failure messages.
 *
 * The report lists the `CHROME_PATH` and `CI` environment values, the profile
 * directory, the contents of `chrome-out.log` / `chrome-err.log` inside that
 * directory when they exist, and the individual launch options.
 *
 * @param launchOptions - Launch options that were sent to the server, if any.
 * @returns The report lines joined with "\n".
 */
function readLaunchDiagnostics(launchOptions?: {
  executablePath?: string;
  args?: string[];
  headless?: boolean;
  userDataDir?: string;
  port?: number;
  connectTimeoutMs?: number;
}): string {
  const profileDir = launchOptions?.userDataDir;
  const report: string[] = [
    "--- launch diagnostics ---",
    `CHROME_PATH env: ${process.env.CHROME_PATH ?? "<unset>"}`,
    `CI env: ${process.env.CI ?? "<unset>"}`,
    `userDataDir: ${profileDir ?? "<auto>"}`,
  ];

  if (profileDir) {
    const profileDirExists = fs.existsSync(profileDir);
    report.push(`userDataDir exists: ${profileDirExists}`);

    if (profileDirExists) {
      // Chrome's captured output, when the launcher wrote it into the profile dir.
      const stdoutLog = path.join(profileDir, "chrome-out.log");
      const stderrLog = path.join(profileDir, "chrome-err.log");
      if (fs.existsSync(stdoutLog)) {
        report.push(
          `--- chrome stdout ---\n${fs.readFileSync(stdoutLog, "utf8")}`,
        );
      }
      if (fs.existsSync(stderrLog)) {
        report.push(
          `--- chrome stderr ---\n${fs.readFileSync(stderrLog, "utf8")}`,
        );
      }
    }
  } else {
    report.push(
      "chrome stdout/stderr logs unavailable (profile dir auto-managed by server launch)",
    );
  }

  if (launchOptions) {
    const { executablePath, headless, args, port, connectTimeoutMs } =
      launchOptions;
    const executableExists = executablePath
      ? fs.existsSync(executablePath)
      : false;

    report.push(
      `launch.executablePath: ${executablePath ?? "<unset>"}`,
      `launch.executablePath exists: ${executableExists}`,
      `launch.headless: ${String(headless)}`,
      `launch.args: ${JSON.stringify(args ?? [])}`,
      `launch.port: ${port ?? "<auto>"}`,
      `launch.connectTimeoutMs: ${connectTimeoutMs ?? "<default>"}`,
    );
  }

  return report.join("\n");
}

/**
 * Creates a local browser session and returns only its id.
 * Convenience wrapper for callers that do not need the CDP URL.
 *
 * @param headers - Request headers forwarded to the session-creation call.
 * @returns The id of the newly created session.
 */
export async function createSession(
  headers: Record<string, string>,
): Promise<string> {
  const { sessionId } = await createSessionWithCdp(headers);
  return sessionId;
}

/**
 * Creates a LOCAL browser session via `POST /v4/browsersession` and returns
 * its id together with its CDP URL.
 *
 * @param headers - Request headers to send.
 * @returns The session id and CDP URL reported by the server.
 * @throws Error when the request fails or reports `success !== true` (the
 *   message then includes the response body and launch diagnostics), or when
 *   the session is unavailable or lacks an id / CDP URL.
 */
export async function createSessionWithCdp(
  headers: Record<string, string>,
): Promise<SessionInfo> {
  const baseUrl = getBaseUrl();
  const startPayload = {
    modelName: "gpt-4.1-nano",
    ...createLocalBrowserBody(),
  };

  const response = await fetch(`${baseUrl}/v4/browsersession`, {
    method: "POST",
    headers,
    body: JSON.stringify(startPayload),
  });
  const responseText = await response.text();

  // Decode JSON when possible; keep the raw text otherwise so that it still
  // shows up in the failure message below. An empty body becomes null.
  let parsedBody: unknown = null;
  if (responseText) {
    try {
      parsedBody = JSON.parse(responseText);
    } catch {
      parsedBody = responseText;
    }
  }
  const body = parsedBody as StartSessionResponse;

  if (!response.ok || !body?.success) {
    const launchDiagnostics = readLaunchDiagnostics(
      startPayload.localBrowserLaunchOptions,
    );
    const serializedBody = JSON.stringify(parsedBody);
    throw new Error(
      `Failed to create session (status=${response.status}): ${serializedBody}\n${launchDiagnostics}`,
    );
  }

  const data = body.data;
  if (!data || !data.browserSession.available) {
    throw new Error(`Session not available`);
  }
  const { id, cdpUrl } = data.browserSession;
  if (!id) {
    throw new Error("No browserSession id returned");
  }
  if (!cdpUrl) {
    throw new Error("No cdpUrl returned");
  }

  // Give the session a moment to become fully ready before handing it out
  await new Promise((resolve) => setTimeout(resolve, SESSION_READY_DELAY_MS));

  return { sessionId: id, cdpUrl };
}

/**
 * Ends a browser session via `POST /v4/browsersession/:id/end`.
 * The response is not inspected: a non-2xx status does not cause a rejection,
 * only a failure of the request itself does.
 *
 * @param sessionId - Id of the session to end.
 * @param headers - Request headers to send.
 */
export async function endSession(
  sessionId: string,
  headers: Record<string, string>,
): Promise<void> {
  const endpoint = `${getBaseUrl()}/v4/browsersession/${sessionId}/end`;
  const request: RequestInit = {
    method: "POST",
    headers,
    body: JSON.stringify({}),
  };

  await fetch(endpoint, request);
}

/**
 * Looks up the main frame id of the first page in the first browser context
 * reachable through the given CDP endpoint.
 *
 * @param cdpUrl - CDP endpoint to connect to.
 * @returns The id of the root frame reported by `Page.getFrameTree`.
 * @throws Error when the browser exposes no contexts or no pages.
 */
export async function getMainFrameId(cdpUrl: string): Promise<string> {
  const browser = await chromium.connectOverCDP(cdpUrl);
  try {
    const [firstContext] = browser.contexts();
    if (firstContext === undefined) {
      throw new Error("No browser contexts found");
    }

    const [firstPage] = firstContext.pages();
    if (firstPage === undefined) {
      throw new Error("No pages found");
    }

    // Ask CDP for the frame tree; its root is the main frame.
    const cdpSession = await firstPage.context().newCDPSession(firstPage);
    const treeResponse = await cdpSession.send("Page.getFrameTree");
    await cdpSession.detach();

    return treeResponse.frameTree.frame.id;
  } finally {
    // Always drop this helper's CDP connection, even on failure.
    await browser.close();
  }
}

// =============================================================================
// SSE Stream Reader
// =============================================================================

/**
 * Legacy, generic SSE event as produced by `readSSEStream`.
 * All fields are optional because an event may carry only some of them.
 */
export interface SSEEvent {
  /** Value of the `event:` field, trimmed. */
  event?: string;
  /** Value of the `data:` field, trimmed. */
  data?: string;
  /** `data` decoded as JSON; absent when `data` is not valid JSON. */
  parsed?: unknown;
}

/**
 * Reads a whole SSE response body and splits it into generic events.
 *
 * Events are separated by a blank line. LF, CRLF and CR line endings are all
 * accepted, as allowed by the SSE wire format. For each event, the `event:`
 * and `data:` fields are extracted and trimmed; when an event repeats a field,
 * the last occurrence wins. `data` is additionally decoded as JSON into
 * `parsed` when possible.
 *
 * @param response - Fetch response whose body is an SSE stream.
 * @returns Events that carry at least an `event` or a `data` field.
 * @throws Error when the response has no readable body.
 */
export async function readSSEStream(response: Response): Promise<SSEEvent[]> {
  const reader = response.body?.getReader() as
    | ReadableStreamDefaultReader<Uint8Array>
    | undefined;
  if (!reader) {
    throw new Error("No response body reader available");
  }

  const decoder = new TextDecoder();
  let fullResponse = "";

  for (;;) {
    const result = await reader.read();
    if (result.done) break;
    fullResponse += decoder.decode(result.value, { stream: true });
  }
  // Flush the streaming decoder so a truncated trailing multi-byte sequence
  // surfaces as U+FFFD instead of being silently dropped.
  fullResponse += decoder.decode();

  // Normalize CRLF / lone CR to LF so the blank-line split below also works
  // for servers or proxies that emit CRLF-delimited streams.
  const normalized = fullResponse.replace(/\r\n?/g, "\n");

  // Parse SSE events
  const events: SSEEvent[] = [];
  const rawEvents = normalized.split("\n\n").filter((e) => e.trim());

  for (const rawEvent of rawEvents) {
    const event: SSEEvent = {};

    for (const line of rawEvent.split("\n")) {
      if (line.startsWith("event:")) {
        event.event = line.slice(6).trim();
      } else if (line.startsWith("data:")) {
        event.data = line.slice(5).trim();
        try {
          event.parsed = JSON.parse(event.data);
        } catch {
          // Keep as string if not valid JSON
        }
      }
    }

    if (event.data || event.event) {
      events.push(event);
    }
  }

  return events;
}

// =============================================================================
// Typed SSE Event Helpers (for stagehand-api backend format)
// =============================================================================

// Actual SSE event format from backend (see stream.ts):
// { data: { status: "starting" | "connected" | "finished", result?: ... }, type: "system" | "log", id: "<uuid>" }
/**
 * JSON payload carried in the `data:` field of one backend SSE event.
 *
 * @typeParam TResult - Shape of `data.result` when present.
 */
export interface TypedSSEEvent<TResult = unknown> {
  data: {
    /** Status string, e.g. "starting", "connected", "finished"; the helpers in this file also look for "error". */
    status: string;
    result?: TResult;
    message?: string;
    /** Error text; read by debug summaries for events whose status is "error". */
    error?: string;
  };
  /** Event category, e.g. "system" or "log". */
  type: string;
  id: string;
}

/**
 * Reads an entire response body and returns it as one UTF-8 decoded string.
 *
 * The body is consumed chunk by chunk through a streaming decoder, so
 * multi-byte characters split across chunks decode correctly. The decoder is
 * flushed at the end, which makes a truncated trailing sequence visible as
 * U+FFFD instead of silently dropping it.
 *
 * @param response - Fetch response to drain.
 * @returns The full decoded body.
 * @throws Error when the response has no readable body.
 */
export async function readSSEStreamRaw(response: Response): Promise<string> {
  const reader = response.body?.getReader() as
    | ReadableStreamDefaultReader<Uint8Array>
    | undefined;
  if (!reader) throw new Error("No response body reader");

  const decoder = new TextDecoder();
  let fullResponse = "";

  for (;;) {
    const result = await reader.read();
    if (result.done) break;
    fullResponse += decoder.decode(result.value, { stream: true });
  }
  // Final call without `stream: true` flushes any bytes still buffered.
  fullResponse += decoder.decode();

  return fullResponse;
}

/**
 * Parses a raw SSE response string into typed events.
 *
 * Events are separated by a blank line; LF, CRLF and CR line endings are all
 * accepted. Within each event, the first line that starts with `data:` is
 * JSON-decoded (the space after the colon is optional, as in the SSE wire
 * format). Events without a non-empty `data:` line are skipped.
 *
 * @param rawResponse - Full SSE body as text.
 * @returns One decoded payload per event that has a data line.
 * @throws SyntaxError when a data line is not valid JSON.
 */
export function parseTypedSSEEvents<TResult = unknown>(
  rawResponse: string,
): TypedSSEEvent<TResult>[] {
  // Normalize CRLF / lone CR so the blank-line split works for any line ending.
  const normalized = rawResponse.replace(/\r\n?/g, "\n");
  const parsedEvents: TypedSSEEvent<TResult>[] = [];

  for (const block of normalized.split("\n\n")) {
    // Anchor to the start of a line so "data:" inside another field's value
    // is never mistaken for the data field.
    const payload = /^data:(.*)$/m.exec(block)?.[1]?.trim();
    if (payload) {
      parsedEvents.push(JSON.parse(payload) as TypedSSEEvent<TResult>);
    }
  }

  return parsedEvents;
}

/**
 * Result of reading an SSE stream with full context for debugging.
 * Bundles the HTTP status line, the raw body, and the parsed events so that
 * assertion helpers can produce informative failure messages.
 *
 * @typeParam TResult - Shape of each event's `data.result`.
 */
export interface SSEStreamResult<TResult = unknown> {
  /** HTTP status code */
  status: number;
  /** HTTP status text */
  statusText: string;
  /** Raw response body */
  raw: string;
  /** Parsed SSE events */
  events: TypedSSEEvent<TResult>[];
  /** Get debug summary for error messages */
  debugSummary(): string;
}

/**
 * Drains an SSE response and decodes it into typed events.
 * Legacy variant: returns the events only, without HTTP or raw-body context.
 *
 * @param response - Fetch response whose body is an SSE stream.
 * @returns The typed events found in the stream.
 */
export async function readTypedSSEStream<TResult = unknown>(
  response: Response,
): Promise<TypedSSEEvent<TResult>[]> {
  return parseTypedSSEEvents<TResult>(await readSSEStreamRaw(response));
}

/**
 * Drains an SSE response and returns the typed events together with the HTTP
 * status, the raw body, and a `debugSummary()` helper for failure messages.
 * Prefer this over `readTypedSSEStream` when a test needs useful diagnostics.
 *
 * @param response - Fetch response whose body is an SSE stream.
 * @returns Parsed events plus debugging context.
 */
export async function readTypedSSEStreamWithContext<TResult = unknown>(
  response: Response,
): Promise<SSEStreamResult<TResult>> {
  const { status, statusText } = response;
  const raw = await readSSEStreamRaw(response);
  const events = parseTypedSSEEvents<TResult>(raw);

  const debugSummary = (): string => {
    const lines = [`HTTP ${status} ${statusText}`];

    if (events.length === 0) {
      // Nothing parsed: show the beginning of the raw body instead.
      const preview = raw.length > 500 ? `${raw.slice(0, 500)}...` : raw;
      lines.push("  No SSE events received", `  Raw response: ${preview}`);
      return lines.join("\n");
    }

    const statusTrail = events.map((e) => e.data.status).join(" → ");
    lines.push(`  Events (${events.length}): ${statusTrail}`);

    const failures = events
      .filter((e) => e.data.status === "error")
      .map((e) => e.data.error ?? "unknown error")
      .join(", ");
    if (failures) {
      lines.push(`  Errors: ${failures}`);
    }
    return lines.join("\n");
  };

  return { status, statusText, raw, events, debugSummary };
}

/**
 * Assertion helper that appends the SSE debug summary to the failure message.
 * The summary is only computed when the assertion fails.
 *
 * @param condition - Value that must be true.
 * @param message - Failure message shown first.
 * @param context - Stream result whose `debugSummary()` is appended.
 * @throws Error when `condition` is false.
 */
export function assertWithContext(
  condition: boolean,
  message: string,
  context: SSEStreamResult<unknown>,
): asserts condition {
  if (condition) {
    return;
  }
  const details = context.debugSummary();
  throw new Error(`${message}\n\nDebug context:\n${details}`);
}

/**
 * Finds the first event with the given status, failing with the stream's
 * debug context when there is none.
 *
 * @param events - Events to search.
 * @param status - Required value of `data.status`.
 * @param context - Stream result used to enrich the failure message.
 * @returns The first matching event.
 * @throws Error when no event has that status.
 */
export function assertEventExists<TResult>(
  events: TypedSSEEvent<TResult>[],
  status: string,
  context: SSEStreamResult<TResult>,
): TypedSSEEvent<TResult> {
  const match = events.find(({ data }) => data.status === status);
  const failureMessage = `Should have a "${status}" event`;
  assertWithContext(match !== undefined, failureMessage, context);
  return match;
}

/**
 * Asserts that an SSE stream result has the expected HTTP status, attaching
 * the stream's debug context on failure.
 *
 * @param context - Stream result to check.
 * @param expectedStatus - Required HTTP status code.
 * @param message - Optional custom failure message.
 * @throws Error when the status differs.
 */
export function assertHttpStatus(
  context: SSEStreamResult<unknown>,
  expectedStatus: number,
  message?: string,
): void {
  const failureMessage =
    message ?? `Expected HTTP ${expectedStatus}, got ${context.status}`;
  assertWithContext(context.status === expectedStatus, failureMessage, context);
}

// =============================================================================
// JSON Response Debug Utilities (for non-SSE tests)
// =============================================================================

/**
 * Result of a fetch request with full context for debugging.
 * Produced by `fetchWithContext`, which returns it even when the request
 * itself fails (then `status` is 0 and `statusText` is "FETCH_ERROR").
 *
 * @typeParam T - Expected shape of the JSON body.
 */
export interface FetchResult<T = unknown> {
  /** HTTP status code */
  status: number;
  /** HTTP status text */
  statusText: string;
  /** Parsed JSON body (if parseable) */
  body: T | null;
  /** Raw response text */
  raw: string;
  /** Request duration in ms */
  durationMs: number;
  /** Response headers */
  headers: Headers;
  /** Get debug summary for error messages */
  debugSummary(): string;
}

/**
 * Performs a fetch and captures everything needed to debug a failing test:
 * status, headers, raw text, parsed JSON body and elapsed time.
 *
 * This function does not reject when the request itself fails; it resolves
 * with `status: 0`, `statusText: "FETCH_ERROR"` and the error message in
 * `raw`. The duration covers the time until response headers arrive (or the
 * failure), not the body download.
 *
 * @param url - Request URL.
 * @param options - Fetch options, passed through unchanged.
 * @returns The captured result; `body` is null when the text is not valid JSON.
 */
export async function fetchWithContext<T = unknown>(
  url: string,
  options: RequestInit,
): Promise<FetchResult<T>> {
  const startedAt = Date.now();

  let response: Response;
  try {
    response = await fetch(url, options);
  } catch (err) {
    const durationMs = Date.now() - startedAt;
    const reason = err instanceof Error ? err.message : String(err);
    return {
      status: 0,
      statusText: "FETCH_ERROR",
      body: null,
      raw: reason,
      durationMs,
      headers: new Headers(),
      debugSummary: () => `Fetch failed after ${durationMs}ms: ${reason}`,
    };
  }

  const durationMs = Date.now() - startedAt;
  const { status, statusText, headers } = response;
  const raw = await response.text();

  let body: T | null = null;
  try {
    body = JSON.parse(raw) as T;
  } catch {
    // Not JSON: leave body as null, the raw text is still available
  }

  const debugSummary = (): string => {
    const elapsedSeconds = (durationMs / 1000).toFixed(1);
    const lines = [`HTTP ${status} ${statusText} (${elapsedSeconds}s)`];

    if (body && typeof body === "object") {
      const fields = body as Record<string, unknown>;
      if (fields.success === false && typeof fields.message === "string") {
        lines.push(`  Error: ${fields.message}`);
      }
      if (typeof fields.error === "string") {
        lines.push(`  Error: ${fields.error}`);
      }
    }

    // Include the (truncated) raw text for error statuses or missing bodies
    if (status >= 400 || !body) {
      const preview = raw.length > 500 ? `${raw.slice(0, 500)}...` : raw;
      lines.push(`  Response: ${preview}`);
    }

    return lines.join("\n");
  };

  return { status, statusText, body, raw, durationMs, headers, debugSummary };
}

/**
 * Assertion helper that appends the fetch debug summary to the failure message.
 * The summary is only computed when the assertion fails.
 *
 * @param condition - Value that must be true.
 * @param message - Failure message shown first.
 * @param context - Fetch result whose `debugSummary()` is appended.
 * @throws Error when `condition` is false.
 */
export function assertFetchOk<T>(
  condition: boolean,
  message: string,
  context: FetchResult<T>,
): asserts condition {
  if (condition) {
    return;
  }
  const details = context.debugSummary();
  throw new Error(`${message}\n\nDebug context:\n${details}`);
}

/**
 * Asserts that a fetch result has the expected HTTP status, attaching the
 * response debug context on failure.
 *
 * @param context - Fetch result to check.
 * @param expectedStatus - Required HTTP status code.
 * @param message - Optional custom failure message.
 * @throws Error when the status differs.
 */
export function assertFetchStatus<T>(
  context: FetchResult<T>,
  expectedStatus: number,
  message?: string,
): void {
  const failureMessage =
    message ?? `Expected HTTP ${expectedStatus}, got ${context.status}`;
  assertFetchOk(context.status === expectedStatus, failureMessage, context);
}


================================================
FILE: packages/server-v4/test/integration/v4/browsersession.test.ts
================================================
import assert from "node:assert/strict";
import { describe, it } from "node:test";

import {
  assertFetchOk,
  assertFetchStatus,
  fetchWithContext,
  getBaseUrl,
  getHeaders,
  HTTP_BAD_REQUEST,
  HTTP_NOT_FOUND,
  HTTP_OK,
  LOCAL_BROWSER_BODY,
} from "../utils.js";

/** Shape of the `browserSession` object the tests expect from the v4 browsersession routes. */
interface BrowserSessionRecord {
  id: string;
  env: "LOCAL" | "BROWSERBASE";
  status: "running" | "ended";
  modelName: string;
  cdpUrl: string;
  available: boolean;
}

/** Response envelope of the v4 browsersession routes as consumed by these tests. */
interface BrowserSessionResponse {
  success: boolean;
  /** Optional message; the tests require it on the rejected-request response. */
  message?: string;
  data?: {
    browserSession: BrowserSessionRecord;
  };
}

// Request headers shared by every test in this file; "4.0.0" is sent as x-sdk-version.
const headers = getHeaders("4.0.0");

// Integration tests for the /v4/browsersession routes. They talk to a running
// server (see getBaseUrl) and are executed sequentially (`concurrency: false`).
describe("v4 browsersession routes", { concurrency: false }, () => {
  // Full lifecycle in one test: create -> read -> end -> read again (expects 404).
  it("POST /v4/browsersession creates a local browser session and GET/POST end work", async () => {
    // 1. Create a LOCAL session.
    const createCtx = await fetchWithContext<BrowserSessionResponse>(
      `${getBaseUrl()}/v4/browsersession`,
      {
        method: "POST",
        headers,
        body: JSON.stringify({
          modelName: "gpt-4.1-nano",
          ...LOCAL_BROWSER_BODY,
        }),
      },
    );

    assertFetchStatus(createCtx, HTTP_OK);
    assertFetchOk(
      createCtx.body !== null,
      "Expected a JSON response body",
      createCtx,
    );
    assert.equal(createCtx.body.success, true);
    assertFetchOk(
      createCtx.body.data?.browserSession !== undefined,
      "Expected a browserSession payload",
      createCtx,
    );

    const browserSession = createCtx.body.data!.browserSession;
    assert.equal(browserSession.env, "LOCAL");
    assert.equal(browserSession.status, "running");
    assert.equal(browserSession.modelName, "gpt-4.1-nano");
    assert.equal(browserSession.available, true);
    assert.ok(browserSession.cdpUrl.length > 0);

    // 2. The session can be fetched by id while it is running.
    const statusCtx = await fetchWithContext<BrowserSessionResponse>(
      `${getBaseUrl()}/v4/browsersession/${browserSession.id}`,
      {
        method: "GET",
        headers,
      },
    );

    assertFetchStatus(statusCtx, HTTP_OK);
    assertFetchOk(
      statusCtx.body !== null,
      "Expected a JSON response body",
      statusCtx,
    );
    assert.equal(statusCtx.body.data?.browserSession.id, browserSession.id);
    assert.equal(statusCtx.body.data?.browserSession.status, "running");

    // 3. Ending the session reports it as ended and unavailable.
    const endCtx = await fetchWithContext<BrowserSessionResponse>(
      `${getBaseUrl()}/v4/browsersession/${browserSession.id}/end`,
      {
        method: "POST",
        headers,
        body: JSON.stringify({}),
      },
    );

    assertFetchStatus(endCtx, HTTP_OK);
    assertFetchOk(
      endCtx.body !== null,
      "Expected a JSON response body",
      endCtx,
    );
    assert.equal(endCtx.body.data?.browserSession.id, browserSession.id);
    assert.equal(endCtx.body.data?.browserSession.status, "ended");
    assert.equal(endCtx.body.data?.browserSession.available, false);

    // 4. After ending, the same id is expected to yield 404.
    const missingCtx = await fetchWithContext<BrowserSessionResponse>(
      `${getBaseUrl()}/v4/browsersession/${browserSession.id}`,
      {
        method: "GET",
        headers,
      },
    );

    assertFetchStatus(missingCtx, HTTP_NOT_FOUND);
    assertFetchOk(
      missingCtx.body !== null,
      "Expected a JSON response body",
      missingCtx,
    );
    assert.equal(missingCtx.body.success, false);
  });

  // Validation: a LOCAL request must say how to obtain a browser
  // (cdpUrl or localBrowserLaunchOptions); otherwise 400 with a message.
  it("POST /v4/browsersession rejects LOCAL requests without cdpUrl or localBrowserLaunchOptions", async () => {
    const ctx = await fetchWithContext<BrowserSessionResponse>(
      `${getBaseUrl()}/v4/browsersession`,
      {
        method: "POST",
        headers,
        body: JSON.stringify({
          env: "LOCAL",
          modelName: "gpt-4.1-nano",
        }),
      },
    );

    assertFetchStatus(ctx, HTTP_BAD_REQUEST);
    assertFetchOk(ctx.body !== null, "Expected a JSON response body", ctx);
    assert.equal(ctx.body.success, false);
    assert.ok(ctx.body.message);
  });
});


================================================
FILE: packages/server-v4/test/integration/v4/page.test.ts
================================================
import assert from "node:assert/strict";
import { createServer } from "node:http";
import { after, before, describe, it } from "node:test";

import type { Page } from "playwright";
import { chromium } from "playwright";

import {
  assertFetchOk,
  assertFetchStatus,
  createSessionWithCdp,
  endSession,
  fetchWithContext,
  getBaseUrl,
  getMainFrameId,
  getHeaders,
  HTTP_BAD_REQUEST,
  HTTP_OK,
} from "../utils.js";

/**
 * Action record returned by the v4 page routes, as consumed by these tests.
 * The index signature allows method-specific extra fields (the tests read
 * `result`, for example) without declaring each one.
 */
interface PageActionRecord {
  id: string;
  /** Name of the page method that was executed, e.g. "goto" or "click". */
  method: string;
  /** Action status; the success helpers require "completed". */
  status: string;
  sessionId: string;
  pageId?: string;
  createdAt?: string;
  updatedAt?: string;
  completedAt?: string;
  error?: string | null;
  [key: string]: unknown;
}

/**
 * Response envelope of the v4 page routes: either a single `action` or a list
 * of `actions`, depending on the route.
 */
interface PageActionResponse {
  success: boolean;
  /** Error text; the success helpers require it to be null. */
  error: string | null;
  statusCode?: number;
  stack?: string | null;
  action?: PageActionRecord;
  actions?: PageActionRecord[];
}

// Request headers shared by every request in this file; "3.0.0" is sent as x-sdk-version.
// NOTE(review): these are /v4 route tests — confirm that SDK version 3.0.0 is intended here.
const headers = getHeaders("3.0.0");

// Self-contained `data:` URL page for the goto test: the title is "V4 goto route"
// and #message contains "goto-ok". No external server is needed to load it.
const GOTO_TEST_URL = `data:text/html;charset=utf-8,${encodeURIComponent(`
<!doctype html>
<html>
  <head>
    <meta charset="utf-8" />
    <title>V4 goto route</title>
  </head>
  <body>
    <main id="message">goto-ok</main>
  </body>
</html>
`)}`;

// Self-contained `data:` URL page for the click test: clicking #click-target sets
// body[data-clicked] to "yes" and changes the #status text from "idle" to "clicked".
const CLICK_TEST_URL = `data:text/html;charset=utf-8,${encodeURIComponent(`
<!doctype html>
<html>
  <head>
    <meta charset="utf-8" />
    <title>V4 click route</title>
  </head>
  <body data-clicked="no">
    <button
      id="click-target"
      onclick="document.body.dataset.clicked='yes';document.getElementById('status').textContent='clicked';"
    >
      Submit
    </button>
    <div id="status">idle</div>
  </body>
</html>
`)}`;

// Self-contained `data:` URL page exposing one target per kind of interaction:
//   - #text-input: empty text field
//   - #hover-target: sets body[data-hovered]="yes" on mouseover
//   - #scroll-box: 80px-high scrollable box with 400px of content
//   - #drag-source / #drag-target: mousedown on the source followed by mouseup
//     on the target sets body[data-dropped]="yes"
//   - #late-item: appended to the body by a script 150 ms after it runs
const METHODS_TEST_URL = `data:text/html;charset=utf-8,${encodeURIComponent(`
<!doctype html>
<html>
  <head>
    <meta charset="utf-8" />
    <title>V4 methods route</title>
    <style>
      body { font-family: sans-serif; }
      #scroll-box {
        border: 1px solid #333;
        height: 80px;
        overflow: auto;
        width: 200px;
      }
      #scroll-inner {
        height: 400px;
      }
      #drag-source, #drag-target {
        align-items: center;
        border: 1px solid #333;
        display: flex;
        height: 40px;
        justify-content: center;
        margin-top: 8px;
        width: 120px;
      }
    </style>
  </head>
  <body data-hovered="no" data-dropped="no">
    <main id="message">methods-ok</main>
    <input id="text-input" value="" />
    <button
      id="hover-target"
      onmouseover="document.body.dataset.hovered='yes';"
    >
      Hover me
    </button>
    <div id="scroll-box">
      <div id="scroll-inner">scroll target</div>
    </div>
    <div
      id="drag-source"
      onmousedown="window.__dragStart = true;"
    >
      Drag source
    </div>
    <div
      id="drag-target"
      onmouseup="if (window.__dragStart) { document.body.dataset.dropped='yes'; }"
    >
      Drop target
    </div>
    <script>
      setTimeout(() => {
        const lateItem = document.createElement("div");
        lateItem.id = "late-item";
        lateItem.textContent = "ready";
        document.body.appendChild(lateItem);
      }, 150);
    </script>
  </body>
</html>
`)}`;

/**
 * Connects to the session's browser over CDP, runs `fn` against the first page
 * of the first context, and always closes the connection afterwards.
 *
 * @param cdpUrl - CDP endpoint of the session's browser.
 * @param fn - Callback receiving the page; its result is returned.
 * @returns Whatever `fn` resolves to.
 * @throws AssertionError when the browser has no context or no page.
 */
async function withSessionPage<T>(
  cdpUrl: string,
  fn: (page: Page) => Promise<T>,
): Promise<T> {
  const browser = await chromium.connectOverCDP(cdpUrl);

  try {
    const [firstContext] = browser.contexts();
    assert.ok(
      firstContext !== undefined,
      "Expected at least one browser context",
    );

    const [firstPage] = firstContext.pages();
    assert.ok(firstPage !== undefined, "Expected at least one browser page");

    return await fn(firstPage);
  } finally {
    await browser.close();
  }
}

/**
 * Sends `POST /v4/page/<path>` with a `{ sessionId, params }` JSON body.
 *
 * @param path - Route segment after `/v4/page/`, e.g. "goto".
 * @param sessionId - Session the action applies to.
 * @param params - Method-specific parameters.
 * @returns The fetch result including debugging context.
 */
async function postPageRoute(
  path: string,
  sessionId: string,
  params: Record<string, unknown>,
) {
  const endpoint = `${getBaseUrl()}/v4/page/${path}`;
  const payload = JSON.stringify({ sessionId, params });

  return fetchWithContext<PageActionResponse>(endpoint, {
    method: "POST",
    headers,
    body: payload,
  });
}

/**
 * Sends `GET /v4/page/<path>` with `sessionId` and every entry of `params`
 * encoded as query-string parameters. Values are converted with `String()`,
 * so only primitive values serialize meaningfully.
 *
 * @param path - Route segment after `/v4/page/`.
 * @param sessionId - Session the query applies to.
 * @param params - Additional query parameters.
 * @returns The fetch result including debugging context.
 */
async function getPageRoute(
  path: string,
  sessionId: string,
  params: Record<string, unknown>,
) {
  const query = new URLSearchParams({ sessionId });
  Object.entries(params).forEach(([key, value]) => {
    query.set(key, String(value));
  });

  const endpoint = `${getBaseUrl()}/v4/page/${path}?${query.toString()}`;
  return fetchWithContext<PageActionResponse>(endpoint, {
    method: "GET",
    headers,
  });
}

/**
 * Verifies that a page-route response is a successful single-action envelope
 * (HTTP 200, `success: true`, `error: null`) whose action has a non-empty
 * string id, the expected method, and status "completed".
 *
 * @param ctx - Fetch result returned by a page-route helper.
 * @param expectedType - Expected value of `action.method`.
 * @returns The validated action record.
 */
function assertSuccessAction(
  ctx: Awaited<ReturnType<typeof fetchWithContext<PageActionResponse>>>,
  expectedType: string,
): PageActionRecord {
  assertFetchStatus(ctx, HTTP_OK);
  assertFetchOk(ctx.body !== null, "Expected a JSON response body", ctx);

  const { success, error, action } = ctx.body;
  assert.equal(success, true);
  assert.equal(error, null);
  assertFetchOk(action !== undefined, "Expected an action payload", ctx);

  assert.equal(typeof action.id, "string");
  assert.notEqual(action.id.length, 0);
  assert.equal(action.method, expectedType);
  assert.equal(action.status, "completed");

  return action;
}

/**
 * Asserts that a page-route response is a successful action-list envelope and
 * returns its `actions` array.
 *
 * Checks, in order: HTTP 200, a non-null JSON body, `success === true`,
 * `error === null`, and that `actions` is an array.
 *
 * @param ctx - Result of a `fetchWithContext<PageActionResponse>` call.
 * @returns The `actions` array from the response body.
 */
function assertSuccessActionList(
  ctx: Awaited<ReturnType<typeof fetchWithContext<PageActionResponse>>>,
) {
  assertFetchStatus(ctx, HTTP_OK);
  assertFetchOk(ctx.body !== null, "Expected a JSON response body", ctx);

  const envelope = ctx.body;
  assert.equal(envelope.success, true);
  assert.equal(envelope.error, null);
  assertFetchOk(
    Array.isArray(envelope.actions),
    "Expected an actions array payload",
    ctx,
  );

  return envelope.actions;
}

describe("v4 page routes", { concurrency: false }, () => {
  // Id of the session shared by the tests in this suite; assigned in `before`.
  let sessionId: string;
  // CDP endpoint of the shared session; tests pass it to `withSessionPage` to
  // inspect the live browser directly.
  let cdpUrl: string;

  // Create a single session (and capture its CDP URL) before any test runs.
  before(async () => {
    ({ sessionId, cdpUrl } = await createSessionWithCdp(headers));
  });

  // End the shared session once the suite has finished.
  after(async () => {
    await endSession(sessionId, headers);
  });

  it("POST /v4/page/goto returns the new envelope and navigates a real local session", async () => {
    // Navigate through the route under test and validate the action envelope.
    const response = await postPageRoute("goto", sessionId, {
      url: GOTO_TEST_URL,
      waitUntil: "load",
    });
    const action = assertSuccessAction(response, "goto");
    const result = action.result as { response: unknown | null; url: string };

    assert.equal(action.sessionId, sessionId);
    assert.equal(result.url, GOTO_TEST_URL);
    assert.equal(result.response, null);

    // Confirm the navigation independently through a direct CDP connection.
    await withSessionPage(cdpUrl, async (page) => {
      // Best effort only: a load-state timeout is ignored and the assertions
      // below decide the outcome.
      await page.waitForLoadState("load", { timeout: 15_000 }).catch(() => {});

      const title = await page.title();
      assert.equal(title, "V4 goto route");

      const message = await page.textContent("#message");
      assert.equal(message, "goto-ok");
    });
  });

  it("POST /v4/page/click returns the new envelope and clicks a real page element", async () => {
    // Load the click fixture; the resulting action supplies the page id.
    const navigation = assertSuccessAction(
      await postPageRoute("goto", sessionId, {
        url: CLICK_TEST_URL,
        waitUntil: "load",
      }),
      "goto",
    );

    const clickResponse = await postPageRoute("click", sessionId, {
      pageId: navigation.pageId,
      selector: { xpath: "//button[@id='click-target']" },
    });
    const clickAction = assertSuccessAction(clickResponse, "click");
    assert.equal(clickAction.sessionId, sessionId);

    // Verify the click's DOM side effects through a direct CDP connection.
    await withSessionPage(cdpUrl, async (page) => {
      await page.waitForFunction(
        () => document.body.dataset.clicked === "yes",
        undefined,
        { timeout: 15_000 },
      );

      const statusText = await page.locator("#status").textContent();
      assert.equal(statusText, "clicked");
    });
  });

  // Exercises the interaction and query routes in sequence against
  // METHODS_TEST_URL. Every route call is validated through its action
  // envelope first; the DOM side effects are checked at the end through a
  // direct CDP connection. The calls are order-dependent (click focuses the
  // input before `type`, `keyPress` then removes the last character).
  it("POST /v4/page methods route through the underlying understudy implementation", async () => {
    const gotoCtx = await postPageRoute("goto", sessionId, {
      url: METHODS_TEST_URL,
      waitUntil: "load",
    });
    assertSuccessAction(gotoCtx, "goto");

    // Pointer interactions: hover, scroll, drag-and-drop.
    const hoverCtx = await postPageRoute("hover", sessionId, {
      selector: {
        xpath: "//button[@id='hover-target']",
      },
    });
    assertSuccessAction(hoverCtx, "hover");

    const scrollCtx = await postPageRoute("scroll", sessionId, {
      selector: {
        xpath: "//div[@id='scroll-box']",
      },
      percentage: 100,
    });
    assertSuccessAction(scrollCtx, "scroll");

    const dragCtx = await postPageRoute("dragAndDrop", sessionId, {
      from: {
        xpath: "//div[@id='drag-source']",
      },
      to: {
        xpath: "//div[@id='drag-target']",
      },
    });
    assertSuccessAction(dragCtx, "dragAndDrop");

    // Keyboard interactions: `type` and `keyPress` carry no selector, so the
    // input is clicked first.
    const focusInputCtx = await postPageRoute("click", sessionId, {
      selector: {
        xpath: "//input[@id='text-input']",
      },
    });
    assertSuccessAction(focusInputCtx, "click");

    const typeCtx = await postPageRoute("type", sessionId, {
      text: "hello",
    });
    assertSuccessAction(typeCtx, "type");

    // Backspace after typing "hello"; the final check expects "hell".
    const keyPressCtx = await postPageRoute("keyPress", sessionId, {
      key: "Backspace",
    });
    assertSuccessAction(keyPressCtx, "keyPress");

    // Waiting helpers.
    const waitForSelectorCtx = await postPageRoute(
      "waitForSelector",
      sessionId,
      {
        selector: {
          xpath: "//div[@id='late-item']",
        },
        state: "visible",
        timeout: 5_000,
      },
    );
    const waitForSelectorAction = assertSuccessAction(
      waitForSelectorCtx,
      "waitForSelector",
    );
    assert.equal(
      (waitForSelectorAction.result as { matched: boolean }).matched,
      true,
    );

    const waitForLoadStateCtx = await postPageRoute(
      "waitForLoadState",
      sessionId,
      {
        state: "load",
      },
    );
    assertSuccessAction(waitForLoadStateCtx, "waitForLoadState");

    // Read-only getters are served over GET.
    const titleCtx = await getPageRoute("title", sessionId, {});
    const titleAction = assertSuccessAction(titleCtx, "title");
    assert.equal(
      (titleAction.result as { title: string }).title,
      "V4 methods route",
    );

    const urlCtx = await getPageRoute("url", sessionId, {});
    const urlAction = assertSuccessAction(urlCtx, "url");
    assert.equal((urlAction.result as { url: string }).url, METHODS_TEST_URL);

    // Script evaluation: the expression reads the supplied `arg` (21 * 2).
    const evaluateCtx = await postPageRoute("evaluate", sessionId, {
      expression: "arg.value * 2",
      arg: {
        value: 21,
      },
    });
    const evaluateAction = assertSuccessAction(evaluateCtx, "evaluate");
    assert.equal((evaluateAction.result as { value: number }).value, 42);

    // Raw CDP passthrough: the CDP response is expected under `result.value`.
    const sendCDPCtx = await postPageRoute("sendCDP", sessionId, {
      method: "Runtime.evaluate",
      params: {
        expression: "6 * 7",
        returnByValue: true,
      },
    });
    const sendCDPAction = assertSuccessAction(sendCDPCtx, "sendCDP");
    assert.equal(
      (
        sendCDPAction.result as {
          value: { result?: { value?: number } };
        }
      ).value.result?.value,
      42,
    );

    // Verify the DOM side effects of the interactions above over CDP.
    await withSessionPage(cdpUrl, async (page) => {
      await page.waitForFunction(
        () => document.body.dataset.hovered === "yes",
        undefined,
        { timeout: 5_000 },
      );
      await page.waitForFunction(
        () => document.body.dataset.dropped === "yes",
        undefined,
        { timeout: 5_000 },
      );
      assert.equal(await page.locator("#text-input").inputValue(), "hell");
      assert.ok(
        await page
          .locator("#scroll-box")
          .evaluate((node) => (node as HTMLDivElement).scrollTop > 0),
      );
    });
  });

  // Covers viewport, screenshot, snapshot, waitForTimeout, reload, history
  // navigation (goBack / goForward) and close. The history assertions depend
  // on the navigation order: METHODS_TEST_URL first, then GOTO_TEST_URL.
  it("POST /v4/page navigation helpers, screenshot, snapshot, viewport, timeout, and close work on a live session", async () => {
    const gotoCtx = await postPageRoute("goto", sessionId, {
      url: METHODS_TEST_URL,
      waitUntil: "load",
    });
    const gotoAction = assertSuccessAction(gotoCtx, "goto");
    assert.equal(
      (gotoAction.result as { response: unknown | null; url: string }).url,
      METHODS_TEST_URL,
    );
    assert.equal(
      (gotoAction.result as { response: unknown | null }).response,
      null,
    );

    // The viewport set here is verified over CDP after the reload below.
    const setViewportSizeCtx = await postPageRoute(
      "setViewportSize",
      sessionId,
      {
        width: 900,
        height: 700,
        deviceScaleFactor: 1,
      },
    );
    assertSuccessAction(setViewportSizeCtx, "setViewportSize");

    const screenshotCtx = await postPageRoute("screenshot", sessionId, {
      type: "jpeg",
      quality: 70,
    });
    const screenshotAction = assertSuccessAction(screenshotCtx, "screenshot");
    const screenshotResult = screenshotAction.result as {
      base64: string;
      mimeType: string;
    };
    assert.equal(screenshotResult.mimeType, "image/jpeg");
    assert.ok(screenshotResult.base64.length > 0);

    const snapshotCtx = await postPageRoute("snapshot", sessionId, {
      includeIframes: true,
    });
    const snapshotAction = assertSuccessAction(snapshotCtx, "snapshot");
    assert.match(
      (snapshotAction.result as { formattedTree: string }).formattedTree,
      /methods-ok/i,
    );

    // A 75 ms wait is requested; the elapsed-time check only requires >= 50 ms.
    const waitStart = Date.now();
    const waitCtx = await postPageRoute("waitForTimeout", sessionId, {
      ms: 75,
    });
    assertSuccessAction(waitCtx, "waitForTimeout");
    assert.ok(Date.now() - waitStart >= 50);

    // A zero-length wait must also be accepted.
    const zeroWaitCtx = await postPageRoute("waitForTimeout", sessionId, {
      ms: 0,
    });
    assertSuccessAction(zeroWaitCtx, "waitForTimeout");

    const reloadCtx = await postPageRoute("reload", sessionId, {
      waitUntil: "load",
    });
    const reloadAction = assertSuccessAction(reloadCtx, "reload");
    assert.equal(
      (reloadAction.result as { response: unknown | null; url: string }).url,
      METHODS_TEST_URL,
    );
    assert.equal(
      (reloadAction.result as { response: unknown | null }).response,
      null,
    );

    // Check the viewport size and that the last navigation was a reload.
    await withSessionPage(cdpUrl, async (page) => {
      const viewport = await page.evaluate(() => ({
        width: window.innerWidth,
        height: window.innerHeight,
      }));
      assert.equal(viewport.width, 900);
      assert.equal(viewport.height, 700);
      assert.equal(
        await page.evaluate(
          () =>
            performance.getEntriesByType("navigation")[0]?.toJSON().type ?? "",
        ),
        "reload",
      );
    });

    // Add a second history entry so goBack / goForward have somewhere to go.
    const gotoBackTargetCtx = await postPageRoute("goto", sessionId, {
      url: GOTO_TEST_URL,
      waitUntil: "load",
    });
    assertSuccessAction(gotoBackTargetCtx, "goto");

    const goBackCtx = await postPageRoute("goBack", sessionId, {
      waitUntil: "load",
    });
    const goBackAction = assertSuccessAction(goBackCtx, "goBack");
    assert.equal(
      (goBackAction.result as { response: unknown | null; url: string }).url,
      METHODS_TEST_URL,
    );
    assert.equal(
      (goBackAction.result as { response: unknown | null }).response,
      null,
    );

    await withSessionPage(cdpUrl, async (page) => {
      assert.equal(await page.title(), "V4 methods route");
    });

    const goForwardCtx = await postPageRoute("goForward", sessionId, {
      waitUntil: "load",
    });
    const goForwardAction = assertSuccessAction(goForwardCtx, "goForward");
    assert.equal(
      (goForwardAction.result as { response: unknown | null; url: string }).url,
      GOTO_TEST_URL,
    );
    assert.equal(
      (goForwardAction.result as { response: unknown | null }).response,
      null,
    );

    await withSessionPage(cdpUrl, async (page) => {
      assert.equal(await page.title(), "V4 goto route");
    });

    // `close` is exercised on a separate temporary session — presumably so the
    // suite's shared session keeps its page for the remaining tests.
    const temp = await createSessionWithCdp(headers);
    try {
      const closeGotoCtx = await postPageRoute("goto", temp.sessionId, {
        url: GOTO_TEST_URL,
        waitUntil: "load",
      });
      assertSuccessAction(closeGotoCtx, "goto");

      const closeCtx = await fetchWithContext<PageActionResponse>(
        `${getBaseUrl()}/v4/page/close`,
        {
          method: "POST",
          headers,
          body: JSON.stringify({
            sessionId: temp.sessionId,
            params: {},
          }),
        },
      );
      assertSuccessAction(closeCtx, "close");

      // `withSessionPage` asserts at least one page exists, so connect manually
      // to confirm that no pages remain after the close.
      const browser = await chromium.connectOverCDP(temp.cdpUrl);
      try {
        const contexts = browser.contexts();
        const pages = contexts.flatMap((context) => context.pages());
        assert.equal(pages.length, 0);
      } finally {
        await browser.close();
      }
    } finally {
      await endSession(temp.sessionId, headers);
    }
  });

  // Exercises the page configuration routes (cursor overlay, init script,
  // extra HTTP headers) and the frame/target getters on a temporary session.
  // A local HTTP server serves the page so the request headers received for
  // "/" can be inspected.
  //
  // Cleanup is structured so that the temporary session is always ended: the
  // server start-up runs inside the `try`, and `endSession` sits in its own
  // `finally` so a failing `server.close` cannot skip it.
  it("GET page getters and POST page config methods expose the underlying understudy interface", async () => {
    const temp = await createSessionWithCdp(headers);
    let requestHeaders: Record<string, string | string[] | undefined> | null =
      null;
    const server = createServer((req, res) => {
      // Remember the headers of the document request for the later assertion.
      if (req.url === "/") {
        requestHeaders = req.headers;
      }

      res.writeHead(200, { "content-type": "text/html; charset=utf-8" });
      res.end(`<!doctype html>
<html>
  <head>
    <meta charset="utf-8" />
    <title>V4 header route</title>
  </head>
  <body>
    <main id="message">header-ok</main>
  </body>
</html>`);
    });

    try {
      // Listen on an ephemeral port; reject on a listen error instead of
      // waiting forever for a callback that would never fire.
      await new Promise<void>((resolve, reject) => {
        server.once("error", reject);
        server.listen(0, "127.0.0.1", () => {
          server.off("error", reject);
          resolve();
        });
      });

      const address = server.address();
      assert.ok(address && typeof address === "object");
      const url = `http://127.0.0.1:${address.port}/`;

      // Page configuration is applied before navigating so it takes effect on
      // the document loaded below.
      const enableCursorOverlayCtx = await postPageRoute(
        "enableCursorOverlay",
        temp.sessionId,
        {},
      );
      const enableCursorOverlayAction = assertSuccessAction(
        enableCursorOverlayCtx,
        "enableCursorOverlay",
      );
      assert.equal(
        (enableCursorOverlayAction.result as { enabled: boolean }).enabled,
        true,
      );

      const addInitScriptCtx = await postPageRoute(
        "addInitScript",
        temp.sessionId,
        {
          script: "window.__v4InitValue = 'present';",
        },
      );
      const addInitScriptAction = assertSuccessAction(
        addInitScriptCtx,
        "addInitScript",
      );
      assert.equal(
        (addInitScriptAction.result as { added: boolean }).added,
        true,
      );

      const setHeadersCtx = await postPageRoute(
        "setExtraHTTPHeaders",
        temp.sessionId,
        {
          headers: {
            "x-stagehand-test": "present",
          },
        },
      );
      const setHeadersAction = assertSuccessAction(
        setHeadersCtx,
        "setExtraHTTPHeaders",
      );
      assert.equal(
        (
          setHeadersAction.result as {
            headers: Record<string, string>;
          }
        ).headers["x-stagehand-test"],
        "present",
      );

      // Navigate to the local server and check the extra header arrived.
      const gotoCtx = await postPageRoute("goto", temp.sessionId, {
        url,
        waitUntil: "load",
      });
      const gotoAction = assertSuccessAction(gotoCtx, "goto");
      assert.equal(requestHeaders?.["x-stagehand-test"], "present");

      // Target and frame getters must agree with each other and with CDP.
      const targetIdCtx = await getPageRoute("targetId", temp.sessionId, {});
      const targetIdAction = assertSuccessAction(targetIdCtx, "targetId");
      assert.equal(
        (targetIdAction.result as { targetId: string }).targetId,
        gotoAction.pageId,
      );

      const mainFrameIdCtx = await getPageRoute(
        "mainFrameId",
        temp.sessionId,
        {},
      );
      const mainFrameIdAction = assertSuccessAction(
        mainFrameIdCtx,
        "mainFrameId",
      );
      const mainFrameId = (mainFrameIdAction.result as { mainFrameId: string })
        .mainFrameId;
      assert.equal(mainFrameId, await getMainFrameId(temp.cdpUrl));

      const mainFrameCtx = await getPageRoute("mainFrame", temp.sessionId, {});
      const mainFrameAction = assertSuccessAction(mainFrameCtx, "mainFrame");
      assert.equal(
        (
          mainFrameAction.result as {
            frame: { frameId: string };
          }
        ).frame.frameId,
        mainFrameId,
      );

      const framesCtx = await getPageRoute("frames", temp.sessionId, {});
      const framesAction = assertSuccessAction(framesCtx, "frames");
      const frames = (
        framesAction.result as {
          frames: Array<{ frameId: string }>;
        }
      ).frames;
      assert.ok(frames.some((frame) => frame.frameId === mainFrameId));

      const fullFrameTreeCtx = await getPageRoute(
        "getFullFrameTree",
        temp.sessionId,
        {},
      );
      const fullFrameTreeAction = assertSuccessAction(
        fullFrameTreeCtx,
        "getFullFrameTree",
      );
      assert.equal(
        (
          fullFrameTreeAction.result as {
            frameTree: { frame: { id: string } };
          }
        ).frameTree.frame.id,
        mainFrameId,
      );

      const protocolFrameTreeCtx = await getPageRoute(
        "asProtocolFrameTree",
        temp.sessionId,
        { rootMainFrameId: mainFrameId },
      );
      const protocolFrameTreeAction = assertSuccessAction(
        protocolFrameTreeCtx,
        "asProtocolFrameTree",
      );
      assert.equal(
        (
          protocolFrameTreeAction.result as {
            frameTree: { frame: { id: string } };
          }
        ).frameTree.frame.id,
        mainFrameId,
      );

      const listAllFrameIdsCtx = await getPageRoute(
        "listAllFrameIds",
        temp.sessionId,
        {},
      );
      const listAllFrameIdsAction = assertSuccessAction(
        listAllFrameIdsCtx,
        "listAllFrameIds",
      );
      const frameIds = (listAllFrameIdsAction.result as { frameIds: string[] })
        .frameIds;
      assert.ok(frameIds.includes(mainFrameId));
      // Compare sorted copies: the two routes need not agree on ordering.
      assert.deepEqual(
        [...frameIds].sort(),
        [...frames.map((frame) => frame.frameId)].sort(),
      );

      const getOrdinalCtx = await getPageRoute("getOrdinal", temp.sessionId, {
        frameId: mainFrameId,
      });
      const getOrdinalAction = assertSuccessAction(getOrdinalCtx, "getOrdinal");
      assert.equal(
        (getOrdinalAction.result as { frameId: string }).frameId,
        mainFrameId,
      );
      assert.ok((getOrdinalAction.result as { ordinal: number }).ordinal >= 0);

      const waitForMainLoadStateCtx = await postPageRoute(
        "waitForMainLoadState",
        temp.sessionId,
        {
          state: "load",
          timeoutMs: 15_000,
        },
      );
      assertSuccessAction(waitForMainLoadStateCtx, "waitForMainLoadState");

      // Confirm inside the page that the overlay and init script were applied.
      const evaluateCtx = await postPageRoute("evaluate", temp.sessionId, {
        expression: `({
          title: document.title,
          cursorOverlay: !!document.getElementById("__v3_cursor_overlay__"),
          initValue: globalThis.__v4InitValue ?? null
        })`,
      });
      const evaluateAction = assertSuccessAction(evaluateCtx, "evaluate");
      assert.deepEqual(evaluateAction.result, {
        value: {
          title: "V4 header route",
          cursorOverlay: true,
          initValue: "present",
        },
      });
    } finally {
      try {
        // Closing a server that never started listening reports an error, so
        // only close it when it is actually listening.
        if (server.listening) {
          await new Promise<void>((resolve, reject) => {
            server.close((error) => (error ? reject(error) : resolve()));
          });
        }
      } finally {
        // Always release the temporary session, even if the close failed.
        await endSession(temp.sessionId, headers);
      }
    }
  });

  it("GET /v4/page/action/:actionId returns the new envelope for a stored action", async () => {
    // Create an action whose id can be looked up afterwards.
    const createdAction = assertSuccessAction(
      await postPageRoute("goto", sessionId, {
        url: GOTO_TEST_URL,
        waitUntil: "load",
      }),
      "goto",
    );

    const detailUrl = `${getBaseUrl()}/v4/page/action/${createdAction.id}?sessionId=${sessionId}`;
    const detailCtx = await fetchWithContext<PageActionResponse>(detailUrl, {
      method: "GET",
      headers,
    });

    assertFetchStatus(detailCtx, HTTP_OK);
    assertFetchOk(
      detailCtx.body !== null,
      "Expected a JSON response body",
      detailCtx,
    );

    const envelope = detailCtx.body;
    assert.equal(envelope.success, true);
    assert.equal(envelope.error, null);
    assertFetchOk(
      envelope.action !== undefined,
      "Expected an action payload",
      detailCtx,
    );

    // The stored action must match the one that was just created.
    const stored = envelope.action;
    assert.equal(stored.id, createdAction.id);
    assert.equal(stored.method, "goto");
    assert.equal(stored.sessionId, sessionId);
  });

  it("GET /v4/page/action returns the new envelope with action history", async () => {
    // Produce two actions (goto + click) that should both appear in history.
    const gotoAction = assertSuccessAction(
      await postPageRoute("goto", sessionId, {
        url: CLICK_TEST_URL,
        waitUntil: "load",
      }),
      "goto",
    );

    const clickAction = assertSuccessAction(
      await postPageRoute("click", sessionId, {
        selector: { xpath: "//button[@id='click-target']" },
      }),
      "click",
    );

    const historyUrl = `${getBaseUrl()}/v4/page/action?sessionId=${sessionId}`;
    const listCtx = await fetchWithContext<PageActionResponse>(historyUrl, {
      method: "GET",
      headers,
    });

    const history = assertSuccessActionList(listCtx);
    const isListed = (id: string) => history.some((entry) => entry.id === id);

    assert.ok(isListed(gotoAction.id), "Expected goto action in history");
    assert.ok(isListed(clickAction.id), "Expected click action in history");

    // The listed entry must carry the same details as the created action.
    const listedClickAction = history.find(
      (entry) => entry.id === clickAction.id,
    );
    assert.ok(listedClickAction, "Expected click action details in history");
    assert.equal(listedClickAction.method, "click");
    assert.equal(listedClickAction.sessionId, sessionId);
  });

  // Verifies that both the single-action and the action-list endpoints keep
  // serving a session's stored actions after that session has been ended.
  it("GET /v4/page/action still returns stored actions after the session ends", async () => {
    const temp = await createSessionWithCdp(headers);
    try {
      const gotoCtx = await postPageRoute("goto", temp.sessionId, {
        url: GOTO_TEST_URL,
        waitUntil: "load",
      });
      const action = assertSuccessAction(gotoCtx, "goto");

      // End the session first; the lookups below run against the ended session.
      await endSession(temp.sessionId, headers);

      const detailCtx = await fetchWithContext<PageActionResponse>(
        `${getBaseUrl()}/v4/page/action/${action.id}?sessionId=${temp.sessionId}`,
        {
          method: "GET",
          headers,
        },
      );
      const fetchedAction = assertSuccessAction(detailCtx, "goto");
      assert.equal(fetchedAction.id, action.id);

      const listCtx = await fetchWithContext<PageActionResponse>(
        `${getBaseUrl()}/v4/page/action?sessionId=${temp.sessionId}`,
        {
          method: "GET",
          headers,
        },
      );
      const actions = assertSuccessActionList(listCtx);
      assert.ok(actions.some((candidate) => candidate.id === action.id));
    } finally {
      // NOTE(review): on the success path this is the second `endSession` call
      // for the same session — presumably `endSession` tolerates an
      // already-ended session; confirm against its implementation.
      await endSession(temp.sessionId, headers);
    }
  });

  it("POST /v4/page/click accepts css, text, and coordinate selector types", async () => {
    const gotoCtx = await postPageRoute("goto", sessionId, {
      url: CLICK_TEST_URL,
      waitUntil: "load",
    });
    assertSuccessAction(gotoCtx, "goto");

    // One entry per accepted selector shape, clicked sequentially in this
    // order: css, css + idx, xpath + idx, text + idx, text, coordinates.
    const selectors: Array<Record<string, unknown>> = [
      { css: "#click-target" },
      { css: "button", idx: 0 },
      { xpath: "//button", idx: 0 },
      { text: "Submit", idx: 0 },
      { text: "Submit" },
      { x: 100, y: 200 },
    ];

    for (const selector of selectors) {
      const clickCtx = await postPageRoute("click", sessionId, { selector });
      assertSuccessAction(clickCtx, "click");
    }
  });

  it("POST /v4/page/dragAndDrop accepts mixed selector types (xpath from, coordinates to)", async () => {
    assertSuccessAction(
      await postPageRoute("goto", sessionId, {
        url: METHODS_TEST_URL,
        waitUntil: "load",
      }),
      "goto",
    );

    // Drag from an element located by xpath to a raw coordinate target.
    const source = { xpath: "//div[@id='drag-source']" };
    const destination = { x: 200, y: 300 };

    const dragCtx = await postPageRoute("dragAndDrop", sessionId, {
      from: source,
      to: destination,
    });
    assertSuccessAction(dragCtx, "dragAndDrop");
  });

  it("POST /v4/page/click returns the new top-level failure shape for validation errors", async () => {
    // An empty params object omits the selector and must fail validation.
    const ctx = await postPageRoute("click", sessionId, {});

    assertFetchStatus(ctx, HTTP_BAD_REQUEST);
    assertFetchOk(ctx.body !== null, "Expected a JSON response body", ctx);

    const failure = ctx.body;
    assert.equal(failure.success, false);
    assert.equal(failure.statusCode, HTTP_BAD_REQUEST);
    assert.equal(typeof failure.error, "string");
    assert.ok(failure.error);

    const stackIsNullOrString =
      failure.stack === null || typeof failure.stack === "string";
    assert.ok(stackIsNullOrString, "Expected stack to be null or a string");

    // A validation failure carries neither an action nor an action list.
    assert.equal(failure.action, undefined);
    assert.equal(failure.actions, undefined);
  });

  it("POST /v4/page routes return the underlying error message and stack for route failures", async () => {
    assertSuccessAction(
      await postPageRoute("goto", sessionId, {
        url: CLICK_TEST_URL,
        waitUntil: "load",
      }),
      "goto",
    );

    // Click a selector that does not exist to trigger a route failure.
    const ctx = await postPageRoute("click", sessionId, {
      selector: { xpath: "//button[@id='missing-target']" },
    });

    const expectedStatus = 404;
    assertFetchStatus(ctx, expectedStatus);
    assertFetchOk(ctx.body !== null, "Expected a JSON response body", ctx);

    const failure = ctx.body;
    assert.equal(failure.success, false);
    assert.equal(failure.statusCode, expectedStatus);
    assert.equal(typeof failure.error, "string");
    assert.ok(failure.error);
    assert.equal(typeof failure.stack, "string");
    assert.ok(failure.stack);

    // Unlike a validation error, a route failure still reports the action.
    assertFetchOk(
      failure.action !== undefined,
      "Expected a failed action payload",
      ctx,
    );
    assert.equal(failure.action.status, "failed");
  });
});


================================================
FILE: packages/server-v4/tsconfig.json
================================================
{
  "extends": "../../tsconfig.base.json",
  "compilerOptions": {
    "outDir": "dist",
    "rootDir": "src",
    "module": "ESNext",
    "moduleResolution": "bundler",
    "verbatimModuleSyntax": false
  },
  "include": ["src/**/*"],
  "exclude": ["node_modules", "dist"]
}


================================================
FILE: packages/server-v4/tsconfig.tests.json
================================================
{
  "extends": "../../tsconfig.base.json",
  "compilerOptions": {
    "rootDir": "test",
    "outDir": "dist/tests",
    "declaration": false,
    "noEmit": false
  },
  "include": ["test/**/*.ts"],
  "exclude": ["node_modules", "dist"]
}


================================================
FILE: packages/server-v4/vitest.config.ts
================================================
import { defineConfig } from "vitest/config";

// Vitest settings for this package, bound to a name before being exported.
const vitestConfig = defineConfig({
  test: {
    // Make the Vitest test APIs available as globals in test files.
    globals: true,
    environment: "node",
    // Collect only files under test/ whose names end in .test.ts.
    include: ["test/**/*.test.ts"],
  },
});

export default vitestConfig;


================================================
FILE: pnpm-workspace.yaml
================================================
packages:
  - "packages/core"
  - "packages/cli"
  - "packages/evals"
  - "packages/docs"
  - "packages/server-v3"
  - "packages/server-v4"


================================================
FILE: stainless.yml
================================================
# yaml-language-server: $schema=https://app.stainless.com/config-internal.schema.json

##########################################################################
############ DO NOT EDIT THIS FILE IN THE STAINLESS STUDIO UI ############
############ !!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!! ############
############ ONLY EDIT IN browserbase/stagehand/stainless.yml ############
##########################################################################

edition: 2025-10-10

organization:
  name: stagehand
  docs: https://docs.stagehand.dev
  contact: ""

targets:
  python:
    edition: python.2025-11-20
    package_name: stagehand
    project_name: stagehand
    production_repo: browserbase/stagehand-python
    publish:
      pypi: true
  go:
    edition: go.2025-10-08
    package_name: stagehand
    production_repo: browserbase/stagehand-go
    options:
      enable_v2: true
  java:
    edition: java.2025-10-08
    reverse_domain: com.browserbase.api
    package_name: stagehand
    production_repo: browserbase/stagehand-java
    publish:
      maven:
        sonatype_platform: portal
  kotlin:
    edition: kotlin.2025-10-08
    reverse_domain: com.browserbase.api
    package_name: stagehand
    production_repo: browserbase/stagehand-kotlin
    publish:
      maven:
        sonatype_platform: portal
  ruby:
    edition: ruby.2025-10-08
    gem_name: stagehand
    production_repo: browserbase/stagehand-ruby
    publish:
      rubygems: false
  typescript:
    edition: typescript.2025-10-10
    package_name: stagehand-sdk
    production_repo: null
    publish:
      npm: false
    options:
      mcp_server: false
  php:
    edition: php.2025-10-08
    package_name: stagehand
    production_repo: browserbase/stagehand-php
    composer_package_name: browserbase/stagehand
    publish:
      packagist: true
  csharp:
    edition: csharp.2025-10-08
    package_name: stagehand
    production_repo: browserbase/stagehand-net
    publish:
      nuget: true
  # cli:
  #   edition: cli.2025-10-08
  #   binary_name: stagehand
  #   production_repo: browserbase/stagehand-cli

# `environments` is a map from the name of each environment (e.g. "sandbox",
# "production") to the corresponding URL to use.
environments:
  production: https://api.stagehand.browserbase.com
  # dev: https://api.stagehand.dev.browserbase.com
  # local: http://stagehand-api.localhost

# OpenAPI transforms applied by Stainless during SDK generation.
# This keeps the generated `packages/server-v3/openapi.v3.yaml` faithful to the Fastify+Zod source,
# while still producing a Stainless-compatible spec for codegen.
openapi:
  code_samples: mintlify
  transforms:
    # Stainless doesn't support `propertyNames` (emitted by some JSON Schema generators).
    - command: remove
      reason: Remove unsupported JSON Schema keyword
      args:
        target: "$..propertyNames"

    # An empty-schema `additionalProperties: {}` is equivalent to `true`; rewriting it as `true` avoids Stainless issues.
    - command: update
      reason: Treat record value schema as any
      args:
        target: "$.components.schemas.BrowserbaseSessionCreateParams.properties.userMetadata.additionalProperties"
        value: true
    - command: update
      reason: Treat record value schema as any
      args:
        target: "$.components.schemas.BrowserbaseSessionCreateParamsOutput.properties.userMetadata.additionalProperties"
        value: true
    - command: update
      reason: Treat record value schema as any
      args:
        target: "$.components.schemas.ExtractRequest.properties.schema.additionalProperties"
        value: true
    - command: update
      reason: Treat record value schema as any
      args:
        target: "$.components.schemas.AgentResultData.properties.metadata.additionalProperties"
        value: true
    - command: update
      reason: Treat record value schema as any
      args:
        target: "$.components.schemas.AgentResultDataOutput.properties.metadata.additionalProperties"
        value: true
    - command: update
      reason: Treat passthrough schema as any
      args:
        target: "$.components.schemas.AgentAction.additionalProperties"
        value: true

    # Add a stable title to help Stainless infer a consistent name for this anonymous array schema.
    - command: merge
      reason: Improve name inference for anonymous arrays
      args:
        target: '$.components.schemas.BrowserbaseSessionCreateParams.properties.proxies.anyOf[?(@.type == "array")]'
        value:
          title: ProxyConfigList
    - command: merge
      reason: Improve name inference for anonymous arrays
      args:
        target: '$.components.schemas.BrowserbaseSessionCreateParamsOutput.properties.proxies.anyOf[?(@.type == "array")]'
        value:
          title: ProxyConfigList

    # `result` is intentionally untyped and should be treated as `any` in Stainless.
    - command: merge
      reason: Treat StreamEventSystemData.result as any
      args:
        target: "$.components.schemas.StreamEventSystemData.properties.result"
        value:
          x-stainless-any: true
    - command: merge
      reason: Treat StreamEventSystemDataOutput.result as any
      args:
        target: "$.components.schemas.StreamEventSystemDataOutput.properties.result"
        value:
          x-stainless-any: true

# `resources` define the structure and organization for your API, such as how
# methods and models are grouped together and accessed. See the [configuration
# guide] for more information.
#
# [configuration guide]: https://www.stainless.com/docs/guides/configure#resources
resources:
  sessions:
    models:
      action: "#/components/schemas/Action"
      model_config: "#/components/schemas/ModelConfig"
      stream_event: "#/components/schemas/StreamEvent"
    methods:
      start: post /v1/sessions/start
      act:
        endpoint: post /v1/sessions/{id}/act
        type: http
        streaming:
          param_discriminator: streamResponse
          stream_event_model: sessions.stream_event
          params_type_name: streamResponse
      extract:
        endpoint: post /v1/sessions/{id}/extract
        type: http
        streaming:
          param_discriminator: streamResponse
          stream_event_model: sessions.stream_event
          params_type_name: streamResponse
      observe:
        endpoint: post /v1/sessions/{id}/observe
        type: http
        streaming:
          param_discriminator: streamResponse
          stream_event_model: sessions.stream_event
          params_type_name: streamResponse
      execute:
        endpoint: post /v1/sessions/{id}/agentExecute
        type: http
        streaming:
          param_discriminator: streamResponse
          stream_event_model: sessions.stream_event
          params_type_name: streamResponse
      navigate: post /v1/sessions/{id}/navigate
      replay: get /v1/sessions/{id}/replay
      end: post /v1/sessions/{id}/end

streaming:
  on_event:
    - data_starts_with: '{"data":{"status":"finished"'
      handle: done
    - data_starts_with: error
      handle: error
    - event_type: null
      handle: yield

settings:
  # All generated integration tests that hit the prism mock http server are marked
  # as skipped. Removing this setting or setting it to false enables tests, but
  # doing so may result in test failures due to bugs in the test server.
  #
  # [prism mock http server]: https://stoplight.io/open-source/prism
  disable_mock_tests: true
  license: MIT

# `client_settings` define settings for the API client, such as extra constructor
# arguments (used for authentication), retry behavior, idempotency, etc.
client_settings:
  opts:
    BROWSERBASE_API_KEY:
      type: string
      read_env: BROWSERBASE_API_KEY
      description: Your [Browserbase API Key](https://www.browserbase.com/settings)
      nullable: false
      auth:
        security_scheme: BBApiKeyAuth
    BROWSERBASE_PROJECT_ID:
      type: string
      read_env: BROWSERBASE_PROJECT_ID
      description: Your [Browserbase Project ID](https://www.browserbase.com/settings)
      nullable: false
      auth:
        security_scheme: BBProjectIdAuth
    MODEL_API_KEY:
      type: string
      read_env: MODEL_API_KEY
      description: Your LLM provider API key (e.g. OPENAI_API_KEY, ANTHROPIC_API_KEY, etc.)
      nullable: false
      auth:
        security_scheme: LLMModelApiKeyAuth

security_schemes:
  BBApiKeyAuth:
    type: apiKey
    in: header
    name: x-bb-api-key
  BBProjectIdAuth:
    type: apiKey
    in: header
    name: x-bb-project-id
  LLMModelApiKeyAuth:
    type: apiKey
    in: header
    name: x-model-api-key

security:
  - BBApiKeyAuth: []
    BBProjectIdAuth: []
    LLMModelApiKeyAuth: []

# `readme` is used to configure the code snippets that will be rendered in the
# README.md of various SDKs.
readme:
  example_requests:
    default:
      type: request
      endpoint: post /v1/sessions/start
      params:
        modelName: "openai/gpt-5-nano"
    headline:
      type: request
      endpoint: post /v1/sessions/{id}/act
      params:
        input: "click the first link on the page"
        id: "00000000-your-session-id-000000000000"

diagnostics:
  ignored:
    Ruby/NameNotAllowed: true
    Ruby/NameShadowedBuiltin: true


================================================
FILE: tsconfig.base.json
================================================
{
  "compilerOptions": {
    "target": "ES2022",
    "esModuleInterop": true,
    "allowSyntheticDefaultImports": true,
    "noImplicitAny": true,
    "module": "ESNext",
    "moduleResolution": "node",
    "sourceMap": true,
    "inlineSources": true,
    "declaration": true,
    "skipLibCheck": true
  }
}


================================================
FILE: tsconfig.json
================================================
{
  "extends": "./tsconfig.base.json",
  "compilerOptions": {
    "outDir": "dist",
    "baseUrl": ".",
    "paths": {
      "*": ["node_modules/*", "packages/core/lib/types/*"],
      "@/*": ["./*"]
    }
  },
  "exclude": ["node_modules", "dist", ".eslintrc.cjs"]
}


================================================
FILE: turbo.json
================================================
{
  "$schema": "https://v2-8-10.turborepo.dev/schema.json",
  "globalEnv": [
    "CI"
  ],
  "globalDependencies": [
    ".github/workflows/ci.yml",
    "package.json",
    "packages/*/package.json",
    "tsconfig.json",
    "tsconfig.base.json",
    "eslint.config.mjs",
    ".prettierrc",
    ".prettierignore"
  ],
  "tasks": {
    "build": {
      "dependsOn": ["^build"],
      "outputs": [
        "dist/**"
      ],
      "inputs": [
        "**/*.ts",
        "**/*.js",
        "package.json",
        "tsconfig.json",
        "tsconfig.*.json",
        "!dist/**"
      ]
    },
    "@browserbasehq/stagehand#build": {
      "dependsOn": [
        "^build",
        "gen-version",
        "build-dom-scripts:dom",
        "build-dom-scripts:locator",
        "build-dom-scripts:screenshot",
        "build-dom-scripts:a11y"
      ],
      "outputs": [
        "dist/**"
      ],
      "inputs": [
        "**/*.ts",
        "**/*.js",
        "package.json",
        "tsconfig.json",
        "tsconfig.*.json",
        "!lib/version.ts",
        "!lib/dom/build/**",
        "!lib/v3/dom/build/**",
        "!dist/**"
      ]
    },
    "@browserbasehq/stagehand-server-v3#build": {
      "dependsOn": ["^build"],
      "outputs": [
        "dist/**",
        "openapi.v3.yaml"
      ],
      "inputs": [
        "**/*.ts",
        "**/*.js",
        "package.json",
        "tsconfig.json",
        "tsconfig.*.json",
        "!dist/**",
        "!openapi.v3.yaml"
      ]
    },
    "@browserbasehq/stagehand-server-v4#build": {
      "dependsOn": ["^build"],
      "outputs": [
        "dist/**",
        "openapi.v4.yaml"
      ],
      "inputs": [
        "**/*.ts",
        "**/*.js",
        "package.json",
        "tsconfig.json",
        "tsconfig.*.json",
        "!dist/**",
        "!openapi.v4.yaml"
      ]
    },
    "@browserbasehq/browse-cli#build": {
      "dependsOn": ["^build"],
      "outputs": [
        "dist/**"
      ],
      "inputs": [
        "**/*.ts",
        "**/*.js",
        "package.json",
        "tsconfig.json",
        "tsup.config.ts",
        "!dist/**"
      ]
    },
    "@browserbasehq/stagehand-server-v4#gen:openapi": {
      "dependsOn": ["^build:esm"],
      "outputs": ["openapi.v4.yaml"],
      "inputs": [
        "src/**/*.ts",
        "scripts/gen-openapi.ts",
        "package.json",
        "tsconfig.json",
        "tsconfig.*.json",
        "!openapi.v4.yaml"
      ]
    },
    "@browserbasehq/stagehand#build:esm": {
      "dependsOn": [
        "^build:esm",
        "gen-version",
        "build-dom-scripts:dom",
        "build-dom-scripts:locator",
        "build-dom-scripts:screenshot",
        "build-dom-scripts:a11y"
      ],
      "outputs": [
        "dist/esm/**"
      ],
      "inputs": [
        "**/*.ts",
        "**/*.js",
        "package.json",
        "tsconfig.json",
        "tsconfig.*.json",
        "!lib/version.ts",
        "!lib/dom/build/**",
        "!lib/v3/dom/build/**",
        "!dist/**"
      ]
    },
    "@browserbasehq/stagehand#build:cjs": {
      "dependsOn": [
        "^build:cjs",
        "gen-version",
        "build-dom-scripts:dom",
        "build-dom-scripts:locator",
        "build-dom-scripts:screenshot",
        "build-dom-scripts:a11y"
      ],
      "outputs": [
        "dist/cjs/**"
      ],
      "inputs": [
        "**/*.ts",
        "**/*.js",
        "package.json",
        "tsconfig.json",
        "tsconfig.*.json",
        "!lib/version.ts",
        "!lib/dom/build/**",
        "!lib/v3/dom/build/**",
        "!dist/**"
      ]
    },
    "gen-version": {
      "outputs": ["lib/version.ts"],
      "inputs": [
        "scripts/gen-version.ts",
        "package.json",
        "tsconfig.json",
        "tsconfig.*.json",
        "!lib/version.ts"
      ]
    },
    "build-dom-scripts:dom": {
      "outputs": [
        "lib/v3/dom/build/v3-index.js",
        "lib/v3/dom/build/scriptV3Content.ts",
        "lib/v3/dom/build/rerender-index.js",
        "lib/v3/dom/build/reRenderScriptContent.ts"
      ],
      "inputs": [
        "lib/v3/dom/genDomScripts.ts",
        "lib/v3/dom/**/*.ts",
        "!lib/v3/dom/build/**",
        "package.json",
        "tsconfig.json",
        "tsconfig.*.json"
      ]
    },
    "build-dom-scripts:locator": {
      "outputs": [
        "lib/v3/dom/build/locatorScripts.generated.ts"
      ],
      "inputs": [
        "lib/v3/dom/genLocatorScripts.ts",
        "lib/v3/dom/locatorScripts/**/*.ts",
        "!lib/v3/dom/build/**",
        "package.json",
        "tsconfig.json",
        "tsconfig.*.json"
      ]
    },
    "build-dom-scripts:screenshot": {
      "outputs": [
        "lib/v3/dom/build/screenshotScripts.generated.ts"
      ],
      "inputs": [
        "lib/v3/dom/genScreenshotScripts.ts",
        "lib/v3/dom/screenshotScripts/**/*.ts",
        "!lib/v3/dom/build/**",
        "package.json",
        "tsconfig.json",
        "tsconfig.*.json"
      ]
    },
    "build-dom-scripts:a11y": {
      "outputs": [
        "lib/v3/dom/build/a11yScripts.generated.ts"
      ],
      "inputs": [
        "lib/v3/dom/genA11yScripts.ts",
        "lib/v3/dom/a11yScripts/**/*.ts",
        "!lib/v3/dom/build/**",
        "package.json",
        "tsconfig.json",
        "tsconfig.*.json"
      ]
    },
    "build:esm": {
      "dependsOn": ["^build:esm"],
      "outputs": [
        "dist/esm/**"
      ],
      "inputs": [
        "**/*.ts",
        "**/*.js",
        "package.json",
        "tsconfig.json",
        "tsconfig.*.json",
        "!dist/esm/**"
      ]
    },
    "build:esm-tests": {
      "dependsOn": ["^build:esm"],
      "outputs": ["dist/tests/**"],
      "inputs": [
        "test/**/*.ts",
        "package.json",
        "tsconfig.json",
        "tsconfig.*.json",
        "!dist/tests/**"
      ]
    },
    "build:server:dist": {
      "dependsOn": ["^build:esm"],
      "outputs": [
        "dist/lib/**",
        "dist/routes/**",
        "dist/types/**",
        "dist/*.js",
        "dist/*.js.map",
        "dist/*.d.ts"
      ],
      "inputs": [
        "src/**/*.ts",
        "package.json",
        "tsconfig.json",
        "tsconfig.*.json",
        "!dist/lib/**",
        "!dist/routes/**",
        "!dist/types/**",
        "!dist/*.js",
        "!dist/*.js.map",
        "!dist/*.d.ts"
      ]
    },
    "gen:openapi": {
      "dependsOn": ["^build:esm"],
      "outputs": ["openapi.v3.yaml"],
      "inputs": [
        "src/**/*.ts",
        "scripts/gen-openapi.ts",
        "package.json",
        "tsconfig.json",
        "tsconfig.*.json",
        "!openapi.v3.yaml"
      ]
    },
    "build:sea:esm": {
      "dependsOn": ["^build:esm"],
      "outputs": [
        "dist/sea/**",
        "dist/app.mjs"
      ],
      "env": [
        "SEA_BUILD_MODE",
        "SEA_TARGET_PLATFORM",
        "SEA_TARGET_ARCH",
        "SEA_BINARY_NAME"
      ],
      "inputs": [
        "src/**/*.ts",
        "scripts/**/*.ts",
        "package.json",
        "tsconfig.json",
        "tsconfig.*.json",
        "!dist/sea/**",
        "!dist/app.mjs"
      ]
    },
    "build:sea:cjs": {
      "dependsOn": ["^build:cjs"],
      "outputs": ["dist/sea/**"],
      "env": [
        "SEA_BUILD_MODE",
        "SEA_TARGET_PLATFORM",
        "SEA_TARGET_ARCH",
        "SEA_BINARY_NAME"
      ],
      "inputs": [
        "src/**/*.ts",
        "scripts/**/*.ts",
        "package.json",
        "tsconfig.json",
        "tsconfig.*.json",
        "!dist/sea/**"
      ]
    },
    "build:cjs": {
      "dependsOn": ["^build:cjs"],
      "outputs": [
        "dist/cjs/**"
      ],
      "inputs": [
        "**/*.ts",
        "**/*.js",
        "package.json",
        "tsconfig.json",
        "tsconfig.*.json",
        "!dist/cjs/**"
      ]
    },
    "build:cli": {
      "dependsOn": ["^build:esm"],
      "outputs": ["dist/cli/**"],
      "inputs": [
        "cli.ts",
        "evals.config.json",
        "scripts/**",
        "!dist/cli/**"
      ]
    },
    "lint": {
      "dependsOn": ["^build"],
      "outputs": [],
      "inputs": [
        "**/*.ts",
        "**/*.tsx",
        "**/*.js",
        "**/*.jsx",
        "**/*.mjs",
        "**/*.cjs",
        "**/*.mts",
        "**/*.cts",
        "**/*.md",
        "**/*.mdx",
        "**/*.yml",
        "**/*.yaml",
        "package.json",
        "tsconfig.json",
        "tsconfig.*.json",
        "!dist/**",
        "!node_modules/**",
        "!.turbo/**"
      ]
    },
    "format": {
      "outputs": [],
      "cache": false
    },
    "test": {
      "dependsOn": [],
      "outputs": [],
      "inputs": [
        "**/*.spec.ts",
        "**/*.test.ts"
      ]
    },
    "test:core": {
      "dependsOn": ["build:esm"],
      "outputs": [],
      "cache": false,
      "env": [
        "BROWSERBASE_FLOW_LOGS",
        "VITEST_CONSOLE_REPORTER"
      ],
      "inputs": [
        "tests/**/*.ts",
        "package.json",
        "tsconfig.json",
        "tsconfig.*.json"
      ]
    },
    "test:e2e": {
      "dependsOn": ["build:esm"],
      "outputs": [
        "playwright-report/**",
        "test-results/**"
      ],
      "cache": false,
      "env": [
        "BB_API_KEY",
        "BB_PROJECT_ID",
        "BROWSERBASE_REGION",
        "BROWSERBASE_SESSION_LIMIT_PER_E2E_TEST",
        "IFRAME_CHILD_FRAME_TIMEOUT_MS",
        "IFRAME_DEBUG",
        "IFRAME_POPUP_TIMEOUT_MS",
        "IFRAME_POPUP_URL_TIMEOUT_MS",
        "KEEP_ALIVE_ACTION_EXIT_TIMEOUT_MS",
        "KEEP_ALIVE_BB_INFO_TIMEOUT_MS",
        "KEEP_ALIVE_BB_TIMEOUT_MS",
        "KEEP_ALIVE_DEBUG",
        "KEEP_ALIVE_LOCAL_INFO_TIMEOUT_MS",
        "KEEP_ALIVE_LOCAL_TIMEOUT_MS",
        "KEEP_ALIVE_STAY_OPEN_MS",
        "KEEP_ALIVE_VIEW_MS",
        "LOCAL_SESSION_LIMIT_PER_E2E_TEST",
        "PLAYWRIGHT_CONSOLE_REPORTER",
        "STAGEHAND_BROWSER_TARGET",
        "STAGEHAND_API_URL"
      ],
      "passThroughEnv": [
        "ANTHROPIC_API_KEY",
        "BROWSERBASE_API_KEY",
        "BROWSERBASE_CDP_CONNECT_MAX_MS",
        "BROWSERBASE_PROJECT_ID",
        "BROWSERBASE_SESSION_CREATE_MAX_MS",
        "CHROME_PATH",
        "CTRF_JUNIT_PATH",
        "GEMINI_API_KEY",
        "GOOGLE_GENERATIVE_AI_API_KEY",
        "HEADLESS",
        "LLM_MAX_MS",
        "NODE_OPTIONS",
        "NODE_V8_COVERAGE",
        "OPENAI_API_KEY",
        "STAGEHAND_SERVER_TARGET"
      ],
      "inputs": [
        "lib/v3/tests/**/*.ts",
        "package.json",
        "tsconfig.json",
        "tsconfig.*.json",
        "!playwright-report/**",
        "!test-results/**"
      ]
    },
    "test:evals": {
      "dependsOn": ["build:esm", "build:cli"],
      "outputs": [],
      "cache": false,
      "env": [
        "AGENT_EVAL_MAX_STEPS",
        "BRAINTRUST_API_KEY",
        "EVAL_AGENT_MODELS",
        "EVAL_AGENT_MODELS_CUA",
        "EVAL_CATEGORIES",
        "EVAL_DATASET",
        "EVAL_ENV",
        "EVAL_GAIA_FILE",
        "EVAL_GAIA_LEVEL",
        "EVAL_GAIA_LIMIT",
        "EVAL_GAIA_SAMPLE",
        "EVAL_MAX_CONCURRENCY",
        "EVAL_MAX_K",
        "EVAL_MODELS",
        "EVAL_ONLINEMIND2WEB_LIMIT",
        "EVAL_ONLINEMIND2WEB_SAMPLE",
        "EVAL_PROVIDER",
        "EVAL_TRIAL_COUNT",
        "EVAL_WEBVOYAGER_LIMIT",
        "EVAL_WEBVOYAGER_SAMPLE",
        "OP_AUTO_ENV_DISABLE",
        "OP_ENV_FILE",
        "STAGEHAND_BROWSER_TARGET",
        "USE_API"
      ],
      "passThroughEnv": [
        "ANTHROPIC_API_KEY",
        "BROWSERBASE_API_KEY",
        "BROWSERBASE_CDP_CONNECT_MAX_MS",
        "BROWSERBASE_PROJECT_ID",
        "BROWSERBASE_SESSION_CREATE_MAX_MS",
        "CHROME_PATH",
        "CTRF_JUNIT_PATH",
        "GEMINI_API_KEY",
        "GOOGLE_GENERATIVE_AI_API_KEY",
        "HEADLESS",
        "LLM_MAX_MS",
        "NODE_OPTIONS",
        "NODE_V8_COVERAGE",
        "OPENAI_API_KEY",
        "STAGEHAND_SERVER_TARGET"
      ],
      "inputs": [
        "scripts/**",
        "cli.ts",
        "evals.config.json",
        "package.json",
        "tsconfig.json",
        "tsconfig.*.json"
      ]
    },
    "test:server": {
      "dependsOn": ["build:sea:esm", "build:esm-tests"],
      "outputs": [],
      "cache": false,
      "env": [
        "BB_ENV",
        "NODE_ENV",
        "NODE_TEST_CONSOLE_REPORTER",
        "NODE_TEST_REPORTER",
        "NODE_TEST_REPORTER_DESTINATION",
        "SEA_BINARY_NAME",
        "STAGEHAND_BASE_URL",
        "STAGEHAND_SEA_CACHE_DIR",
        "STAGEHAND_TEST_LOCAL_CONNECT_TIMEOUT_MS"
      ],
      "passThroughEnv": [
        "ANTHROPIC_API_KEY",
        "BROWSERBASE_API_KEY",
        "BROWSERBASE_CDP_CONNECT_MAX_MS",
        "BROWSERBASE_PROJECT_ID",
        "BROWSERBASE_SESSION_CREATE_MAX_MS",
        "CHROME_PATH",
        "CTRF_JUNIT_PATH",
        "GEMINI_API_KEY",
        "GOOGLE_GENERATIVE_AI_API_KEY",
        "HEADLESS",
        "LLM_MAX_MS",
        "NODE_OPTIONS",
        "NODE_V8_COVERAGE",
        "OPENAI_API_KEY",
        "STAGEHAND_BROWSER_TARGET",
        "STAGEHAND_SERVER_TARGET"
      ],
      "inputs": [
        "test/**/*.ts",
        "scripts/**",
        "src/**/*.ts",
        "package.json",
        "tsconfig.json",
        "tsconfig.*.json"
      ]
    },
    "test:cli": {
      "dependsOn": ["build"],
      "outputs": [],
      "cache": false,
      "inputs": [
        "tests/**/*.ts",
        "src/**/*.ts",
        "package.json",
        "tsconfig.json",
        "vitest.config.ts"
      ]
    },
    "docs": {
      "persistent": true,
      "cache": false
    },
    "dev": {
      "persistent": true,
      "cache": false
    }
  }
}