From 0b4c05227f5bed2d090d17957f319151df8221f8 Mon Sep 17 00:00:00 2001 From: tkattkat Date: Tue, 31 Mar 2026 12:42:19 -0700 Subject: [PATCH 1/4] Update docs / logging to reflect gpt 5.4 and gemini 3.1 family compatibility with agent hybrid mode --- .changeset/tricky-bats-pay.md | 5 +++++ packages/core/lib/v3/handlers/v3AgentHandler.ts | 2 ++ packages/docs/v3/basics/agent.mdx | 5 +++-- packages/docs/v3/references/agent.mdx | 5 +++-- 4 files changed, 13 insertions(+), 4 deletions(-) create mode 100644 .changeset/tricky-bats-pay.md diff --git a/.changeset/tricky-bats-pay.md b/.changeset/tricky-bats-pay.md new file mode 100644 index 0000000000..1f0545b55b --- /dev/null +++ b/.changeset/tricky-bats-pay.md @@ -0,0 +1,5 @@ +--- +"@browserbasehq/stagehand": patch +--- + +Update docs / logging to reflect gpt 5.4 and gemini 3.1 family compatability with agent hybrid mode diff --git a/packages/core/lib/v3/handlers/v3AgentHandler.ts b/packages/core/lib/v3/handlers/v3AgentHandler.ts index eda528df5b..6ee953d0c9 100644 --- a/packages/core/lib/v3/handlers/v3AgentHandler.ts +++ b/packages/core/lib/v3/handlers/v3AgentHandler.ts @@ -166,6 +166,8 @@ export class V3AgentHandler { if ( this.mode === "hybrid" && !baseModel.modelId.includes("gemini-3-flash") && + !baseModel.modelId.includes("gemini-3.1") && + !baseModel.modelId.includes("gpt-5.4") && !baseModel.modelId.includes("claude") ) { this.logger({ diff --git a/packages/docs/v3/basics/agent.mdx b/packages/docs/v3/basics/agent.mdx index f3274b110a..58b5856f5d 100644 --- a/packages/docs/v3/basics/agent.mdx +++ b/packages/docs/v3/basics/agent.mdx @@ -137,8 +137,9 @@ Both DOM and CUA modes have their strengths and weaknesses. Hybrid mode combines **Model Requirements:** Hybrid mode requires models that can reliably perform coordinate-based actions from screenshots. 
The following models are recommended: -- **Google:** `google/gemini-3-flash-preview` -- **Anthropic:** `anthropic/claude-sonnet-4-20250514`, `anthropic/claude-sonnet-4-5-20250929`, `anthropic/claude-haiku-4-5-20251001` +- **Google:** `google/gemini-3-flash-preview`, `google/gemini-3.1-flash-live-preview`, `google/gemini-3.1-pro-preview` +- **OpenAI:** `openai/gpt-5.4`, `openai/gpt-5.4-mini` +- **Anthropic:** Any `anthropic/claude-*` model Other models may not reliably produce accurate coordinates for clicking and typing. diff --git a/packages/docs/v3/references/agent.mdx b/packages/docs/v3/references/agent.mdx index be702649ff..959f05e598 100644 --- a/packages/docs/v3/references/agent.mdx +++ b/packages/docs/v3/references/agent.mdx @@ -131,8 +131,9 @@ interface AgentInstance { **Hybrid Mode Model Requirements:** Only use hybrid mode with models that can reliably perform coordinate-based actions: - - **Google:** `google/gemini-3-flash-preview` - - **Anthropic:** `anthropic/claude-sonnet-4-20250514`, `anthropic/claude-sonnet-4-5-20250929`, `anthropic/claude-haiku-4-5-20251001` + - **Google:** `google/gemini-3-flash-preview`, `google/gemini-3.1-flash-live-preview`, `google/gemini-3.1-pro-preview` + - **OpenAI:** `openai/gpt-5.4`, `openai/gpt-5.4-mini` + - **Anthropic:** Any `anthropic/claude-*` model Requires `experimental: true` in Stagehand constructor. 
From c75e4724320e9dee66589c8bc568a64f1c411be0 Mon Sep 17 00:00:00 2001 From: tkattkat Date: Tue, 31 Mar 2026 12:45:15 -0700 Subject: [PATCH 2/4] update claude.md --- claude.md | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/claude.md b/claude.md index fcffa95b41..19f64807c7 100644 --- a/claude.md +++ b/claude.md @@ -238,8 +238,9 @@ Hybrid mode uses both DOM-based and coordinate-based tools (act, click, type, dr **Recommended models for hybrid mode:** -- `google/gemini-3-flash-preview` -- `anthropic/claude-sonnet-4-20250514`, `anthropic/claude-sonnet-4-5-20250929`, `anthropic/claude-haiku-4-5-20251001` +- `google/gemini-3-flash-preview`, `google/gemini-3.1-flash-live-preview`, `google/gemini-3.1-pro-preview` +- `openai/gpt-5.4`, `openai/gpt-5.4-mini` +- Any `anthropic/claude-*` model ```typescript const stagehand = new Stagehand({ From 7a84b4347406affe544965d695aa2d0c2496c162 Mon Sep 17 00:00:00 2001 From: tkattkat <48974763+tkattkat@users.noreply.github.com> Date: Tue, 31 Mar 2026 15:30:50 -0700 Subject: [PATCH 3/4] Fix typo in compatibility documentation --- .changeset/tricky-bats-pay.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.changeset/tricky-bats-pay.md b/.changeset/tricky-bats-pay.md index 1f0545b55b..5eee2902b1 100644 --- a/.changeset/tricky-bats-pay.md +++ b/.changeset/tricky-bats-pay.md @@ -2,4 +2,4 @@ "@browserbasehq/stagehand": patch --- -Update docs / logging to reflect gpt 5.4 and gemini 3.1 family compatability with agent hybrid mode +Update docs / logging to reflect gpt 5.4 and gemini 3.1 family compatibility with agent hybrid mode From e89ead4fed4788558c5d138027a0dec0730c32c8 Mon Sep 17 00:00:00 2001 From: tkattkat Date: Mon, 6 Apr 2026 16:25:19 -0700 Subject: [PATCH 4/4] update incorrect model name --- claude.md | 2 +- packages/docs/v3/basics/agent.mdx | 2 +- packages/docs/v3/references/agent.mdx | 2 +- 3 files changed, 3 insertions(+), 3 deletions(-) diff --git a/claude.md b/claude.md index 
19f64807c7..c784f88a19 100644 --- a/claude.md +++ b/claude.md @@ -238,7 +238,7 @@ Hybrid mode uses both DOM-based and coordinate-based tools (act, click, type, dr **Recommended models for hybrid mode:** -- `google/gemini-3-flash-preview`, `google/gemini-3.1-flash-live-preview`, `google/gemini-3.1-pro-preview` +- `google/gemini-3-flash-preview`, `google/gemini-3.1-flash-lite-preview`, `google/gemini-3.1-pro-preview` - `openai/gpt-5.4`, `openai/gpt-5.4-mini` - Any `anthropic/claude-*` model diff --git a/packages/docs/v3/basics/agent.mdx b/packages/docs/v3/basics/agent.mdx index 58b5856f5d..3500471499 100644 --- a/packages/docs/v3/basics/agent.mdx +++ b/packages/docs/v3/basics/agent.mdx @@ -137,7 +137,7 @@ Both DOM and CUA modes have their strengths and weaknesses. Hybrid mode combines **Model Requirements:** Hybrid mode requires models that can reliably perform coordinate-based actions from screenshots. The following models are recommended: -- **Google:** `google/gemini-3-flash-preview`, `google/gemini-3.1-flash-live-preview`, `google/gemini-3.1-pro-preview` +- **Google:** `google/gemini-3-flash-preview`, `google/gemini-3.1-flash-lite-preview`, `google/gemini-3.1-pro-preview` - **OpenAI:** `openai/gpt-5.4`, `openai/gpt-5.4-mini` - **Anthropic:** Any `anthropic/claude-*` model diff --git a/packages/docs/v3/references/agent.mdx b/packages/docs/v3/references/agent.mdx index 959f05e598..65d3e9aa7c 100644 --- a/packages/docs/v3/references/agent.mdx +++ b/packages/docs/v3/references/agent.mdx @@ -131,7 +131,7 @@ interface AgentInstance { **Hybrid Mode Model Requirements:** Only use hybrid mode with models that can reliably perform coordinate-based actions: - - **Google:** `google/gemini-3-flash-preview`, `google/gemini-3.1-flash-live-preview`, `google/gemini-3.1-pro-preview` + - **Google:** `google/gemini-3-flash-preview`, `google/gemini-3.1-flash-lite-preview`, `google/gemini-3.1-pro-preview` - **OpenAI:** `openai/gpt-5.4`, `openai/gpt-5.4-mini` - **Anthropic:** Any 
`anthropic/claude-*` model