browserbase
diff --git a/‎.changeset/quick-games-try.md‎
Lines changed: 5 additions & 0 deletions b/‎.changeset/quick-games-try.md‎
Lines changed: 5 additions & 0 deletions
diff --git a/‎packages/core/lib/v3/agent/prompts/agentSystemPrompt.ts‎
Lines changed: 0 additions & 4 deletions b/‎packages/core/lib/v3/agent/prompts/agentSystemPrompt.ts‎
Lines changed: 0 additions & 4 deletions
diff --git a/‎packages/core/lib/v3/agent/tools/close.ts‎
Lines changed: 0 additions & 16 deletions b/‎packages/core/lib/v3/agent/tools/close.ts‎
Lines changed: 0 additions & 16 deletions
diff --git a/‎packages/core/lib/v3/agent/tools/index.ts‎
Lines changed: 1 addition & 3 deletions b/‎packages/core/lib/v3/agent/tools/index.ts‎
Lines changed: 1 addition & 3 deletions
diff --git a/‎packages/core/lib/v3/agent/utils/handleCloseToolCall.ts‎
Lines changed: 128 additions & 0 deletions b/‎packages/core/lib/v3/agent/utils/handleCloseToolCall.ts‎
Lines changed: 128 additions & 0 deletions
diff --git a/‎packages/core/lib/v3/agent/utils/validateExperimentalFeatures.ts‎
Lines changed: 8 additions & 2 deletions b/‎packages/core/lib/v3/agent/utils/validateExperimentalFeatures.ts‎
Lines changed: 8 additions & 2 deletions
@@ -0,0 +1,5 @@
+---
+"@browserbasehq/stagehand": patch
+---
+
+Add structured output to agent result + ensure close tool is always called
@@ -67,7 +67,6 @@ function buildToolsSection(
     { name: "wait", description: "Wait for a specified time" },
     { name: "navback", description: "Navigate back in browser history" },
     { name: "scroll", description: "Scroll the page x pixels up or down" },
-    { name: "close", description: "Mark the task as complete or failed" },
   ];
 
   const domTools: ToolDefinition[] = [
@@ -92,7 +91,6 @@ function buildToolsSection(
     { name: "wait", description: "Wait for a specified time" },
     { name: "navback", description: "Navigate back in browser history" },
     { name: "scroll", description: "Scroll the page x pixels up or down" },
-    { name: "close", description: "Mark the task as complete or failed" },
   ];
 
   const baseTools = isHybridMode ? hybridTools : domTools;
@@ -224,8 +222,6 @@ export function buildAgentSystemPrompt(
     <item>Always start by understanding the current page state</item>
     <item>Use the screenshot tool to verify page state when needed</item>
     <item>Use appropriate tools for each action</item>
-    <item>When the task is complete, use the "close" tool with taskComplete: true</item>
-    <item>If the task cannot be completed, use "close" with taskComplete: false</item>
   </guidelines>
   ${pageUnderstandingProtocol}
   <navigation>
 
@@ -3,7 +3,6 @@ import { actTool } from "./act";
 import { screenshotTool } from "./screenshot";
 import { waitTool } from "./wait";
 import { navBackTool } from "./navback";
-import { closeTool } from "./close";
 import { ariaTreeTool } from "./ariaTree";
 import { fillFormTool } from "./fillform";
 import { scrollTool, scrollVisionTool } from "./scroll";
@@ -87,7 +86,7 @@ export function createAgentTools(v3: V3, options?: V3AgentToolOptions) {
     ariaTree: ariaTreeTool(v3),
     click: clickTool(v3, provider),
     clickAndHold: clickAndHoldTool(v3, provider),
-    close: closeTool(),
+    //close: closeTool(),
     dragAndDrop: dragAndDropTool(v3, provider),
     extract: extractTool(v3, executionModel, options?.logger),
     fillForm: fillFormTool(v3, executionModel),
@@ -121,7 +120,6 @@ export type AgentToolTypesMap = {
   ariaTree: ReturnType<typeof ariaTreeTool>;
   click: ReturnType<typeof clickTool>;
   clickAndHold: ReturnType<typeof clickAndHoldTool>;
-  close: ReturnType<typeof closeTool>;
   dragAndDrop: ReturnType<typeof dragAndDropTool>;
   extract: ReturnType<typeof extractTool>;
   fillForm: ReturnType<typeof fillFormTool>;
 
@@ -0,0 +1,128 @@
+import { generateText, ModelMessage, LanguageModel, ToolSet } from "ai";
+import { z } from "zod";
+import { tool } from "ai";
+import { LogLine } from "../../types/public/logs";
+import { StagehandZodObject } from "../../zodCompat";
+interface CloseResult { // Structured outcome returned by handleCloseToolCall
+  reasoning: string; // close tool's "reasoning" input, or the response text / a default when no close call was made
+  taskComplete: boolean; // close tool's "taskComplete" input; false when no close call was made
+  messages: ModelMessage[]; // the final user prompt followed by the messages from the model response
+  output?: Record<string, unknown>; // close tool's "output" input, if any; omitted when no close call was made
+}
+
+const baseCloseSchema = z.object({ // fields every close call carries; handleCloseToolCall extends this with "output" when an output schema is given
+  reasoning: z
+    .string()
+    .describe("Brief summary of what actions were taken and the outcome"),
+  taskComplete: z
+    .boolean()
+    .describe("true if the task was fully completed, false otherwise"),
+});
+
+/**
+ * Force a final "close" tool call at the end of an agent run.
+ *
+ * Issues one extra `generateText` request in which `close` is the only tool
+ * and `toolChoice` pins the model to it, so the run ends with a structured
+ * assessment even if the main loop stopped without one. When `outputSchema`
+ * is supplied, the tool's input schema gains an `output` field shaped by it
+ * and the system prompt lists the requested fields.
+ *
+ * Errors raised by `generateText` are not caught here and propagate to the caller.
+ *
+ * @param options.model - Language model used for the closing request.
+ * @param options.inputMessages - Conversation history; sent ahead of the final user prompt.
+ * @param options.instruction - The original task text, quoted in the system prompt.
+ * @param options.outputSchema - Optional schema for extra data to return in `output`.
+ * @param options.logger - Receives log lines about the close call and its outcome.
+ * @returns The model's reasoning and completion flag, the messages added by
+ *   this call (the final user prompt followed by the response messages), and
+ *   `output` when the tool input carried one. If the result contains no `close`
+ *   call, `taskComplete` is `false` and `reasoning` falls back to the response
+ *   text (or a default string when that is empty).
+ */
+export async function handleCloseToolCall(options: {
+  model: LanguageModel;
+  inputMessages: ModelMessage[];
+  instruction: string;
+  outputSchema?: StagehandZodObject;
+  logger: (message: LogLine) => void;
+}): Promise<CloseResult> {
+  const { model, inputMessages, instruction, outputSchema, logger } = options;
+
+  logger({
+    category: "agent",
+    message: "Agent calling tool: close",
+    level: 1,
+  });
+  // Merge base close schema with user-provided output schema if present
+  const closeToolSchema = outputSchema
+    ? baseCloseSchema.extend({
+        output: outputSchema.describe(
+          "The specific data the user requested from this task",
+        ),
+      })
+    : baseCloseSchema;
+
+  // Summarise the requested fields (name -> description) for the system prompt.
+  const outputInstructions = outputSchema
+    ? `\n\nThe user also requested the following information from this task. Provide it in the "output" field:\n${JSON.stringify(
+        Object.fromEntries(
+          Object.entries(outputSchema.shape).map(([key, value]) => [
+            key,
+            value.description || "no description",
+          ]),
+        ),
+        null,
+        2,
+      )}`
+    : "";
+
+  const systemPrompt = `You are a web automation assistant that was tasked with completing a task.
+
+The task was:
+"${instruction}"
+
+Review what was accomplished and provide your final assessment in whether the task was completed successfully. you have been provided with the history of the actions taken so far, use this to determine if the task was completed successfully.${outputInstructions}
+
+Call the "close" tool with:
+1. A brief summary of what was done
+2. Whether the task was completed successfully${outputSchema ? "\n3. The requested output data based on what you found" : ""}`;
+
+  const closeTool = tool({
+    description: outputSchema
+      ? "Complete the task with your assessment and the requested output data."
+      : "Complete the task with your final assessment.",
+    inputSchema: closeToolSchema,
+    execute: async (params) => {
+      return { success: true, ...params };
+    },
+  });
+
+  const userPrompt: ModelMessage = {
+    role: "user",
+    content: outputSchema
+      ? "Provide your final assessment and the requested output data."
+      : "Provide your final assessment.",
+  };
+
+  // "close" is the only tool offered and toolChoice requires it.
+  const result = await generateText({
+    model,
+    system: systemPrompt,
+    messages: [...inputMessages, userPrompt],
+    tools: { close: closeTool } as ToolSet,
+    toolChoice: { type: "tool", toolName: "close" },
+  });
+
+  const closeToolCall = result.toolCalls.find((tc) => tc.toolName === "close");
+  const outputMessages: ModelMessage[] = [
+    userPrompt,
+    ...(result.response?.messages ?? []),
+  ];
+
+  if (!closeToolCall) {
+    // Surface the fallback instead of returning silently: the caller gets a
+    // "not complete" result built from whatever text the model produced.
+    logger({
+      category: "agent",
+      message: "Agent did not return a close tool call",
+      level: 1,
+    });
+    return {
+      reasoning: result.text || "Task execution completed",
+      taskComplete: false,
+      messages: outputMessages,
+    };
+  }
+
+  const input = closeToolCall.input as z.infer<typeof baseCloseSchema> & {
+    output?: Record<string, unknown>;
+  };
+  // Report the outcome the model actually declared rather than assuming success.
+  logger({
+    category: "agent",
+    message: input.taskComplete ? "Task completed" : "Task not completed",
+    level: 1,
+  });
+
+  return {
+    reasoning: input.reasoning,
+    taskComplete: input.taskComplete,
+    messages: outputMessages,
+    output: input.output,
+  };
+}
@@ -21,10 +21,10 @@ export interface AgentValidationOptions {
  * Validates agent configuration and experimental feature usage.
  *
  * This utility consolidates all validation checks for both CUA and non-CUA agent paths:
- * - Invalid argument errors for CUA (streaming, abort signal, message continuation, excludeTools are not supported)
+ * - Invalid argument errors for CUA (streaming, abort signal, message continuation, excludeTools, output schema are not supported)
  * - Experimental feature checks for integrations and tools (both CUA and non-CUA)
  * - Experimental feature checks for hybrid mode (requires experimental: true)
- * - Experimental feature checks for non-CUA only (callbacks, signal, messages, streaming, excludeTools)
+ * - Experimental feature checks for non-CUA only (callbacks, signal, messages, streaming, excludeTools, output schema)
  *
  * Throws StagehandInvalidArgumentError for invalid/unsupported configurations.
  * Throws ExperimentalNotConfiguredError if experimental features are used without experimental mode.
@@ -56,6 +56,9 @@ export function validateExperimentalFeatures(
     ) {
       unsupportedFeatures.push("excludeTools");
     }
+    if (executeOptions?.output) {
+      unsupportedFeatures.push("output schema");
+    }
 
     if (unsupportedFeatures.length > 0) {
       throw new StagehandInvalidArgumentError(
@@ -97,6 +100,9 @@ export function validateExperimentalFeatures(
     if (executeOptions.excludeTools && executeOptions.excludeTools.length > 0) {
       features.push("excludeTools");
     }
+    if (executeOptions.output) {
+      features.push("output schema");
+    }
   }
 
   if (features.length > 0) {
-Original file line number
+Diff line change
@@ @@ -0,0 +1,5 @@ @@
 +---
 +"@browserbasehq/stagehand": patch
 +---
++
 +Add structured output to agent result + ensure close tool is always called
Original file line number	Diff line number	Diff line change
`@@ -21,10 +21,10 @@ export interface AgentValidationOptions {`
`21`	`21`	`* Validates agent configuration and experimental feature usage.`
`22`	`22`	`*`
`23`	`23`	`* This utility consolidates all validation checks for both CUA and non-CUA agent paths:`
`24`		`- * - Invalid argument errors for CUA (streaming, abort signal, message continuation, excludeTools are not supported)`
	`24`	`+ * - Invalid argument errors for CUA (streaming, abort signal, message continuation, excludeTools, output schema are not supported)`
`25`	`25`	`* - Experimental feature checks for integrations and tools (both CUA and non-CUA)`
`26`	`26`	`* - Experimental feature checks for hybrid mode (requires experimental: true)`
`27`		`- * - Experimental feature checks for non-CUA only (callbacks, signal, messages, streaming, excludeTools)`
	`27`	`+ * - Experimental feature checks for non-CUA only (callbacks, signal, messages, streaming, excludeTools, output schema)`
`28`	`28`	`*`
`29`	`29`	`* Throws StagehandInvalidArgumentError for invalid/unsupported configurations.`
`30`	`30`	`* Throws ExperimentalNotConfiguredError if experimental features are used without experimental mode.`
`@@ -56,6 +56,9 @@ export function validateExperimentalFeatures(`
`56`	`56`	`) {`
`57`	`57`	`unsupportedFeatures.push("excludeTools");`
`58`	`58`	`}`
	`59`	`+ if (executeOptions?.output) {`
	`60`	`+ unsupportedFeatures.push("output schema");`
	`61`	`+ }`
`59`	`62`
`60`	`63`	`if (unsupportedFeatures.length > 0) {`
`61`	`64`	`throw new StagehandInvalidArgumentError(`
`@@ -97,6 +100,9 @@ export function validateExperimentalFeatures(`
`97`	`100`	`if (executeOptions.excludeTools && executeOptions.excludeTools.length > 0) {`
`98`	`101`	`features.push("excludeTools");`
`99`	`102`	`}`
	`103`	`+ if (executeOptions.output) {`
	`104`	`+ features.push("output schema");`
	`105`	`+ }`
`100`	`106`	`}`
`101`	`107`
`102`	`108`	`if (features.length > 0) {`