browser-use
diff --git a/‎typescript/agent/.env.example‎
Lines changed: 5 additions & 1 deletion b/‎typescript/agent/.env.example‎
Lines changed: 5 additions & 1 deletion
diff --git a/‎typescript/agent/package.json‎
Lines changed: 2 additions & 1 deletion b/‎typescript/agent/package.json‎
Lines changed: 2 additions & 1 deletion
diff --git a/‎typescript/agent/pnpm-lock.yaml‎
Lines changed: 35 additions & 23 deletions b/‎typescript/agent/pnpm-lock.yaml‎
Lines changed: 35 additions & 23 deletions
diff --git a/‎typescript/agent/src/app/api/chat/route.ts‎
Lines changed: 154 additions & 10 deletions b/‎typescript/agent/src/app/api/chat/route.ts‎
Lines changed: 154 additions & 10 deletions
@@ -1 +1,5 @@
-AI_GATEWAY_API_KEY=""
+# AI Gateway API key
+AI_GATEWAY_API_KEY=""
+
+# Browser Use API key (read by src/app/api/chat/route.ts)
+BROWSER_USE_API_KEY=""
@@ -20,6 +20,7 @@
     "@radix-ui/react-tooltip": "^1.2.8",
     "@radix-ui/react-use-controllable-state": "^1.2.2",
     "ai": "^5.0.13",
+    "browser-use-sdk": "0.1.1",
     "class-variance-authority": "^0.7.1",
     "clsx": "^2.1.1",
     "embla-carousel-react": "^8.6.0",
@@ -36,7 +37,7 @@
     "remark-math": "^6.0.0",
     "tailwind-merge": "^3.3.1",
     "use-stick-to-bottom": "^1.1.1",
-    "zod": "^3.25.76"
+    "zod": "^4"
   },
   "devDependencies": {
     "@eslint/eslintrc": "^3",
 
@@ -1,21 +1,165 @@
-import { streamText, UIMessage, convertToModelMessages } from "ai";
+import {
+  streamText,
+  UIMessage,
+  convertToModelMessages,
+  tool,
+  ToolSet,
+  InferUITools,
+  UIDataTypes,
+  stepCountIs,
+} from "ai";
+import { z } from "zod";
+import { BrowserUse } from "browser-use-sdk";
 
-// Allow streaming responses up to 30 seconds
-export const maxDuration = 30;
+// Allow streaming responses up to 5 minutes (the value is expressed in seconds).
+// NOTE(review): presumably raised from 30 so that the polled browser tasks in
+// this file have time to complete — confirm against the hosting platform limits.
+export const maxDuration = 300;
+
+// Module-level Browser Use client shared by every tool in this file. The API
+// key is read from the BROWSER_USE_API_KEY environment variable at load time.
+const bu = new BrowserUse({
+  apiKey: process.env.BROWSER_USE_API_KEY,
+});
+
+/**
+ * Progress updates yielded by the browser tools, discriminated on `status`.
+ *
+ * - `"running"`: intermediate update carrying the most recent step of the task.
+ * - `"done"`: final update carrying the task output and the session it ran in.
+ */
+type TaskStatus =
+  | {
+      status: "running";
+
+      // Most recent entry of the task's `steps` array at polling time.
+      lastStep: BrowserUse.Tasks.TaskView.Step;
+      // Live view URL of the session, or null when the API has not reported one.
+      liveUrl: string | null;
+    }
+  | {
+      status: "done";
+
+      // Value of the task's `doneOutput`.
+      output: string;
+      liveUrl: string;
+
+      // Session the task ran in; `continueTask` accepts it to reuse the session.
+      sessionId: string;
+    };
+
+/** Delay between two consecutive task status polls, in milliseconds. */
+const POLL_INTERVAL_MS = 1000;
+
+/**
+ * Polls a Browser Use task until it finishes, yielding progress along the way.
+ *
+ * Yields a `"running"` update for every poll in which the task has at least one
+ * step, and a single `"done"` update once the task is finished and its live URL
+ * is available, after which the generator returns.
+ *
+ * Every non-terminal iteration waits `POLL_INTERVAL_MS` before polling again,
+ * including when the task has no steps yet or is finished without a live URL,
+ * so the API is never hit in a tight loop.
+ *
+ * @param taskId - Identifier returned by `bu.tasks.create`.
+ * @throws Error when the task reports `"stopped"` or a status this code does not know.
+ */
+async function* pollTask(taskId: string): AsyncGenerator<TaskStatus> {
+  while (true) {
+    const view = (await bu.tasks.retrieve(taskId, { statusOnly: false })) as BrowserUse.Tasks.TaskView;
+
+    switch (view.status) {
+      case "started":
+      case "paused": {
+        const steps = view.steps;
+
+        // Nothing to report until the task has produced its first step.
+        if (steps != null && steps.length > 0) {
+          yield {
+            status: "running",
+            lastStep: steps[steps.length - 1],
+            liveUrl: view.sessionLiveUrl ? view.sessionLiveUrl : null,
+          } satisfies TaskStatus;
+        }
+
+        break;
+      }
+
+      case "stopped":
+        // A stopped task never reaches "finished"; polling further would only
+        // repeat the same step until the route times out.
+        // NOTE(review): relies on "stopped" being terminal in the Browser Use API — confirm.
+        throw new Error(`Task ${taskId} was stopped before it finished`);
+
+      case "finished":
+        if (view.sessionLiveUrl != null) {
+          yield {
+            status: "done",
+            output: view.doneOutput,
+            liveUrl: view.sessionLiveUrl,
+            sessionId: view.sessionId,
+          } satisfies TaskStatus;
+
+          return;
+        }
+
+        // Finished but no live URL reported yet: poll again after the delay.
+        break;
+
+      default:
+        throw new Error(`Unknown status: ${view.status}`);
+    }
+
+    await new Promise((resolve) => setTimeout(resolve, POLL_INTERVAL_MS));
+  }
+}
+
+/**
+ * Tools exposed to the model. Both stream `TaskStatus` updates while the
+ * underlying Browser Use task runs.
+ */
+const tools = {
+  // Starts a new browser task.
+  runTask: tool({
+    description: "Run a task in a web browser.",
+    inputSchema: z.object({
+      task: z.string(),
+    }),
+    async *execute({ task }) {
+      const created = await bu.tasks.create({ task: task });
+
+      yield* pollTask(created.id);
+    },
+  }),
+  // Starts a follow-up task inside an existing browser session, identified by
+  // the `sessionId` reported in an earlier "done" update.
+  continueTask: tool({
+    description: "Continue a task in a web browser.",
+    inputSchema: z.object({
+      sessionId: z.string(),
+      task: z.string(),
+    }),
+    async *execute({ sessionId, task }) {
+      const created = await bu.tasks.create({ task: task, browserSettings: { sessionId: sessionId } });
+
+      yield* pollTask(created.id);
+    },
+  }),
+} satisfies ToolSet;
+
+/** UI-facing tool types inferred from the `tools` object defined in this module. */
+export type ChatTools = InferUITools<typeof tools>;
+
+/** Chat message type parameterized with `never` metadata, the default data types, and `ChatTools`. */
+export type ChatMessage = UIMessage<never, UIDataTypes, ChatTools>;
+
+// ROUTE
 
 export async function POST(req: Request) {
-  const {
-    messages,
-    model,
-    webSearch,
-  }: { messages: UIMessage[]; model: string; webSearch: boolean } =
-    await req.json();
+  const { messages, model, webSearch }: { messages: UIMessage[]; model: string; webSearch: boolean } = await req.json();
 
   const result = streamText({
     model: webSearch ? "perplexity/sonar" : model,
     messages: convertToModelMessages(messages),
     system:
-      "You are a helpful assistant that can answer questions and help with tasks",
+      "You are a helpful assistant that can answer questions and help with tasks. You can use the tools provided to you to help you answer questions and help with tasks.",
+    tools: tools,
+    stopWhen: stepCountIs(15),
   });
 
   // send sources and reasoning back to the client