33import httpx
44import asyncio
55from langchain_openai import ChatOpenAI
6- from browser_use import Agent
6+ from browser_use import Agent , Browser
77import mcp .types as types
88from mcp .server .lowlevel import Server
99from dotenv import load_dotenv
10+ from browser_use .browser .context import BrowserContextConfig , BrowserContext
11+
# Settings for the browser context that is constructed from `config` further
# down and handed to the Agent: page-load wait limits, window size, locale,
# user agent, element highlighting and viewport expansion.
# NOTE(review): the three *_page_load_time values are presumably seconds --
# confirm against the browser-use documentation.
# NOTE(review): the user_agent string pins Chrome/85 on Windows 10; confirm
# that a fixed, dated UA is intended.
12+ config = BrowserContextConfig (
13+ wait_for_network_idle_page_load_time = 0.6 ,
14+ maximum_wait_page_load_time = 1.2 ,
15+ minimum_wait_page_load_time = 0.2 ,
16+ browser_window_size = {'width' : 1280 , 'height' : 1100 },
17+ locale = 'en-US' ,
18+ user_agent = 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/85.0.4183.102 Safari/537.36' ,
19+ highlight_elements = True ,
20+ viewport_expansion = 500 ,
21+ )
22+
# A single Browser and a single BrowserContext are created at module level;
# this `context` object is the one passed as browser_context to the Agent
# built in browser_use.
# NOTE(review): nothing in the visible code closes the browser or the context,
# and one shared context may be reused across overlapping requests -- confirm
# the intended lifetime and concurrency model.
23+ browser = Browser ()
24+ context = BrowserContext (browser = browser , config = config )
1025
# Chat model passed to the Agent as `llm`; model name and temperature (0.0)
# are fixed here at module level.
1126llm = ChatOpenAI (model = 'gpt-4o' , temperature = 0.0 )
1227planner_llm = ChatOpenAI (
@@ -20,7 +35,7 @@ async def browser_use(
2035 headers = {
2136 "User-Agent" : "browser-use (github.com/co-browser/browser-use-mcp-server)" ,
2237 }
23- agent = Agent (task = action , llm = llm , planner_llm = planner_llm , use_vision_for_planner = False , planner_interval = 1 )
38+ agent = Agent (task = action , llm = llm , browser_context = context )
2439 ret = await agent .run ()
2540 response = ret .final_result ()
2641 return [types .TextContent (type = "text" , text = response )]
0 commit comments