Skip to content

Commit 3742dbe

Browse files
Update test_browser_use.py
1 parent 18625cf commit 3742dbe

File tree

1 file changed

+56
-50
lines changed

1 file changed

+56
-50
lines changed

tests/test_browser_use.py

Lines changed: 56 additions & 50 deletions
Original file line number | Diff line number | Diff line change
@@ -3,19 +3,18 @@
33
# @Author : wenshao
44
# @ProjectName: browser-use-webui
55
# @FileName: test_browser_use.py
6-
import pdb
76

87
from dotenv import load_dotenv
98

109
load_dotenv()
1110
import sys
1211

1312
sys.path.append(".")
13+
import asyncio
1414
import os
1515
import sys
1616
from pprint import pprint
1717

18-
import asyncio
1918
from browser_use import Agent
2019
from browser_use.agent.views import AgentHistoryList
2120

@@ -25,16 +24,16 @@
2524
async def test_browser_use_org():
2625
from browser_use.browser.browser import Browser, BrowserConfig
2726
from browser_use.browser.context import (
28-
BrowserContext,
2927
BrowserContextConfig,
3028
BrowserContextWindowSize,
3129
)
30+
3231
llm = utils.get_llm_model(
3332
provider="azure_openai",
3433
model_name="gpt-4o",
3534
temperature=0.8,
3635
base_url=os.getenv("AZURE_OPENAI_ENDPOINT", ""),
37-
api_key=os.getenv("AZURE_OPENAI_API_KEY", "")
36+
api_key=os.getenv("AZURE_OPENAI_API_KEY", ""),
3837
)
3938

4039
window_w, window_h = 1920, 1080
@@ -43,16 +42,18 @@ async def test_browser_use_org():
4342
config=BrowserConfig(
4443
headless=False,
4544
disable_security=True,
46-
extra_chromium_args=[f'--window-size={window_w},{window_h}'],
45+
extra_chromium_args=[f"--window-size={window_w},{window_h}"],
4746
)
4847
)
4948
async with await browser.new_context(
50-
config=BrowserContextConfig(
51-
trace_path='./tmp/traces',
52-
save_recording_path="./tmp/record_videos",
53-
no_viewport=False,
54-
browser_window_size=BrowserContextWindowSize(width=window_w, height=window_h),
55-
)
49+
config=BrowserContextConfig(
50+
trace_path="./tmp/traces",
51+
save_recording_path="./tmp/record_videos",
52+
no_viewport=False,
53+
browser_window_size=BrowserContextWindowSize(
54+
width=window_w, height=window_h
55+
),
56+
)
5657
) as browser_context:
5758
agent = Agent(
5859
task="go to google.com and type 'OpenAI' click search and give me the first url",
@@ -61,32 +62,32 @@ async def test_browser_use_org():
6162
)
6263
history: AgentHistoryList = await agent.run(max_steps=10)
6364

64-
print('Final Result:')
65+
print("Final Result:")
6566
pprint(history.final_result(), indent=4)
6667

67-
print('\nErrors:')
68+
print("\nErrors:")
6869
pprint(history.errors(), indent=4)
6970

7071
# e.g. xPaths the model clicked on
71-
print('\nModel Outputs:')
72+
print("\nModel Outputs:")
7273
pprint(history.model_actions(), indent=4)
7374

74-
print('\nThoughts:')
75+
print("\nThoughts:")
7576
pprint(history.model_thoughts(), indent=4)
7677
# close browser
7778
await browser.close()
7879

7980

8081
async def test_browser_use_custom():
81-
from playwright.async_api import async_playwright
8282
from browser_use.browser.context import BrowserContextWindowSize
83+
from browser_use.browser.browser import BrowserConfig
84+
from playwright.async_api import async_playwright
8385

84-
from src.browser.custom_browser import CustomBrowser, BrowserConfig
85-
from src.browser.custom_context import BrowserContext, BrowserContextConfig
86-
from src.controller.custom_controller import CustomController
8786
from src.agent.custom_agent import CustomAgent
8887
from src.agent.custom_prompts import CustomSystemPrompt
89-
from src.browser.custom_context import CustomBrowserContext
88+
from src.browser.custom_browser import CustomBrowser
89+
from src.browser.custom_context import BrowserContextConfig
90+
from src.controller.custom_controller import CustomController
9091

9192
window_w, window_h = 1920, 1080
9293

@@ -95,32 +96,32 @@ async def test_browser_use_custom():
9596
# model_name="gpt-4o",
9697
# temperature=0.8,
9798
# base_url=os.getenv("AZURE_OPENAI_ENDPOINT", ""),
98-
# api_key=os.getenv("AZURE_OPENAI_API_KEY", "")
99+
# api_key=os.getenv("AZURE_OPENAI_API_KEY", ""),
99100
# )
100101

101-
# llm = utils.get_llm_model(
102-
# provider="gemini",
103-
# model_name="gemini-2.0-flash-exp",
104-
# temperature=1.0,
105-
# api_key=os.getenv("GOOGLE_API_KEY", "")
106-
# )
102+
llm = utils.get_llm_model(
103+
provider="gemini",
104+
model_name="gemini-2.0-flash-exp",
105+
temperature=1.0,
106+
api_key=os.getenv("GOOGLE_API_KEY", "")
107+
)
107108

108109
# llm = utils.get_llm_model(
109110
# provider="deepseek",
110111
# model_name="deepseek-chat",
111112
# temperature=0.8
112113
# )
113114

114-
llm = utils.get_llm_model(
115-
provider="ollama",
116-
model_name="qwen2.5:7b",
117-
temperature=0.8
118-
)
115+
# llm = utils.get_llm_model(
116+
# provider="ollama", model_name="qwen2.5:7b", temperature=0.8
117+
# )
119118

120119
controller = CustomController()
121120
use_own_browser = False
122121
disable_security = True
123-
use_vision = False
122+
use_vision = True # Set to False when using DeepSeek
123+
tool_call_in_content = True # Set to True when using Ollama
124+
max_actions_per_step = 1
124125
playwright = None
125126
browser_context_ = None
126127
try:
@@ -134,14 +135,14 @@ async def test_browser_use_custom():
134135
no_viewport=False,
135136
headless=False, # 保持浏览器窗口可见
136137
user_agent=(
137-
'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 '
138-
'(KHTML, like Gecko) Chrome/85.0.4183.102 Safari/537.36'
138+
"Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 "
139+
"(KHTML, like Gecko) Chrome/85.0.4183.102 Safari/537.36"
139140
),
140141
java_script_enabled=True,
141142
bypass_csp=disable_security,
142143
ignore_https_errors=disable_security,
143144
record_video_dir="./tmp/record_videos",
144-
record_video_size={'width': window_w, 'height': window_h}
145+
record_video_size={"width": window_w, "height": window_h},
145146
)
146147
else:
147148
browser_context_ = None
@@ -150,18 +151,20 @@ async def test_browser_use_custom():
150151
config=BrowserConfig(
151152
headless=False,
152153
disable_security=True,
153-
extra_chromium_args=[f'--window-size={window_w},{window_h}'],
154+
extra_chromium_args=[f"--window-size={window_w},{window_h}"],
154155
)
155156
)
156157

157158
async with await browser.new_context(
158-
config=BrowserContextConfig(
159-
trace_path='./tmp/result_processing',
160-
save_recording_path="./tmp/record_videos",
161-
no_viewport=False,
162-
browser_window_size=BrowserContextWindowSize(width=window_w, height=window_h),
159+
config=BrowserContextConfig(
160+
trace_path="./tmp/result_processing",
161+
save_recording_path="./tmp/record_videos",
162+
no_viewport=False,
163+
browser_window_size=BrowserContextWindowSize(
164+
width=window_w, height=window_h
163165
),
164-
context=browser_context_
166+
),
167+
context=browser_context_,
165168
) as browser_context:
166169
agent = CustomAgent(
167170
task="go to google.com and type 'OpenAI' click search and give me the first url",
@@ -170,25 +173,28 @@ async def test_browser_use_custom():
170173
browser_context=browser_context,
171174
controller=controller,
172175
system_prompt_class=CustomSystemPrompt,
173-
use_vision=use_vision
176+
use_vision=use_vision,
177+
tool_call_in_content=tool_call_in_content,
178+
max_actions_per_step=max_actions_per_step
174179
)
175180
history: AgentHistoryList = await agent.run(max_steps=10)
176181

177-
print('Final Result:')
182+
print("Final Result:")
178183
pprint(history.final_result(), indent=4)
179184

180-
print('\nErrors:')
185+
print("\nErrors:")
181186
pprint(history.errors(), indent=4)
182187

183188
# e.g. xPaths the model clicked on
184-
print('\nModel Outputs:')
189+
print("\nModel Outputs:")
185190
pprint(history.model_actions(), indent=4)
186191

187-
print('\nThoughts:')
192+
print("\nThoughts:")
188193
pprint(history.model_thoughts(), indent=4)
189194
# close browser
190-
except Exception as e:
195+
except Exception:
191196
import traceback
197+
192198
traceback.print_exc()
193199
finally:
194200
# 显式关闭持久化上下文
@@ -202,6 +208,6 @@ async def test_browser_use_custom():
202208
await browser.close()
203209

204210

205-
if __name__ == '__main__':
211+
if __name__ == "__main__":
206212
# asyncio.run(test_browser_use_org())
207213
asyncio.run(test_browser_use_custom())

0 commit comments

Comments
 (0)