@@ -41,12 +41,12 @@ async def get_next_action(model, messages, objective, session_id):
4141 print ("[Self-Operating Computer][get_next_action]" )
4242 print ("[Self-Operating Computer][get_next_action] model" , model )
4343 if model == "gpt-4" :
44- return call_gpt_4_vision_preview (messages ), None
44+ return call_gpt_4o (messages ), None
4545 if model == "gpt-4-with-som" :
46- operation = await call_gpt_4_vision_preview_labeled (messages , objective , model )
46+ operation = await call_gpt_4o_labeled (messages , objective , model )
4747 return operation , None
4848 if model == "gpt-4-with-ocr" :
49- operation = await call_gpt_4_vision_preview_ocr (messages , objective , model )
49+ operation = await call_gpt_4o_with_ocr (messages , objective , model )
5050 return operation , None
5151 if model == "agent-1" :
5252 return "coming soon"
@@ -61,7 +61,7 @@ async def get_next_action(model, messages, objective, session_id):
6161 raise ModelNotRecognizedException (model )
6262
6363
64- def call_gpt_4_vision_preview (messages ):
64+ def call_gpt_4o (messages ):
6565 if config .verbose :
6666 print ("[call_gpt_4_v]" )
6767 time .sleep (1 )
@@ -102,7 +102,7 @@ def call_gpt_4_vision_preview(messages):
102102 messages .append (vision_message )
103103
104104 response = client .chat .completions .create (
105- model = "gpt-4-vision-preview " ,
105+ model = "gpt-4o " ,
106106 messages = messages ,
107107 presence_penalty = 1 ,
108108 frequency_penalty = 1 ,
@@ -137,7 +137,7 @@ def call_gpt_4_vision_preview(messages):
137137 )
138138 if config .verbose :
139139 traceback .print_exc ()
140- return call_gpt_4_vision_preview (messages )
140+ return call_gpt_4o (messages )
141141
142142
143143def call_gemini_pro_vision (messages , objective ):
@@ -189,12 +189,12 @@ def call_gemini_pro_vision(messages, objective):
189189 if config .verbose :
190190 print ("[Self-Operating Computer][Operate] error" , e )
191191 traceback .print_exc ()
192- return call_gpt_4_vision_preview (messages )
192+ return call_gpt_4o (messages )
193193
194194
195- async def call_gpt_4_vision_preview_ocr (messages , objective , model ):
195+ async def call_gpt_4o_with_ocr (messages , objective , model ):
196196 if config .verbose :
197- print ("[call_gpt_4_vision_preview_ocr ]" )
197+ print ("[call_gpt_4o_with_ocr ]" )
198198
199199 # Construct the path to the file within the package
200200 try :
@@ -231,7 +231,7 @@ async def call_gpt_4_vision_preview_ocr(messages, objective, model):
231231 messages .append (vision_message )
232232
233233 response = client .chat .completions .create (
234- model = "gpt-4-vision-preview " ,
234+ model = "gpt-4o " ,
235235 messages = messages ,
236236 temperature = 0.7 ,
237237 max_tokens = 3000 ,
@@ -253,7 +253,7 @@ async def call_gpt_4_vision_preview_ocr(messages, objective, model):
253253 text_to_click = operation .get ("text" )
254254 if config .verbose :
255255 print (
256- "[call_gpt_4_vision_preview_ocr ][click] text_to_click" ,
256+ "[call_gpt_4o_with_ocr ][click] text_to_click" ,
257257 text_to_click ,
258258 )
259259 # Initialize EasyOCR Reader
@@ -275,15 +275,15 @@ async def call_gpt_4_vision_preview_ocr(messages, objective, model):
275275
276276 if config .verbose :
277277 print (
278- "[call_gpt_4_vision_preview_ocr ][click] text_element_index" ,
278+ "[call_gpt_4o_with_ocr ][click] text_element_index" ,
279279 text_element_index ,
280280 )
281281 print (
282- "[call_gpt_4_vision_preview_ocr ][click] coordinates" ,
282+ "[call_gpt_4o_with_ocr ][click] coordinates" ,
283283 coordinates ,
284284 )
285285 print (
286- "[call_gpt_4_vision_preview_ocr ][click] final operation" ,
286+ "[call_gpt_4o_with_ocr ][click] final operation" ,
287287 operation ,
288288 )
289289 processed_content .append (operation )
@@ -307,7 +307,7 @@ async def call_gpt_4_vision_preview_ocr(messages, objective, model):
307307 return gpt_4_fallback (messages , objective , model )
308308
309309
310- async def call_gpt_4_vision_preview_labeled (messages , objective , model ):
310+ async def call_gpt_4o_labeled (messages , objective , model ):
311311 time .sleep (1 )
312312
313313 try :
@@ -355,7 +355,7 @@ async def call_gpt_4_vision_preview_labeled(messages, objective, model):
355355 messages .append (vision_message )
356356
357357 response = client .chat .completions .create (
358- model = "gpt-4-vision-preview " ,
358+ model = "gpt-4o " ,
359359 messages = messages ,
360360 presence_penalty = 1 ,
361361 frequency_penalty = 1 ,
@@ -415,7 +415,7 @@ async def call_gpt_4_vision_preview_labeled(messages, objective, model):
415415 print (
416416 f"{ ANSI_GREEN } [Self-Operating Computer]{ ANSI_RED } [Error] Failed to get click position in percent. Trying another method { ANSI_RESET } "
417417 )
418- return call_gpt_4_vision_preview (messages )
418+ return call_gpt_4o (messages )
419419
420420 x_percent = f"{ click_position_percent [0 ]:.2f} "
421421 y_percent = f"{ click_position_percent [1 ]:.2f} "
@@ -450,7 +450,7 @@ async def call_gpt_4_vision_preview_labeled(messages, objective, model):
450450 if config .verbose :
451451 print ("[Self-Operating Computer][Operate] error" , e )
452452 traceback .print_exc ()
453- return call_gpt_4_vision_preview (messages )
453+ return call_gpt_4o (messages )
454454
455455
456456def call_ollama_llava (messages ):
@@ -742,7 +742,7 @@ def get_last_assistant_message(messages):
742742def gpt_4_fallback (messages , objective , model ):
743743 if config .verbose :
744744 print ("[gpt_4_fallback]" )
745- system_prompt = get_system_prompt ("gpt-4-vision-preview " , objective )
745+ system_prompt = get_system_prompt ("gpt-4o " , objective )
746746 new_system_message = {"role" : "system" , "content" : system_prompt }
747747 # remove and replace the first message in `messages` with `new_system_message`
748748
@@ -752,7 +752,7 @@ def gpt_4_fallback(messages, objective, model):
752752 print ("[gpt_4_fallback][updated]" )
753753 print ("[gpt_4_fallback][updated] len(messages)" , len (messages ))
754754
755- return call_gpt_4_vision_preview (messages )
755+ return call_gpt_4o (messages )
756756
757757
758758def confirm_system_prompt (messages , objective , model ):
0 commit comments