@@ -60,7 +60,7 @@ def __init__(
60
60
f"Set global litellm.api_base to { value } " , category = "llm"
61
61
)
62
62
63
- def create_response (
63
+ async def create_response (
64
64
self ,
65
65
* ,
66
66
messages : list [dict [str , str ]],
@@ -77,7 +77,7 @@ def create_response(
77
77
Overrides the default_model if provided.
78
78
function_name: The name of the Stagehand function calling this method (ACT, OBSERVE, etc.)
79
79
Used for metrics tracking.
80
- **kwargs: Additional parameters to pass directly to litellm.completion
80
+ **kwargs: Additional parameters to pass directly to litellm.acompletion
81
81
(e.g., temperature, max_tokens, stream=True, specific provider arguments).
82
82
83
83
Returns:
@@ -87,7 +87,7 @@ def create_response(
87
87
88
88
Raises:
89
89
ValueError: If no model is specified (neither default nor in the call).
90
- Exception: Propagates exceptions from litellm.completion .
90
+ Exception: Propagates exceptions from litellm.acompletion .
91
91
"""
92
92
completion_model = model or self .default_model
93
93
if not completion_model :
@@ -115,16 +115,16 @@ def create_response(
115
115
filtered_params ["temperature" ] = 1
116
116
117
117
self .logger .debug (
118
- f"Calling litellm.completion with model={ completion_model } and params: { filtered_params } " ,
118
+ f"Calling litellm.acompletion with model={ completion_model } and params: { filtered_params } " ,
119
119
category = "llm" ,
120
120
)
121
121
122
122
try :
123
123
# Start tracking inference time
124
124
start_time = start_inference_timer ()
125
125
126
- # Use litellm's completion function
127
- response = litellm .completion (** filtered_params )
126
+ # Use litellm's async completion function
127
+ response = await litellm .acompletion (** filtered_params )
128
128
129
129
# Calculate inference time
130
130
inference_time_ms = get_inference_time_ms (start_time )
@@ -136,6 +136,6 @@ def create_response(
136
136
return response
137
137
138
138
except Exception as e :
139
- self .logger .error (f"Error calling litellm.completion : { e } " , category = "llm" )
139
+ self .logger .error (f"Error calling litellm.acompletion : { e } " , category = "llm" )
140
140
# Consider more specific exception handling based on litellm errors
141
141
raise
0 commit comments