@@ -139,7 +139,7 @@ def __init__(
139
139
self ._in_process = False
140
140
self ._async_client : Optional [httpx .AsyncClient ] = None
141
141
142
- async def info (self ) -> dict [str , Any ]:
142
+ def info (self ) -> dict [str , Any ]:
143
143
"""
144
144
:return: Dictionary containing backend configuration details.
145
145
"""
@@ -190,7 +190,7 @@ async def process_shutdown(self):
190
190
if not self ._in_process :
191
191
raise RuntimeError ("Backend not started up for process." )
192
192
193
- await self ._async_client .aclose ()
193
+ await self ._async_client .aclose () # type: ignore [union-attr]
194
194
self ._async_client = None
195
195
self ._in_process = False
196
196
@@ -210,7 +210,7 @@ async def validate(self):
210
210
# Model is set, use /health endpoint as first check
211
211
target = f"{ self .target } { self .HEALTH_PATH } "
212
212
headers = self ._get_headers ()
213
- response = await self ._async_client .get (target , headers = headers )
213
+ response = await self ._async_client .get (target , headers = headers ) # type: ignore [union-attr]
214
214
response .raise_for_status ()
215
215
216
216
return
@@ -258,7 +258,7 @@ async def available_models(self) -> list[str]:
258
258
target = f"{ self .target } { self .MODELS_PATH } "
259
259
headers = self ._get_headers ()
260
260
params = self ._get_params (self .MODELS_KEY )
261
- response = await self ._async_client .get (target , headers = headers , params = params )
261
+ response = await self ._async_client .get (target , headers = headers , params = params ) # type: ignore [union-attr]
262
262
response .raise_for_status ()
263
263
264
264
return [item ["id" ] for item in response .json ()["data" ]]
@@ -305,7 +305,7 @@ async def resolve(
305
305
request_id = request .request_id ,
306
306
request_args = {
307
307
"request_type" : request .request_type ,
308
- "output_token_count" : request .constraints .get ("max_output_tokens " ),
308
+ "output_token_count" : request .constraints .get ("output_tokens " ),
309
309
** request .params ,
310
310
},
311
311
value = "" ,
@@ -324,15 +324,15 @@ async def resolve(
324
324
{
325
325
"prompt" : request .content ,
326
326
"request_id" : request .request_id ,
327
- "output_token_count" : request .constraints .get ("max_output_tokens " ),
327
+ "output_token_count" : request .constraints .get ("output_tokens " ),
328
328
"stream_response" : request .params .get ("stream" , self .stream_response ),
329
329
** request .params ,
330
330
}
331
331
if request .request_type == "text_completions"
332
332
else {
333
333
"content" : request .content ,
334
334
"request_id" : request .request_id ,
335
- "output_token_count" : request .constraints .get ("max_output_tokens " ),
335
+ "output_token_count" : request .constraints .get ("output_tokens " ),
336
336
"stream_response" : request .params .get ("stream" , self .stream_response ),
337
337
** request .params ,
338
338
}
@@ -345,7 +345,7 @@ async def resolve(
345
345
if delta is not None :
346
346
if request_info .request_timings .first_iteration is None :
347
347
request_info .request_timings .first_iteration = time .time ()
348
- response .value += delta
348
+ response .value += delta # type: ignore [operator]
349
349
response .delta = delta
350
350
request_info .request_timings .last_iteration = time .time ()
351
351
response .iterations += 1
@@ -396,7 +396,7 @@ async def text_completions(
396
396
yield None , None # Initial yield for async iterator to signal start
397
397
398
398
if not stream_response :
399
- response = await self ._async_client .post (
399
+ response = await self ._async_client .post ( # type: ignore [union-attr]
400
400
target ,
401
401
headers = headers ,
402
402
params = params ,
@@ -411,7 +411,7 @@ async def text_completions(
411
411
return
412
412
413
413
body .update ({"stream" : True , "stream_options" : {"include_usage" : True }})
414
- async with self ._async_client .stream (
414
+ async with self ._async_client .stream ( # type: ignore [union-attr]
415
415
"POST" ,
416
416
target ,
417
417
headers = headers ,
@@ -474,7 +474,7 @@ async def chat_completions(
474
474
yield None , None # Initial yield for async iterator to signal start
475
475
476
476
if not stream_response :
477
- response = await self ._async_client .post (
477
+ response = await self ._async_client .post ( # type: ignore [union-attr]
478
478
target , headers = headers , params = params , json = body
479
479
)
480
480
response .raise_for_status ()
@@ -486,7 +486,7 @@ async def chat_completions(
486
486
return
487
487
488
488
body .update ({"stream" : True , "stream_options" : {"include_usage" : True }})
489
- async with self ._async_client .stream (
489
+ async with self ._async_client .stream ( # type: ignore [union-attr]
490
490
"POST" , target , headers = headers , params = params , json = body
491
491
) as stream :
492
492
stream .raise_for_status ()
0 commit comments