File tree Expand file tree Collapse file tree 2 files changed +3
-1
lines changed Expand file tree Collapse file tree 2 files changed +3
-1
lines changed Original file line number Diff line number Diff line change @@ -130,6 +130,8 @@ async def check_length(
130
130
input_ids = tokenizer (prompt ).input_ids
131
131
token_num = len (input_ids )
132
132
133
+ if request .max_tokens is None :
134
+ request .max_tokens = max_model_len - token_num
133
135
if token_num + request .max_tokens > max_model_len :
134
136
return input_ids , create_error_response (
135
137
HTTPStatus .BAD_REQUEST ,
Original file line number Diff line number Diff line change @@ -58,7 +58,7 @@ class ChatCompletionRequest(BaseModel):
58
58
temperature : Optional [float ] = 0.7
59
59
top_p : Optional [float ] = 1.0
60
60
n : Optional [int ] = 1
61
- max_tokens : Optional [int ] = 16
61
+ max_tokens : Optional [int ] = None
62
62
stop : Optional [Union [str , List [str ]]] = Field (default_factory = list )
63
63
stream : Optional [bool ] = False
64
64
presence_penalty : Optional [float ] = 0.0
You can’t perform that action at this time.
0 commit comments