|
19 | 19 |
|
20 | 20 | import numpy as np
|
21 | 21 |
|
| 22 | +from fastdeploy import envs |
22 | 23 | from fastdeploy.input.preprocess import InputPreprocessor
|
23 | 24 | from fastdeploy.inter_communicator import IPCSignal, ZmqClient
|
24 | 25 | from fastdeploy.metrics.work_metrics import work_process_metrics
|
@@ -144,6 +145,26 @@ def add_requests(self, task):
|
144 | 145 | api_server_logger.error(error_msg)
|
145 | 146 | raise EngineError(error_msg, error_code=400)
|
146 | 147 |
|
| 148 | + if "stop_seqs_len" in task: |
| 149 | + stop_seqs_len = task["stop_seqs_len"] |
| 150 | + max_stop_seqs_num = int(envs.FD_MAX_STOP_SEQS_NUM) |
| 151 | + if len(stop_seqs_len) > max_stop_seqs_num: |
| 152 | + error_msg = ( |
| 153 | + f"Length of stop ({stop_seqs_len}) exceeds the limit max_stop_seqs_num({max_stop_seqs_num}). " |
| 154 | + "Please reduce the number of stop or set a larger max_stop_seqs_num by `FD_MAX_STOP_SEQS_NUM`" |
| 155 | + ) |
| 156 | + api_server_logger.error(error_msg) |
| 157 | + raise EngineError(error_msg, error_code=400) |
| 158 | + stop_seqs_max_len = int(envs.FD_STOP_SEQS_MAX_LEN) |
| 159 | + for single_stop_seq_len in stop_seqs_len: |
| 160 | + if single_stop_seq_len > stop_seqs_max_len: |
| 161 | + error_msg = ( |
| 162 | + f"Length of stop_seqs({single_stop_seq_len}) exceeds the limit stop_seqs_max_len({stop_seqs_max_len}). " |
| 163 | + "Please reduce the length of stop sequences or set a larger stop_seqs_max_len by `FD_STOP_SEQS_MAX_LEN`" |
| 164 | + ) |
| 165 | + api_server_logger.error(error_msg) |
| 166 | + raise EngineError(error_msg, error_code=400) |
| 167 | + |
147 | 168 | task["preprocess_end_time"] = time.time()
|
148 | 169 | preprocess_cost_time = task["preprocess_end_time"] - task["preprocess_start_time"]
|
149 | 170 | api_server_logger.info(
|
|
0 commit comments