Skip to content

Commit 5850472

Browse files
authored
fix pt deploy lora (#999)
1 parent 4d76577 commit 5850472

File tree

2 files changed

+2
-2
lines changed

2 files changed

+2
-2
lines changed

swift/llm/infer.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -194,7 +194,7 @@ def prepare_model_template(args: InferArguments,
194 194
f'args.max_model_len: {args.max_model_len}, model.max_model_len: {model.max_model_len}')
195 195
# Preparing LoRA
196 196
if is_adapter(args.sft_type) and args.ckpt_dir is not None:
197-
if isinstance(args, DeployArguments):
197+
if isinstance(args, DeployArguments) and args.lora_request_list is not None:
198 198
for lora_request in args.lora_request_list:
199 199
model = Swift.from_pretrained(
200 200
model, lora_request.lora_local_path, lora_request.lora_name, inference_mode=True)

swift/llm/utils/argument.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1133,7 +1133,7 @@ def handle_infer_backend(self):
1133 1133
or self.infer_backend == 'pt' and isinstance(self, DeployArguments) and self.sft_type == 'lora'):
1134 1134
assert self.ckpt_dir is not None
1135 1135
self.lora_modules.append(f'default-lora={self.ckpt_dir}')
1136-
self.lora_request_list = _parse_lora_modules(self.lora_modules, True)
1136+
self.lora_request_list = _parse_lora_modules(self.lora_modules, self.infer_backend == 'vllm')
1137 1137
logger.info(f'args.lora_request_list: {self.lora_request_list}')
1138 1138

1139 1139
template_info = TEMPLATE_MAPPING[self.template_type]

0 commit comments

Comments
 (0)