Skip to content

Commit 4f6007e

Browse files
authored
fix freeze parameters bug (#325)
1 parent b8f2b7f commit 4f6007e

File tree

3 files changed

+6
-3
lines changed

3 files changed

+6
-3
lines changed

swift/llm/utils/argument.py

Lines changed: 3 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -260,7 +260,9 @@ def __post_init__(self) -> None:
260 260                  and len(
261 261                      self.custom_val_dataset_path) == 0
262 262                  and self.self_cognition_sample == 0):
263     -            raise ValueError(f'self.dataset: {self.dataset}')
    263 +            raise ValueError(
    264 +                f'self.dataset: {self.dataset}, Please input the training dataset.'
    265 +            )
264 266
265 267          if self.save_steps is None:
266 268              self.save_steps = self.eval_steps

swift/utils/run_utils.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -15,7 +15,7 @@ def get_main(
15 15
16 16      def x_main(argv: Union[List[str], _TArgsClass, NoneType] = None,
17 17                 **kwargs) -> _T:
18    -        if isinstance(argv, args_class):
   18 +        if not isinstance(argv, (list, tuple, NoneType)):
19 19              args, remaining_argv = argv, []
20 20          else:
21 21              args, remaining_argv = parse_args(args_class, argv)

swift/utils/torch_utils.py

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -123,7 +123,8 @@ def show_layers(model: Module, max_lines: Optional[int] = 20) -> None:
123 123
124 124
125 125  def freeze_model_parameters(model: Module, freeze_parameters: float) -> None:
126     -    n_parameters = np.array([p.numel() for p in model.parameters()])
    126 +    n_parameters = np.array([p.numel() for p in model.parameters()],
    127 +                            dtype=np.int64)
127 128      n_freeze_parameters = int(np.sum(n_parameters) * freeze_parameters)
128 129      n_parameters_cs = np.cumsum(n_parameters)
129 130      idx = bisect_right(n_parameters_cs, n_freeze_parameters)

0 commit comments

Comments
 (0)