File tree Expand file tree Collapse file tree 3 files changed +5
-5
lines changed Expand file tree Collapse file tree 3 files changed +5
-5
lines changed Original file line number Diff line number Diff line change @@ -46,8 +46,10 @@ def initialize_megatron(*_args, **kwargs):
46
46
else :
47
47
raise ValueError (
48
48
'You are using a streaming training dataset. Please explicitly specify `--train_iters`.' )
49
- if val_dataset is not None and args .eval_iters < 0 :
50
- if hasattr (val_dataset , '__len__' ):
49
+ if args .eval_iters < 0 :
50
+ if val_dataset is None :
51
+ args .eval_iters = 0
52
+ elif hasattr (val_dataset , '__len__' ):
51
53
dataset_sample = len (val_dataset ) // step_batch_size * step_batch_size
52
54
args .eval_iters = max (dataset_sample // args .global_batch_size , 1 )
53
55
else :
Original file line number Diff line number Diff line change @@ -15,8 +15,7 @@ def swift_datasets_provider(train_val_test_num_samples):
15
15
nonlocal val_dataset
16
16
args = get_args ()
17
17
data_parallel_size = mpu .get_data_parallel_world_size ()
18
- step_batch_size = \
19
- args .micro_batch_size * data_parallel_size
18
+ step_batch_size = args .micro_batch_size * data_parallel_size
20
19
# To avoid errors caused by the validation set being insufficient to complete a single step.
21
20
if val_dataset is not None and len (val_dataset ) < step_batch_size :
22
21
val_dataset = None
Original file line number Diff line number Diff line change @@ -17,7 +17,6 @@ def test_sft():
17
17
train_iters = 100 ,
18
18
model_author = 'swift' ,
19
19
model_name = 'swift-robot' ,
20
- eval_iters = 5 ,
21
20
sequence_parallel = True ,
22
21
finetune = True ))
23
22
You can’t perform that action at this time.
0 commit comments