-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathds_config.json
More file actions
1 lines (1 loc) · 790 Bytes
/
ds_config.json
File metadata and controls
1 lines (1 loc) · 790 Bytes
1
{
  "fp16": {
    "enabled": true
  },
  "zero_optimization": {
    "stage": 3,
    "offload_optimizer": {
      "device": "cpu"
    },
    "offload_param": {
      "device": "cpu"
    },
    "overlap_comm": true,
    "contiguous_gradients": true,
    "reduce_bucket_size": 5e8,
    "stage3_prefetch_bucket_size": 5e8,
    "stage3_param_persistence_threshold": 1e6,
    "sub_group_size": 1e9,
    "stage3_max_live_parameters": 1e9,
    "stage3_max_reuse_distance": 1e9,
    "stage3_gather_16bit_weights_on_model_save": true
  },
  "train_batch_size": "auto",
  "train_micro_batch_size_per_gpu": 2,
  "gradient_accumulation_steps": 4,
  "optimizer": {
    "type": "AdamW",
    "params": {
      "lr": 5e-6,
      "weight_decay": 0.01,
      "eps": 1e-8
    }
  },
  "scheduler": {
    "type": "WarmupLR",
    "params": {
      "warmup_min_lr": 0,
      "warmup_max_lr": 5e-6,
      "warmup_num_steps": 100
    }
  },
  "steps_per_print": 10,
  "wall_clock_breakdown": true
}