We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 0bfdcd2 commit 6e713f4 (Copy full SHA for 6e713f4)
deepspeed.json
@@ -0,0 +1,24 @@
1
+{
2
+ "bf16": {
3
+ "enabled": "auto"
4
+ },
5
+
6
+ "zero_optimization": {
7
+ "stage": 3,
8
+ "overlap_comm": true,
9
+ "contiguous_gradients": true,
10
+ "sub_group_size": 1e9,
11
+ "reduce_bucket_size": "auto",
12
+ "stage3_prefetch_bucket_size": "auto",
13
+ "stage3_param_persistence_threshold": "auto",
14
+ "stage3_max_live_parameters": 1e9,
15
+ "stage3_max_reuse_distance": 1e9,
16
+ "stage3_gather_16bit_weights_on_model_save": true
17
+ },
18
+
19
+ "gradient_accumulation_steps": "auto",
20
+ "steps_per_print": 2000,
21
+ "train_batch_size": "auto",
22
+ "train_micro_batch_size_per_gpu": "auto",
23
+ "wall_clock_breakdown": false
24
+}
0 commit comments