s23deepak committed on
Commit
374b17e
·
verified ·
1 Parent(s): 14e1bb9

Add DeepSpeed ZeRO-3 config

Browse files
Files changed (1) hide show
  1. scripts/zero3.json +31 -0
scripts/zero3.json ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "fp16": {
3
+ "enabled": false
4
+ },
5
+ "bf16": {
6
+ "enabled": true
7
+ },
8
+ "zero_optimization": {
9
+ "stage": 3,
10
+ "offload_optimizer": {
11
+ "device": "none"
12
+ },
13
+ "offload_param": {
14
+ "device": "none"
15
+ },
16
+ "overlap_comm": true,
17
+ "contiguous_gradients": true,
18
+ "sub_group_size": 1e9,
19
+ "reduce_bucket_size": "auto",
20
+ "stage3_prefetch_bucket_size": "auto",
21
+ "stage3_param_persistence_threshold": "auto",
22
+ "stage3_max_live_parameters": 1e9,
23
+ "stage3_max_reuse_distance": 1e9,
24
+ "stage3_gather_16bit_weights_on_model_save": true
25
+ },
26
+ "gradient_accumulation_steps": "auto",
27
+ "gradient_clipping": "auto",
28
+ "train_batch_size": "auto",
29
+ "train_micro_batch_size_per_gpu": "auto",
30
+ "wall_clock_breakdown": false
31
+ }