appleeji committed on
Commit
e3c1ce6
·
verified ·
1 Parent(s): 92318df

Upload ds_config.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. ds_config.json +44 -0
ds_config.json ADDED
@@ -0,0 +1,44 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bf16": {
3
+ "enabled": true
4
+ },
5
+ "fp16": {
6
+ "enabled": false
7
+ },
8
+ "optimizer": {
9
+ "type": "AdamW",
10
+ "params": {
11
+ "lr": 0,
12
+ "weight_decay": 0.05,
13
+ "adam_w_mode": true,
14
+ "betas": [
15
+ 0.9,
16
+ 0.95
17
+ ]
18
+ }
19
+ },
20
+ "scheduler": {
21
+ "type": "WarmupDecayLR",
22
+ "params": {
23
+ "warmup_min_lr": 0,
24
+ "warmup_max_lr": 5e-4,
25
+ "warmup_num_steps": 500,
26
+ "total_num_steps": 50000
27
+ }
28
+ },
29
+ "zero_optimization": {
30
+ "stage": 2,
31
+ "stage3_gather_16bit_weights_on_model_save": true,
32
+ "allgather_partitions": true,
33
+ "allgather_bucket_size": 5e8,
34
+ "overlap_comm": true,
35
+ "reduce_scatter": true,
36
+ "reduce_bucket_size": 5e8,
37
+ "contiguous_gradients": true
38
+ },
39
+ "gradient_accumulation_steps": 3,
40
+ "gradient_clipping": 1.0,
41
+ "steps_per_print": 100,
42
+ "train_micro_batch_size_per_gpu": 3,
43
+ "wall_clock_breakdown": false
44
+ }