3040d13
1
2
3
4
5
6
7
8
9
10
11
12
13
14
{
  "zero_optimization": {
    "stage": 2,
    "allgather_partitions": true,
    "reduce_scatter": true,
    "contiguous_gradients": true
  },
  "bf16": {
    "enabled": true
  },
  "gradient_clipping": 1.0,
  "train_micro_batch_size_per_gpu": 1,
  "gradient_accumulation_steps": 4
}