{
  "train_batch_size": 8,
  "gradient_accumulation_steps": 8,
  "zero_optimization": {
    "stage": 2
  },
  "mixed_precision": "bf16",
  "bf16": {
    "enabled": true
  },
  "fp16": {
    "enabled": false
  },
  "zero_allow_untested_optimizer": true
}