| epoch: 36 | |
| LearningRate: | |
| base_lr: 0.000025 | |
| schedulers: | |
| - !PiecewiseDecay | |
| gamma: 0.1 | |
| milestones: [28, 34] | |
| - !LinearWarmup | |
| start_factor: 0.01 | |
| steps: 1000 | |
| OptimizerBuilder: | |
| clip_grad_by_norm: 1.0 | |
| optimizer: | |
| type: AdamW | |
| weight_decay: 0.0001 | |
| epoch: 36 | |
| LearningRate: | |
| base_lr: 0.000025 | |
| schedulers: | |
| - !PiecewiseDecay | |
| gamma: 0.1 | |
| milestones: [28, 34] | |
| - !LinearWarmup | |
| start_factor: 0.01 | |
| steps: 1000 | |
| OptimizerBuilder: | |
| clip_grad_by_norm: 1.0 | |
| optimizer: | |
| type: AdamW | |
| weight_decay: 0.0001 | |