| { |
| "best_global_step": 1500, |
| "best_metric": 0.7632915279870514, |
| "best_model_checkpoint": "/Users/wangyiqiu/Desktop/program/\u795e\u7ecf\u7f51\u7edc\u62d3\u6251/results/checkpoint-1500", |
| "epoch": 0.09475679090334807, |
| "eval_steps": 500, |
| "global_step": 1500, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.006317119393556538, |
| "grad_norm": 13.061114311218262, |
| "learning_rate": 4.169298799747316e-07, |
| "loss": 1.354, |
| "step": 100 |
| }, |
| { |
| "epoch": 0.012634238787113077, |
| "grad_norm": 13.682186126708984, |
| "learning_rate": 8.380711728785009e-07, |
| "loss": 1.0853, |
| "step": 200 |
| }, |
| { |
| "epoch": 0.018951358180669616, |
| "grad_norm": 4.851679801940918, |
| "learning_rate": 1.2592124657822702e-06, |
| "loss": 0.9111, |
| "step": 300 |
| }, |
| { |
| "epoch": 0.025268477574226154, |
| "grad_norm": 5.82253360748291, |
| "learning_rate": 1.6803537586860393e-06, |
| "loss": 0.7179, |
| "step": 400 |
| }, |
| { |
| "epoch": 0.03158559696778269, |
| "grad_norm": 5.032683372497559, |
| "learning_rate": 2.1014950515898086e-06, |
| "loss": 0.6422, |
| "step": 500 |
| }, |
| { |
| "epoch": 0.03158559696778269, |
| "eval_accuracy": 0.7368075050637859, |
| "eval_f1": 0.7170832086299176, |
| "eval_loss": 0.6070035696029663, |
| "eval_precision": 0.7218199142709759, |
| "eval_recall": 0.7368075050637859, |
| "eval_runtime": 582.5178, |
| "eval_samples_per_second": 96.619, |
| "eval_steps_per_second": 3.02, |
| "step": 500 |
| }, |
| { |
| "epoch": 0.03790271636133923, |
| "grad_norm": 7.424877166748047, |
| "learning_rate": 2.5226363444935774e-06, |
| "loss": 0.6155, |
| "step": 600 |
| }, |
| { |
| "epoch": 0.04421983575489577, |
| "grad_norm": 16.976255416870117, |
| "learning_rate": 2.943777637397347e-06, |
| "loss": 0.5944, |
| "step": 700 |
| }, |
| { |
| "epoch": 0.05053695514845231, |
| "grad_norm": 9.103567123413086, |
| "learning_rate": 3.3649189303011164e-06, |
| "loss": 0.5812, |
| "step": 800 |
| }, |
| { |
| "epoch": 0.056854074542008845, |
| "grad_norm": 7.061375617980957, |
| "learning_rate": 3.7860602232048853e-06, |
| "loss": 0.5965, |
| "step": 900 |
| }, |
| { |
| "epoch": 0.06317119393556538, |
| "grad_norm": 6.224503040313721, |
| "learning_rate": 4.207201516108655e-06, |
| "loss": 0.5553, |
| "step": 1000 |
| }, |
| { |
| "epoch": 0.06317119393556538, |
| "eval_accuracy": 0.7581642443409972, |
| "eval_f1": 0.7448374295446439, |
| "eval_loss": 0.5610596537590027, |
| "eval_precision": 0.7461287482946488, |
| "eval_recall": 0.7581642443409972, |
| "eval_runtime": 584.5541, |
| "eval_samples_per_second": 96.282, |
| "eval_steps_per_second": 3.009, |
| "step": 1000 |
| }, |
| { |
| "epoch": 0.06948831332912192, |
| "grad_norm": 6.321476459503174, |
| "learning_rate": 4.628342809012423e-06, |
| "loss": 0.592, |
| "step": 1100 |
| }, |
| { |
| "epoch": 0.07580543272267846, |
| "grad_norm": 8.201200485229492, |
| "learning_rate": 5.0494841019161935e-06, |
| "loss": 0.5518, |
| "step": 1200 |
| }, |
| { |
| "epoch": 0.082122552116235, |
| "grad_norm": 6.514477729797363, |
| "learning_rate": 5.470625394819963e-06, |
| "loss": 0.5897, |
| "step": 1300 |
| }, |
| { |
| "epoch": 0.08843967150979154, |
| "grad_norm": 8.077017784118652, |
| "learning_rate": 5.891766687723732e-06, |
| "loss": 0.5476, |
| "step": 1400 |
| }, |
| { |
| "epoch": 0.09475679090334807, |
| "grad_norm": 9.256704330444336, |
| "learning_rate": 6.3129079806275005e-06, |
| "loss": 0.5263, |
| "step": 1500 |
| }, |
| { |
| "epoch": 0.09475679090334807, |
| "eval_accuracy": 0.7675278064034683, |
| "eval_f1": 0.7632915279870514, |
| "eval_loss": 0.5426821112632751, |
| "eval_precision": 0.760979358962669, |
| "eval_recall": 0.7675278064034683, |
| "eval_runtime": 587.2504, |
| "eval_samples_per_second": 95.84, |
| "eval_steps_per_second": 2.995, |
| "step": 1500 |
| } |
| ], |
| "logging_steps": 100, |
| "max_steps": 47490, |
| "num_input_tokens_seen": 0, |
| "num_train_epochs": 3, |
| "save_steps": 500, |
| "stateful_callbacks": { |
| "TrainerControl": { |
| "args": { |
| "should_epoch_stop": false, |
| "should_evaluate": false, |
| "should_log": false, |
| "should_save": true, |
| "should_training_stop": false |
| }, |
| "attributes": {} |
| } |
| }, |
| "total_flos": 3157361012736000.0, |
| "train_batch_size": 32, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|