{ "best_global_step": 1000, "best_metric": 0.7448374295446439, "best_model_checkpoint": "/Users/wangyiqiu/Desktop/program/\u795e\u7ecf\u7f51\u7edc\u62d3\u6251/results/checkpoint-1000", "epoch": 0.06317119393556538, "eval_steps": 500, "global_step": 1000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.006317119393556538, "grad_norm": 13.061114311218262, "learning_rate": 4.169298799747316e-07, "loss": 1.354, "step": 100 }, { "epoch": 0.012634238787113077, "grad_norm": 13.682186126708984, "learning_rate": 8.380711728785009e-07, "loss": 1.0853, "step": 200 }, { "epoch": 0.018951358180669616, "grad_norm": 4.851679801940918, "learning_rate": 1.2592124657822702e-06, "loss": 0.9111, "step": 300 }, { "epoch": 0.025268477574226154, "grad_norm": 5.82253360748291, "learning_rate": 1.6803537586860393e-06, "loss": 0.7179, "step": 400 }, { "epoch": 0.03158559696778269, "grad_norm": 5.032683372497559, "learning_rate": 2.1014950515898086e-06, "loss": 0.6422, "step": 500 }, { "epoch": 0.03158559696778269, "eval_accuracy": 0.7368075050637859, "eval_f1": 0.7170832086299176, "eval_loss": 0.6070035696029663, "eval_precision": 0.7218199142709759, "eval_recall": 0.7368075050637859, "eval_runtime": 582.5178, "eval_samples_per_second": 96.619, "eval_steps_per_second": 3.02, "step": 500 }, { "epoch": 0.03790271636133923, "grad_norm": 7.424877166748047, "learning_rate": 2.5226363444935774e-06, "loss": 0.6155, "step": 600 }, { "epoch": 0.04421983575489577, "grad_norm": 16.976255416870117, "learning_rate": 2.943777637397347e-06, "loss": 0.5944, "step": 700 }, { "epoch": 0.05053695514845231, "grad_norm": 9.103567123413086, "learning_rate": 3.3649189303011164e-06, "loss": 0.5812, "step": 800 }, { "epoch": 0.056854074542008845, "grad_norm": 7.061375617980957, "learning_rate": 3.7860602232048853e-06, "loss": 0.5965, "step": 900 }, { "epoch": 0.06317119393556538, "grad_norm": 6.224503040313721, "learning_rate": 4.207201516108655e-06, "loss": 0.5553, "step": 1000 }, { "epoch": 0.06317119393556538, "eval_accuracy": 0.7581642443409972, "eval_f1": 0.7448374295446439, "eval_loss": 0.5610596537590027, "eval_precision": 0.7461287482946488, "eval_recall": 0.7581642443409972, "eval_runtime": 584.5541, "eval_samples_per_second": 96.282, "eval_steps_per_second": 3.009, "step": 1000 } ], "logging_steps": 100, "max_steps": 47490, "num_input_tokens_seen": 0, "num_train_epochs": 3, "save_steps": 500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": false }, "attributes": {} } }, "total_flos": 2104907341824000.0, "train_batch_size": 32, "trial_name": null, "trial_params": null }