| { |
| "best_metric": 0.14741940796375275, |
| "best_model_checkpoint": "./trained_models/twitter-emotion-deberta-v3-base/checkpoint-500", |
| "epoch": 6.0, |
| "global_step": 1200, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.5, |
| "eval_accuracy": 0.8405, |
| "eval_loss": 0.5359936952590942, |
| "eval_runtime": 4.1757, |
| "eval_samples_per_second": 478.965, |
| "eval_steps_per_second": 5.987, |
| "step": 100 |
| }, |
| { |
| "epoch": 1.0, |
| "eval_accuracy": 0.915, |
| "eval_loss": 0.28240880370140076, |
| "eval_runtime": 4.2049, |
| "eval_samples_per_second": 475.638, |
| "eval_steps_per_second": 5.945, |
| "step": 200 |
| }, |
| { |
| "epoch": 1.5, |
| "eval_accuracy": 0.93, |
| "eval_loss": 0.19999809563159943, |
| "eval_runtime": 4.2283, |
| "eval_samples_per_second": 473.002, |
| "eval_steps_per_second": 5.913, |
| "step": 300 |
| }, |
| { |
| "epoch": 2.0, |
| "eval_accuracy": 0.936, |
| "eval_loss": 0.13397051393985748, |
| "eval_runtime": 4.2488, |
| "eval_samples_per_second": 470.716, |
| "eval_steps_per_second": 5.884, |
| "step": 400 |
| }, |
| { |
| "epoch": 2.5, |
| "learning_rate": 2.916666666666667e-05, |
| "loss": 0.4142, |
| "step": 500 |
| }, |
| { |
| "epoch": 2.5, |
| "eval_accuracy": 0.937, |
| "eval_loss": 0.14741940796375275, |
| "eval_runtime": 4.2278, |
| "eval_samples_per_second": 473.054, |
| "eval_steps_per_second": 5.913, |
| "step": 500 |
| }, |
| { |
| "epoch": 3.0, |
| "eval_accuracy": 0.936, |
| "eval_loss": 0.15366272628307343, |
| "eval_runtime": 4.2318, |
| "eval_samples_per_second": 472.612, |
| "eval_steps_per_second": 5.908, |
| "step": 600 |
| }, |
| { |
| "epoch": 3.5, |
| "eval_accuracy": 0.939, |
| "eval_loss": 0.13712549209594727, |
| "eval_runtime": 4.2434, |
| "eval_samples_per_second": 471.315, |
| "eval_steps_per_second": 5.891, |
| "step": 700 |
| }, |
| { |
| "epoch": 4.0, |
| "eval_accuracy": 0.941, |
| "eval_loss": 0.13440823554992676, |
| "eval_runtime": 4.2389, |
| "eval_samples_per_second": 471.816, |
| "eval_steps_per_second": 5.898, |
| "step": 800 |
| }, |
| { |
| "epoch": 4.5, |
| "eval_accuracy": 0.939, |
| "eval_loss": 0.13154806196689606, |
| "eval_runtime": 4.244, |
| "eval_samples_per_second": 471.257, |
| "eval_steps_per_second": 5.891, |
| "step": 900 |
| }, |
| { |
| "epoch": 5.0, |
| "learning_rate": 8.333333333333334e-06, |
| "loss": 0.1013, |
| "step": 1000 |
| }, |
| { |
| "epoch": 5.0, |
| "eval_accuracy": 0.936, |
| "eval_loss": 0.15716207027435303, |
| "eval_runtime": 4.2453, |
| "eval_samples_per_second": 471.109, |
| "eval_steps_per_second": 5.889, |
| "step": 1000 |
| }, |
| { |
| "epoch": 5.5, |
| "eval_accuracy": 0.938, |
| "eval_loss": 0.15671509504318237, |
| "eval_runtime": 4.2362, |
| "eval_samples_per_second": 472.124, |
| "eval_steps_per_second": 5.902, |
| "step": 1100 |
| }, |
| { |
| "epoch": 6.0, |
| "eval_accuracy": 0.939, |
| "eval_loss": 0.15347838401794434, |
| "eval_runtime": 4.2428, |
| "eval_samples_per_second": 471.385, |
| "eval_steps_per_second": 5.892, |
| "step": 1200 |
| }, |
| { |
| "epoch": 6.0, |
| "step": 1200, |
| "total_flos": 6907037114880000.0, |
| "train_loss": 0.2273927664756775, |
| "train_runtime": 627.7316, |
| "train_samples_per_second": 152.932, |
| "train_steps_per_second": 1.912 |
| } |
| ], |
| "max_steps": 1200, |
| "num_train_epochs": 6, |
| "total_flos": 6907037114880000.0, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|