| { |
| "best_metric": 0.07841455936431885, |
| "best_model_checkpoint": "./vit-base-beans/checkpoint-280", |
| "epoch": 0.7608695652173914, |
| "global_step": 280, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.03, |
| "learning_rate": 0.00019322033898305085, |
| "loss": 0.6554, |
| "step": 10 |
| }, |
| { |
| "epoch": 0.05, |
| "learning_rate": 0.0001864406779661017, |
| "loss": 0.306, |
| "step": 20 |
| }, |
| { |
| "epoch": 0.08, |
| "learning_rate": 0.00017966101694915257, |
| "loss": 0.267, |
| "step": 30 |
| }, |
| { |
| "epoch": 0.11, |
| "learning_rate": 0.00017288135593220342, |
| "loss": 0.2825, |
| "step": 40 |
| }, |
| { |
| "epoch": 0.11, |
| "eval_accuracy": 0.9318801089918256, |
| "eval_loss": 0.2294050008058548, |
| "eval_runtime": 16.8062, |
| "eval_samples_per_second": 43.674, |
| "eval_steps_per_second": 5.474, |
| "step": 40 |
| }, |
| { |
| "epoch": 0.14, |
| "learning_rate": 0.00016610169491525423, |
| "loss": 0.3097, |
| "step": 50 |
| }, |
| { |
| "epoch": 0.16, |
| "learning_rate": 0.00015932203389830508, |
| "loss": 0.2772, |
| "step": 60 |
| }, |
| { |
| "epoch": 0.19, |
| "learning_rate": 0.00015254237288135592, |
| "loss": 0.1711, |
| "step": 70 |
| }, |
| { |
| "epoch": 0.22, |
| "learning_rate": 0.00014576271186440677, |
| "loss": 0.1483, |
| "step": 80 |
| }, |
| { |
| "epoch": 0.22, |
| "eval_accuracy": 0.944141689373297, |
| "eval_loss": 0.16020944714546204, |
| "eval_runtime": 17.3798, |
| "eval_samples_per_second": 42.233, |
| "eval_steps_per_second": 5.294, |
| "step": 80 |
| }, |
| { |
| "epoch": 0.24, |
| "learning_rate": 0.00013898305084745764, |
| "loss": 0.2356, |
| "step": 90 |
| }, |
| { |
| "epoch": 0.27, |
| "learning_rate": 0.00013220338983050849, |
| "loss": 0.1144, |
| "step": 100 |
| }, |
| { |
| "epoch": 0.3, |
| "learning_rate": 0.00012542372881355933, |
| "loss": 0.2216, |
| "step": 110 |
| }, |
| { |
| "epoch": 0.33, |
| "learning_rate": 0.00011864406779661017, |
| "loss": 0.2209, |
| "step": 120 |
| }, |
| { |
| "epoch": 0.33, |
| "eval_accuracy": 0.829700272479564, |
| "eval_loss": 0.29767370223999023, |
| "eval_runtime": 17.13, |
| "eval_samples_per_second": 42.849, |
| "eval_steps_per_second": 5.371, |
| "step": 120 |
| }, |
| { |
| "epoch": 0.35, |
| "learning_rate": 0.00011186440677966102, |
| "loss": 0.2153, |
| "step": 130 |
| }, |
| { |
| "epoch": 0.38, |
| "learning_rate": 0.00010508474576271188, |
| "loss": 0.1693, |
| "step": 140 |
| }, |
| { |
| "epoch": 0.41, |
| "learning_rate": 9.830508474576272e-05, |
| "loss": 0.1625, |
| "step": 150 |
| }, |
| { |
| "epoch": 0.43, |
| "learning_rate": 9.152542372881357e-05, |
| "loss": 0.1384, |
| "step": 160 |
| }, |
| { |
| "epoch": 0.43, |
| "eval_accuracy": 0.9645776566757494, |
| "eval_loss": 0.10578873753547668, |
| "eval_runtime": 16.6083, |
| "eval_samples_per_second": 44.195, |
| "eval_steps_per_second": 5.539, |
| "step": 160 |
| }, |
| { |
| "epoch": 0.46, |
| "learning_rate": 8.474576271186441e-05, |
| "loss": 0.1371, |
| "step": 170 |
| }, |
| { |
| "epoch": 0.49, |
| "learning_rate": 7.796610169491526e-05, |
| "loss": 0.1355, |
| "step": 180 |
| }, |
| { |
| "epoch": 0.52, |
| "learning_rate": 7.11864406779661e-05, |
| "loss": 0.1557, |
| "step": 190 |
| }, |
| { |
| "epoch": 0.54, |
| "learning_rate": 6.440677966101695e-05, |
| "loss": 0.1551, |
| "step": 200 |
| }, |
| { |
| "epoch": 0.54, |
| "eval_accuracy": 0.9114441416893733, |
| "eval_loss": 0.1725204885005951, |
| "eval_runtime": 17.0671, |
| "eval_samples_per_second": 43.007, |
| "eval_steps_per_second": 5.39, |
| "step": 200 |
| }, |
| { |
| "epoch": 0.57, |
| "learning_rate": 5.76271186440678e-05, |
| "loss": 0.2091, |
| "step": 210 |
| }, |
| { |
| "epoch": 0.6, |
| "learning_rate": 5.0847457627118643e-05, |
| "loss": 0.1313, |
| "step": 220 |
| }, |
| { |
| "epoch": 0.62, |
| "learning_rate": 4.4067796610169495e-05, |
| "loss": 0.1056, |
| "step": 230 |
| }, |
| { |
| "epoch": 0.65, |
| "learning_rate": 3.728813559322034e-05, |
| "loss": 0.1608, |
| "step": 240 |
| }, |
| { |
| "epoch": 0.65, |
| "eval_accuracy": 0.9673024523160763, |
| "eval_loss": 0.09211871027946472, |
| "eval_runtime": 16.6063, |
| "eval_samples_per_second": 44.2, |
| "eval_steps_per_second": 5.54, |
| "step": 240 |
| }, |
| { |
| "epoch": 0.68, |
| "learning_rate": 3.050847457627119e-05, |
| "loss": 0.0761, |
| "step": 250 |
| }, |
| { |
| "epoch": 0.71, |
| "learning_rate": 2.3728813559322036e-05, |
| "loss": 0.1044, |
| "step": 260 |
| }, |
| { |
| "epoch": 0.73, |
| "learning_rate": 1.694915254237288e-05, |
| "loss": 0.1141, |
| "step": 270 |
| }, |
| { |
| "epoch": 0.76, |
| "learning_rate": 1.016949152542373e-05, |
| "loss": 0.12, |
| "step": 280 |
| }, |
| { |
| "epoch": 0.76, |
| "eval_accuracy": 0.9754768392370572, |
| "eval_loss": 0.07841455936431885, |
| "eval_runtime": 16.7459, |
| "eval_samples_per_second": 43.832, |
| "eval_steps_per_second": 5.494, |
| "step": 280 |
| } |
| ], |
| "max_steps": 295, |
| "num_train_epochs": 1, |
| "total_flos": 3.471672249955123e+17, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|