| { | |
| "best_metric": 1.1392158269882202, | |
| "best_model_checkpoint": "./vit-artworkclassifier\\checkpoint-600", | |
| "epoch": 4.0, | |
| "global_step": 1112, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 0.18, | |
| "learning_rate": 9.550359712230216e-05, | |
| "loss": 1.9425, | |
| "step": 50 | |
| }, | |
| { | |
| "epoch": 0.36, | |
| "learning_rate": 9.100719424460432e-05, | |
| "loss": 1.5906, | |
| "step": 100 | |
| }, | |
| { | |
| "epoch": 0.36, | |
| "eval_accuracy": 0.48467650397275824, | |
| "eval_loss": 1.4708987474441528, | |
| "eval_runtime": 7.3715, | |
| "eval_samples_per_second": 119.514, | |
| "eval_steps_per_second": 15.058, | |
| "step": 100 | |
| }, | |
| { | |
| "epoch": 0.54, | |
| "learning_rate": 8.651079136690648e-05, | |
| "loss": 1.4388, | |
| "step": 150 | |
| }, | |
| { | |
| "epoch": 0.72, | |
| "learning_rate": 8.201438848920863e-05, | |
| "loss": 1.3395, | |
| "step": 200 | |
| }, | |
| { | |
| "epoch": 0.72, | |
| "eval_accuracy": 0.5073779795686719, | |
| "eval_loss": 1.3207731246948242, | |
| "eval_runtime": 7.4035, | |
| "eval_samples_per_second": 118.998, | |
| "eval_steps_per_second": 14.993, | |
| "step": 200 | |
| }, | |
| { | |
| "epoch": 0.9, | |
| "learning_rate": 7.751798561151079e-05, | |
| "loss": 1.3275, | |
| "step": 250 | |
| }, | |
| { | |
| "epoch": 1.08, | |
| "learning_rate": 7.302158273381295e-05, | |
| "loss": 1.1461, | |
| "step": 300 | |
| }, | |
| { | |
| "epoch": 1.08, | |
| "eval_accuracy": 0.5164585698070374, | |
| "eval_loss": 1.3362975120544434, | |
| "eval_runtime": 7.64, | |
| "eval_samples_per_second": 115.314, | |
| "eval_steps_per_second": 14.529, | |
| "step": 300 | |
| }, | |
| { | |
| "epoch": 1.26, | |
| "learning_rate": 6.852517985611511e-05, | |
| "loss": 0.9749, | |
| "step": 350 | |
| }, | |
| { | |
| "epoch": 1.44, | |
| "learning_rate": 6.402877697841726e-05, | |
| "loss": 0.9593, | |
| "step": 400 | |
| }, | |
| { | |
| "epoch": 1.44, | |
| "eval_accuracy": 0.5845629965947786, | |
| "eval_loss": 1.1789547204971313, | |
| "eval_runtime": 7.248, | |
| "eval_samples_per_second": 121.551, | |
| "eval_steps_per_second": 15.315, | |
| "step": 400 | |
| }, | |
| { | |
| "epoch": 1.62, | |
| "learning_rate": 5.953237410071942e-05, | |
| "loss": 0.9175, | |
| "step": 450 | |
| }, | |
| { | |
| "epoch": 1.8, | |
| "learning_rate": 5.512589928057554e-05, | |
| "loss": 0.8761, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 1.8, | |
| "eval_accuracy": 0.5902383654937571, | |
| "eval_loss": 1.1252126693725586, | |
| "eval_runtime": 7.2535, | |
| "eval_samples_per_second": 121.459, | |
| "eval_steps_per_second": 15.303, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 1.98, | |
| "learning_rate": 5.06294964028777e-05, | |
| "loss": 0.8615, | |
| "step": 550 | |
| }, | |
| { | |
| "epoch": 2.16, | |
| "learning_rate": 4.613309352517986e-05, | |
| "loss": 0.5922, | |
| "step": 600 | |
| }, | |
| { | |
| "epoch": 2.16, | |
| "eval_accuracy": 0.5947786606129398, | |
| "eval_loss": 1.1392158269882202, | |
| "eval_runtime": 7.5695, | |
| "eval_samples_per_second": 116.388, | |
| "eval_steps_per_second": 14.664, | |
| "step": 600 | |
| }, | |
| { | |
| "epoch": 2.34, | |
| "learning_rate": 4.163669064748202e-05, | |
| "loss": 0.4684, | |
| "step": 650 | |
| }, | |
| { | |
| "epoch": 2.52, | |
| "learning_rate": 3.714028776978418e-05, | |
| "loss": 0.4803, | |
| "step": 700 | |
| }, | |
| { | |
| "epoch": 2.52, | |
| "eval_accuracy": 0.5936435868331441, | |
| "eval_loss": 1.1560313701629639, | |
| "eval_runtime": 7.3175, | |
| "eval_samples_per_second": 120.396, | |
| "eval_steps_per_second": 15.169, | |
| "step": 700 | |
| }, | |
| { | |
| "epoch": 2.7, | |
| "learning_rate": 3.2643884892086335e-05, | |
| "loss": 0.4766, | |
| "step": 750 | |
| }, | |
| { | |
| "epoch": 2.88, | |
| "learning_rate": 2.8147482014388493e-05, | |
| "loss": 0.4454, | |
| "step": 800 | |
| }, | |
| { | |
| "epoch": 2.88, | |
| "eval_accuracy": 0.6118047673098751, | |
| "eval_loss": 1.1545273065567017, | |
| "eval_runtime": 7.2475, | |
| "eval_samples_per_second": 121.559, | |
| "eval_steps_per_second": 15.316, | |
| "step": 800 | |
| }, | |
| { | |
| "epoch": 3.06, | |
| "learning_rate": 2.3651079136690647e-05, | |
| "loss": 0.371, | |
| "step": 850 | |
| }, | |
| { | |
| "epoch": 3.24, | |
| "learning_rate": 1.9154676258992808e-05, | |
| "loss": 0.2271, | |
| "step": 900 | |
| }, | |
| { | |
| "epoch": 3.24, | |
| "eval_accuracy": 0.6038592508513053, | |
| "eval_loss": 1.2283731698989868, | |
| "eval_runtime": 7.1705, | |
| "eval_samples_per_second": 122.865, | |
| "eval_steps_per_second": 15.48, | |
| "step": 900 | |
| }, | |
| { | |
| "epoch": 3.42, | |
| "learning_rate": 1.4658273381294965e-05, | |
| "loss": 0.2249, | |
| "step": 950 | |
| }, | |
| { | |
| "epoch": 3.6, | |
| "learning_rate": 1.0161870503597123e-05, | |
| "loss": 0.207, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 3.6, | |
| "eval_accuracy": 0.5959137343927355, | |
| "eval_loss": 1.262502670288086, | |
| "eval_runtime": 7.2385, | |
| "eval_samples_per_second": 121.71, | |
| "eval_steps_per_second": 15.335, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 3.78, | |
| "learning_rate": 5.665467625899281e-06, | |
| "loss": 0.1906, | |
| "step": 1050 | |
| }, | |
| { | |
| "epoch": 3.96, | |
| "learning_rate": 1.169064748201439e-06, | |
| "loss": 0.1958, | |
| "step": 1100 | |
| }, | |
| { | |
| "epoch": 3.96, | |
| "eval_accuracy": 0.6004540295119183, | |
| "eval_loss": 1.262100338935852, | |
| "eval_runtime": 7.2855, | |
| "eval_samples_per_second": 120.925, | |
| "eval_steps_per_second": 15.236, | |
| "step": 1100 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "step": 1112, | |
| "total_flos": 2.7542380976164454e+18, | |
| "train_loss": 0.7775138853479633, | |
| "train_runtime": 613.7183, | |
| "train_samples_per_second": 57.909, | |
| "train_steps_per_second": 1.812 | |
| } | |
| ], | |
| "max_steps": 1112, | |
| "num_train_epochs": 4, | |
| "total_flos": 2.7542380976164454e+18, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |