| { |
| "best_metric": 0.848531684698609, |
| "best_model_checkpoint": "deit-base-patch16-224-FV-finetuned-memes/checkpoint-400", |
| "epoch": 19.987654320987655, |
| "global_step": 400, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.49, |
| "learning_rate": 3e-05, |
| "loss": 1.5611, |
| "step": 10 |
| }, |
| { |
| "epoch": 0.99, |
| "learning_rate": 6e-05, |
| "loss": 1.2733, |
| "step": 20 |
| }, |
| { |
| "epoch": 0.99, |
| "eval_accuracy": 0.5811437403400309, |
| "eval_f1": 0.5292880795121996, |
| "eval_loss": 1.0893372297286987, |
| "eval_precision": 0.5790375140189687, |
| "eval_recall": 0.5811437403400309, |
| "eval_runtime": 14.3471, |
| "eval_samples_per_second": 90.193, |
| "eval_steps_per_second": 1.464, |
| "step": 20 |
| }, |
| { |
| "epoch": 1.49, |
| "learning_rate": 9e-05, |
| "loss": 0.9586, |
| "step": 30 |
| }, |
| { |
| "epoch": 1.99, |
| "learning_rate": 0.00012, |
| "loss": 0.7284, |
| "step": 40 |
| }, |
| { |
| "epoch": 1.99, |
| "eval_accuracy": 0.7210200927357032, |
| "eval_f1": 0.7270557661305002, |
| "eval_loss": 0.7350967526435852, |
| "eval_precision": 0.7642254611707266, |
| "eval_recall": 0.7210200927357032, |
| "eval_runtime": 12.1717, |
| "eval_samples_per_second": 106.312, |
| "eval_steps_per_second": 1.725, |
| "step": 40 |
| }, |
| { |
| "epoch": 2.49, |
| "learning_rate": 0.00011666666666666667, |
| "loss": 0.4906, |
| "step": 50 |
| }, |
| { |
| "epoch": 2.99, |
| "learning_rate": 0.00011333333333333333, |
| "loss": 0.4267, |
| "step": 60 |
| }, |
| { |
| "epoch": 2.99, |
| "eval_accuracy": 0.7990726429675425, |
| "eval_f1": 0.8033064919218132, |
| "eval_loss": 0.5202070474624634, |
| "eval_precision": 0.8104410130277757, |
| "eval_recall": 0.7990726429675425, |
| "eval_runtime": 11.9509, |
| "eval_samples_per_second": 108.276, |
| "eval_steps_per_second": 1.757, |
| "step": 60 |
| }, |
| { |
| "epoch": 3.49, |
| "learning_rate": 0.00011, |
| "loss": 0.2421, |
| "step": 70 |
| }, |
| { |
| "epoch": 3.99, |
| "learning_rate": 0.00010666666666666667, |
| "loss": 0.2181, |
| "step": 80 |
| }, |
| { |
| "epoch": 3.99, |
| "eval_accuracy": 0.8346213292117465, |
| "eval_f1": 0.8333748900624175, |
| "eval_loss": 0.4604855477809906, |
| "eval_precision": 0.8350729859390106, |
| "eval_recall": 0.8346213292117465, |
| "eval_runtime": 12.1854, |
| "eval_samples_per_second": 106.193, |
| "eval_steps_per_second": 1.723, |
| "step": 80 |
| }, |
| { |
| "epoch": 4.49, |
| "learning_rate": 0.00010333333333333334, |
| "loss": 0.1358, |
| "step": 90 |
| }, |
| { |
| "epoch": 4.99, |
| "learning_rate": 0.0001, |
| "loss": 0.1504, |
| "step": 100 |
| }, |
| { |
| "epoch": 4.99, |
| "eval_accuracy": 0.8253477588871716, |
| "eval_f1": 0.8265696468740246, |
| "eval_loss": 0.5281366109848022, |
| "eval_precision": 0.828062631171004, |
| "eval_recall": 0.8253477588871716, |
| "eval_runtime": 12.1945, |
| "eval_samples_per_second": 106.113, |
| "eval_steps_per_second": 1.722, |
| "step": 100 |
| }, |
| { |
| "epoch": 5.49, |
| "learning_rate": 9.666666666666667e-05, |
| "loss": 0.0916, |
| "step": 110 |
| }, |
| { |
| "epoch": 5.99, |
| "learning_rate": 9.333333333333334e-05, |
| "loss": 0.1001, |
| "step": 120 |
| }, |
| { |
| "epoch": 5.99, |
| "eval_accuracy": 0.8369397217928902, |
| "eval_f1": 0.8347021830575708, |
| "eval_loss": 0.49452078342437744, |
| "eval_precision": 0.8335589987471665, |
| "eval_recall": 0.8369397217928902, |
| "eval_runtime": 13.7132, |
| "eval_samples_per_second": 94.362, |
| "eval_steps_per_second": 1.531, |
| "step": 120 |
| }, |
| { |
| "epoch": 6.49, |
| "learning_rate": 9e-05, |
| "loss": 0.0693, |
| "step": 130 |
| }, |
| { |
| "epoch": 6.99, |
| "learning_rate": 8.666666666666667e-05, |
| "loss": 0.0874, |
| "step": 140 |
| }, |
| { |
| "epoch": 6.99, |
| "eval_accuracy": 0.8338485316846986, |
| "eval_f1": 0.8347731418598773, |
| "eval_loss": 0.5901951789855957, |
| "eval_precision": 0.8369841836772862, |
| "eval_recall": 0.8338485316846986, |
| "eval_runtime": 12.1626, |
| "eval_samples_per_second": 106.392, |
| "eval_steps_per_second": 1.727, |
| "step": 140 |
| }, |
| { |
| "epoch": 7.49, |
| "learning_rate": 8.333333333333333e-05, |
| "loss": 0.0698, |
| "step": 150 |
| }, |
| { |
| "epoch": 7.99, |
| "learning_rate": 7.999999999999999e-05, |
| "loss": 0.0634, |
| "step": 160 |
| }, |
| { |
| "epoch": 7.99, |
| "eval_accuracy": 0.8253477588871716, |
| "eval_f1": 0.8234470253240962, |
| "eval_loss": 0.6087659597396851, |
| "eval_precision": 0.8221220381584785, |
| "eval_recall": 0.8253477588871716, |
| "eval_runtime": 12.1235, |
| "eval_samples_per_second": 106.735, |
| "eval_steps_per_second": 1.732, |
| "step": 160 |
| }, |
| { |
| "epoch": 8.49, |
| "learning_rate": 7.666666666666667e-05, |
| "loss": 0.065, |
| "step": 170 |
| }, |
| { |
| "epoch": 8.99, |
| "learning_rate": 7.333333333333334e-05, |
| "loss": 0.0699, |
| "step": 180 |
| }, |
| { |
| "epoch": 8.99, |
| "eval_accuracy": 0.8207109737248841, |
| "eval_f1": 0.8185767382509123, |
| "eval_loss": 0.6210456490516663, |
| "eval_precision": 0.8201740897388502, |
| "eval_recall": 0.8207109737248841, |
| "eval_runtime": 12.2668, |
| "eval_samples_per_second": 105.488, |
| "eval_steps_per_second": 1.712, |
| "step": 180 |
| }, |
| { |
| "epoch": 9.49, |
| "learning_rate": 7.000000000000001e-05, |
| "loss": 0.0548, |
| "step": 190 |
| }, |
| { |
| "epoch": 9.99, |
| "learning_rate": 6.666666666666667e-05, |
| "loss": 0.0661, |
| "step": 200 |
| }, |
| { |
| "epoch": 9.99, |
| "eval_accuracy": 0.8384853168469861, |
| "eval_f1": 0.8392602772109944, |
| "eval_loss": 0.567503809928894, |
| "eval_precision": 0.8416984089400088, |
| "eval_recall": 0.8384853168469861, |
| "eval_runtime": 13.1333, |
| "eval_samples_per_second": 98.528, |
| "eval_steps_per_second": 1.599, |
| "step": 200 |
| }, |
| { |
| "epoch": 10.49, |
| "learning_rate": 6.333333333333333e-05, |
| "loss": 0.0584, |
| "step": 210 |
| }, |
| { |
| "epoch": 10.99, |
| "learning_rate": 6e-05, |
| "loss": 0.0592, |
| "step": 220 |
| }, |
| { |
| "epoch": 10.99, |
| "eval_accuracy": 0.8253477588871716, |
| "eval_f1": 0.8275102000168703, |
| "eval_loss": 0.6549890041351318, |
| "eval_precision": 0.8324336806598226, |
| "eval_recall": 0.8253477588871716, |
| "eval_runtime": 12.4308, |
| "eval_samples_per_second": 104.096, |
| "eval_steps_per_second": 1.689, |
| "step": 220 |
| }, |
| { |
| "epoch": 11.49, |
| "learning_rate": 5.6666666666666664e-05, |
| "loss": 0.0547, |
| "step": 230 |
| }, |
| { |
| "epoch": 11.99, |
| "learning_rate": 5.333333333333333e-05, |
| "loss": 0.0559, |
| "step": 240 |
| }, |
| { |
| "epoch": 11.99, |
| "eval_accuracy": 0.8415765069551777, |
| "eval_f1": 0.8386771501165272, |
| "eval_loss": 0.6400041580200195, |
| "eval_precision": 0.8369803259815121, |
| "eval_recall": 0.8415765069551777, |
| "eval_runtime": 12.0827, |
| "eval_samples_per_second": 107.095, |
| "eval_steps_per_second": 1.738, |
| "step": 240 |
| }, |
| { |
| "epoch": 12.49, |
| "learning_rate": 5e-05, |
| "loss": 0.0544, |
| "step": 250 |
| }, |
| { |
| "epoch": 12.99, |
| "learning_rate": 4.666666666666667e-05, |
| "loss": 0.0501, |
| "step": 260 |
| }, |
| { |
| "epoch": 12.99, |
| "eval_accuracy": 0.839258114374034, |
| "eval_f1": 0.8349827197339503, |
| "eval_loss": 0.6725842952728271, |
| "eval_precision": 0.8352807610136271, |
| "eval_recall": 0.839258114374034, |
| "eval_runtime": 12.235, |
| "eval_samples_per_second": 105.762, |
| "eval_steps_per_second": 1.716, |
| "step": 260 |
| }, |
| { |
| "epoch": 13.49, |
| "learning_rate": 4.3333333333333334e-05, |
| "loss": 0.0504, |
| "step": 270 |
| }, |
| { |
| "epoch": 13.99, |
| "learning_rate": 3.9999999999999996e-05, |
| "loss": 0.0529, |
| "step": 280 |
| }, |
| { |
| "epoch": 13.99, |
| "eval_accuracy": 0.8408037094281299, |
| "eval_f1": 0.8401045386097177, |
| "eval_loss": 0.6284657120704651, |
| "eval_precision": 0.8399002499413157, |
| "eval_recall": 0.8408037094281299, |
| "eval_runtime": 12.1571, |
| "eval_samples_per_second": 106.44, |
| "eval_steps_per_second": 1.727, |
| "step": 280 |
| }, |
| { |
| "epoch": 14.49, |
| "learning_rate": 3.666666666666667e-05, |
| "loss": 0.0483, |
| "step": 290 |
| }, |
| { |
| "epoch": 14.99, |
| "learning_rate": 3.3333333333333335e-05, |
| "loss": 0.0478, |
| "step": 300 |
| }, |
| { |
| "epoch": 14.99, |
| "eval_accuracy": 0.8400309119010819, |
| "eval_f1": 0.8384325271224449, |
| "eval_loss": 0.6423028707504272, |
| "eval_precision": 0.8380083960258947, |
| "eval_recall": 0.8400309119010819, |
| "eval_runtime": 13.5896, |
| "eval_samples_per_second": 95.22, |
| "eval_steps_per_second": 1.545, |
| "step": 300 |
| }, |
| { |
| "epoch": 15.49, |
| "learning_rate": 3e-05, |
| "loss": 0.0511, |
| "step": 310 |
| }, |
| { |
| "epoch": 15.99, |
| "learning_rate": 2.6666666666666667e-05, |
| "loss": 0.0458, |
| "step": 320 |
| }, |
| { |
| "epoch": 15.99, |
| "eval_accuracy": 0.8369397217928902, |
| "eval_f1": 0.8347511755501414, |
| "eval_loss": 0.6632058620452881, |
| "eval_precision": 0.8336581851460658, |
| "eval_recall": 0.8369397217928902, |
| "eval_runtime": 12.2903, |
| "eval_samples_per_second": 105.286, |
| "eval_steps_per_second": 1.709, |
| "step": 320 |
| }, |
| { |
| "epoch": 16.49, |
| "learning_rate": 2.3333333333333336e-05, |
| "loss": 0.044, |
| "step": 330 |
| }, |
| { |
| "epoch": 16.99, |
| "learning_rate": 1.9999999999999998e-05, |
| "loss": 0.048, |
| "step": 340 |
| }, |
| { |
| "epoch": 16.99, |
| "eval_accuracy": 0.8423493044822257, |
| "eval_f1": 0.8403953031110398, |
| "eval_loss": 0.6718657612800598, |
| "eval_precision": 0.8400986650043714, |
| "eval_recall": 0.8423493044822257, |
| "eval_runtime": 12.1549, |
| "eval_samples_per_second": 106.459, |
| "eval_steps_per_second": 1.728, |
| "step": 340 |
| }, |
| { |
| "epoch": 17.49, |
| "learning_rate": 1.6666666666666667e-05, |
| "loss": 0.0531, |
| "step": 350 |
| }, |
| { |
| "epoch": 17.99, |
| "learning_rate": 1.3333333333333333e-05, |
| "loss": 0.0417, |
| "step": 360 |
| }, |
| { |
| "epoch": 17.99, |
| "eval_accuracy": 0.8423493044822257, |
| "eval_f1": 0.8408137285370694, |
| "eval_loss": 0.6807297468185425, |
| "eval_precision": 0.8414734958978292, |
| "eval_recall": 0.8423493044822257, |
| "eval_runtime": 12.1578, |
| "eval_samples_per_second": 106.434, |
| "eval_steps_per_second": 1.727, |
| "step": 360 |
| }, |
| { |
| "epoch": 18.49, |
| "learning_rate": 9.999999999999999e-06, |
| "loss": 0.0463, |
| "step": 370 |
| }, |
| { |
| "epoch": 18.99, |
| "learning_rate": 6.666666666666667e-06, |
| "loss": 0.0461, |
| "step": 380 |
| }, |
| { |
| "epoch": 18.99, |
| "eval_accuracy": 0.8454404945904173, |
| "eval_f1": 0.8437536089910989, |
| "eval_loss": 0.6732441782951355, |
| "eval_precision": 0.8439655958777214, |
| "eval_recall": 0.8454404945904173, |
| "eval_runtime": 12.2922, |
| "eval_samples_per_second": 105.27, |
| "eval_steps_per_second": 1.708, |
| "step": 380 |
| }, |
| { |
| "epoch": 19.49, |
| "learning_rate": 3.3333333333333333e-06, |
| "loss": 0.0467, |
| "step": 390 |
| }, |
| { |
| "epoch": 19.99, |
| "learning_rate": 0.0, |
| "loss": 0.044, |
| "step": 400 |
| }, |
| { |
| "epoch": 19.99, |
| "eval_accuracy": 0.848531684698609, |
| "eval_f1": 0.8463625265241504, |
| "eval_loss": 0.6769371628761292, |
| "eval_precision": 0.8458069264500935, |
| "eval_recall": 0.848531684698609, |
| "eval_runtime": 13.4679, |
| "eval_samples_per_second": 96.08, |
| "eval_steps_per_second": 1.559, |
| "step": 400 |
| }, |
| { |
| "epoch": 19.99, |
| "step": 400, |
| "total_flos": 8.014902017179374e+18, |
| "train_loss": 0.19803269907832147, |
| "train_runtime": 1524.6859, |
| "train_samples_per_second": 67.87, |
| "train_steps_per_second": 0.262 |
| } |
| ], |
| "max_steps": 400, |
| "num_train_epochs": 20, |
| "total_flos": 8.014902017179374e+18, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|