| { | |
| "best_metric": 0.9571847507331379, | |
| "best_model_checkpoint": "twitter-roberta-base-CoNLL/checkpoint-2000", | |
| "epoch": 10.0, | |
| "global_step": 2200, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 0.11, | |
| "eval_accuracy": 0.9385927339278065, | |
| "eval_f1": 0.6587314799400699, | |
| "eval_loss": 0.2062799483537674, | |
| "eval_precision": 0.6516798418972332, | |
| "eval_recall": 0.6659373948165601, | |
| "eval_runtime": 5.976, | |
| "eval_samples_per_second": 544.011, | |
| "eval_steps_per_second": 0.669, | |
| "step": 25 | |
| }, | |
| { | |
| "epoch": 0.23, | |
| "eval_accuracy": 0.9771231649857871, | |
| "eval_f1": 0.8565321055660609, | |
| "eval_loss": 0.08096875995397568, | |
| "eval_precision": 0.8373251888763864, | |
| "eval_recall": 0.8766408616627398, | |
| "eval_runtime": 6.2407, | |
| "eval_samples_per_second": 520.938, | |
| "eval_steps_per_second": 0.641, | |
| "step": 50 | |
| }, | |
| { | |
| "epoch": 0.34, | |
| "eval_accuracy": 0.9826914839764807, | |
| "eval_f1": 0.8996990972918756, | |
| "eval_loss": 0.06511491537094116, | |
| "eval_precision": 0.8937230156094321, | |
| "eval_recall": 0.9057556378323797, | |
| "eval_runtime": 6.0069, | |
| "eval_samples_per_second": 541.208, | |
| "eval_steps_per_second": 0.666, | |
| "step": 75 | |
| }, | |
| { | |
| "epoch": 0.45, | |
| "eval_accuracy": 0.9849110237140298, | |
| "eval_f1": 0.907388833166165, | |
| "eval_loss": 0.05366199463605881, | |
| "eval_precision": 0.9013616738625041, | |
| "eval_recall": 0.9134971390104342, | |
| "eval_runtime": 6.3828, | |
| "eval_samples_per_second": 509.335, | |
| "eval_steps_per_second": 0.627, | |
| "step": 100 | |
| }, | |
| { | |
| "epoch": 0.57, | |
| "eval_accuracy": 0.986682761574705, | |
| "eval_f1": 0.9170283806343906, | |
| "eval_loss": 0.04637985676527023, | |
| "eval_precision": 0.9097383239483272, | |
| "eval_recall": 0.924436216762033, | |
| "eval_runtime": 6.0475, | |
| "eval_samples_per_second": 537.576, | |
| "eval_steps_per_second": 0.661, | |
| "step": 125 | |
| }, | |
| { | |
| "epoch": 0.68, | |
| "eval_accuracy": 0.9884544994353802, | |
| "eval_f1": 0.9296410942859533, | |
| "eval_loss": 0.042301442474126816, | |
| "eval_precision": 0.9243054400266179, | |
| "eval_recall": 0.9350387075058902, | |
| "eval_runtime": 6.0733, | |
| "eval_samples_per_second": 535.298, | |
| "eval_steps_per_second": 0.659, | |
| "step": 150 | |
| }, | |
| { | |
| "epoch": 0.8, | |
| "eval_accuracy": 0.9899731318873876, | |
| "eval_f1": 0.934277384423157, | |
| "eval_loss": 0.038059305399656296, | |
| "eval_precision": 0.9249546429160481, | |
| "eval_recall": 0.9437899697071693, | |
| "eval_runtime": 6.3028, | |
| "eval_samples_per_second": 515.805, | |
| "eval_steps_per_second": 0.635, | |
| "step": 175 | |
| }, | |
| { | |
| "epoch": 0.91, | |
| "eval_accuracy": 0.9895642693041549, | |
| "eval_f1": 0.9354220481626531, | |
| "eval_loss": 0.038840554654598236, | |
| "eval_precision": 0.9263904934807724, | |
| "eval_recall": 0.9446314372265231, | |
| "eval_runtime": 6.0497, | |
| "eval_samples_per_second": 537.384, | |
| "eval_steps_per_second": 0.661, | |
| "step": 200 | |
| }, | |
| { | |
| "epoch": 1.02, | |
| "eval_accuracy": 0.9898368443596434, | |
| "eval_f1": 0.9384409501505521, | |
| "eval_loss": 0.03943933546543121, | |
| "eval_precision": 0.9328234120385767, | |
| "eval_recall": 0.9441265567149109, | |
| "eval_runtime": 6.4439, | |
| "eval_samples_per_second": 504.505, | |
| "eval_steps_per_second": 0.621, | |
| "step": 225 | |
| }, | |
| { | |
| "epoch": 1.14, | |
| "eval_accuracy": 0.9895837389509754, | |
| "eval_f1": 0.9402710389827672, | |
| "eval_loss": 0.042259786278009415, | |
| "eval_precision": 0.9347970725216235, | |
| "eval_recall": 0.9458094917536183, | |
| "eval_runtime": 6.16, | |
| "eval_samples_per_second": 527.761, | |
| "eval_steps_per_second": 0.649, | |
| "step": 250 | |
| }, | |
| { | |
| "epoch": 1.25, | |
| "eval_accuracy": 0.9892138156613839, | |
| "eval_f1": 0.9354757720311323, | |
| "eval_loss": 0.04323225095868111, | |
| "eval_precision": 0.9304145163975363, | |
| "eval_recall": 0.9405923931336251, | |
| "eval_runtime": 6.3592, | |
| "eval_samples_per_second": 511.225, | |
| "eval_steps_per_second": 0.629, | |
| "step": 275 | |
| }, | |
| { | |
| "epoch": 1.36, | |
| "eval_accuracy": 0.9900899497683112, | |
| "eval_f1": 0.9432760787599497, | |
| "eval_loss": 0.03824295476078987, | |
| "eval_precision": 0.9392624728850325, | |
| "eval_recall": 0.9473241332884551, | |
| "eval_runtime": 6.1034, | |
| "eval_samples_per_second": 532.654, | |
| "eval_steps_per_second": 0.655, | |
| "step": 300 | |
| }, | |
| { | |
| "epoch": 1.48, | |
| "eval_accuracy": 0.99005101047467, | |
| "eval_f1": 0.9414020171709594, | |
| "eval_loss": 0.0380987711250782, | |
| "eval_precision": 0.932617671345995, | |
| "eval_recall": 0.9503534163581285, | |
| "eval_runtime": 6.1204, | |
| "eval_samples_per_second": 531.176, | |
| "eval_steps_per_second": 0.654, | |
| "step": 325 | |
| }, | |
| { | |
| "epoch": 1.59, | |
| "eval_accuracy": 0.9902262372960554, | |
| "eval_f1": 0.9429309339331834, | |
| "eval_loss": 0.03868376836180687, | |
| "eval_precision": 0.933674311169774, | |
| "eval_recall": 0.9523729384045776, | |
| "eval_runtime": 6.3273, | |
| "eval_samples_per_second": 513.801, | |
| "eval_steps_per_second": 0.632, | |
| "step": 350 | |
| }, | |
| { | |
| "epoch": 1.7, | |
| "eval_accuracy": 0.990148358708773, | |
| "eval_f1": 0.9439181825802665, | |
| "eval_loss": 0.03645554929971695, | |
| "eval_precision": 0.9403708034073827, | |
| "eval_recall": 0.9474924267923258, | |
| "eval_runtime": 6.2492, | |
| "eval_samples_per_second": 520.224, | |
| "eval_steps_per_second": 0.64, | |
| "step": 375 | |
| }, | |
| { | |
| "epoch": 1.82, | |
| "eval_accuracy": 0.9905182819983646, | |
| "eval_f1": 0.9473948735131512, | |
| "eval_loss": 0.0382225401699543, | |
| "eval_precision": 0.9431287525016678, | |
| "eval_recall": 0.9516997643890945, | |
| "eval_runtime": 6.4588, | |
| "eval_samples_per_second": 503.348, | |
| "eval_steps_per_second": 0.619, | |
| "step": 400 | |
| }, | |
| { | |
| "epoch": 1.93, | |
| "eval_accuracy": 0.9903235855301585, | |
| "eval_f1": 0.9460837582546184, | |
| "eval_loss": 0.03733981028199196, | |
| "eval_precision": 0.9398770968277694, | |
| "eval_recall": 0.9523729384045776, | |
| "eval_runtime": 6.1594, | |
| "eval_samples_per_second": 527.813, | |
| "eval_steps_per_second": 0.649, | |
| "step": 425 | |
| }, | |
| { | |
| "epoch": 2.05, | |
| "eval_accuracy": 0.9910439624625209, | |
| "eval_f1": 0.9497365559923059, | |
| "eval_loss": 0.03666611388325691, | |
| "eval_precision": 0.943973399833749, | |
| "eval_recall": 0.9555705149781218, | |
| "eval_runtime": 6.4014, | |
| "eval_samples_per_second": 507.859, | |
| "eval_steps_per_second": 0.625, | |
| "step": 450 | |
| }, | |
| { | |
| "epoch": 2.16, | |
| "eval_accuracy": 0.99069350881975, | |
| "eval_f1": 0.9474914433592119, | |
| "eval_loss": 0.03960287570953369, | |
| "eval_precision": 0.9400364419413616, | |
| "eval_recall": 0.9550656344665096, | |
| "eval_runtime": 6.2344, | |
| "eval_samples_per_second": 521.465, | |
| "eval_steps_per_second": 0.642, | |
| "step": 475 | |
| }, | |
| { | |
| "epoch": 2.27, | |
| "learning_rate": 4.636363636363636e-05, | |
| "loss": 0.0771, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 2.27, | |
| "eval_accuracy": 0.991238658930727, | |
| "eval_f1": 0.9507813152836967, | |
| "eval_loss": 0.035283163189888, | |
| "eval_precision": 0.9442323651452282, | |
| "eval_recall": 0.9574217435207001, | |
| "eval_runtime": 6.1631, | |
| "eval_samples_per_second": 527.493, | |
| "eval_steps_per_second": 0.649, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 2.39, | |
| "eval_accuracy": 0.9905572212920057, | |
| "eval_f1": 0.9453602209020165, | |
| "eval_loss": 0.03937030956149101, | |
| "eval_precision": 0.9400898652021967, | |
| "eval_recall": 0.9506900033658701, | |
| "eval_runtime": 6.243, | |
| "eval_samples_per_second": 520.742, | |
| "eval_steps_per_second": 0.641, | |
| "step": 525 | |
| }, | |
| { | |
| "epoch": 2.5, | |
| "eval_accuracy": 0.9909660838752385, | |
| "eval_f1": 0.9484536082474228, | |
| "eval_loss": 0.036998968571424484, | |
| "eval_precision": 0.9447320086825848, | |
| "eval_recall": 0.9522046449007069, | |
| "eval_runtime": 6.0773, | |
| "eval_samples_per_second": 534.945, | |
| "eval_steps_per_second": 0.658, | |
| "step": 550 | |
| }, | |
| { | |
| "epoch": 2.61, | |
| "eval_accuracy": 0.9908492659943149, | |
| "eval_f1": 0.9472013366750209, | |
| "eval_loss": 0.035233963280916214, | |
| "eval_precision": 0.940444591904446, | |
| "eval_recall": 0.9540558734432851, | |
| "eval_runtime": 6.3038, | |
| "eval_samples_per_second": 515.72, | |
| "eval_steps_per_second": 0.635, | |
| "step": 575 | |
| }, | |
| { | |
| "epoch": 2.73, | |
| "eval_accuracy": 0.9908103267006737, | |
| "eval_f1": 0.9448281601065159, | |
| "eval_loss": 0.0385683998465538, | |
| "eval_precision": 0.9344855967078189, | |
| "eval_recall": 0.9554022214742511, | |
| "eval_runtime": 6.1499, | |
| "eval_samples_per_second": 528.629, | |
| "eval_steps_per_second": 0.65, | |
| "step": 600 | |
| }, | |
| { | |
| "epoch": 2.84, | |
| "eval_accuracy": 0.9916280518671391, | |
| "eval_f1": 0.9501544627202138, | |
| "eval_loss": 0.036591168493032455, | |
| "eval_precision": 0.9428334714167357, | |
| "eval_recall": 0.9575900370245709, | |
| "eval_runtime": 6.1996, | |
| "eval_samples_per_second": 524.389, | |
| "eval_steps_per_second": 0.645, | |
| "step": 625 | |
| }, | |
| { | |
| "epoch": 2.95, | |
| "eval_accuracy": 0.9913360071648301, | |
| "eval_f1": 0.948574295509658, | |
| "eval_loss": 0.035347189754247665, | |
| "eval_precision": 0.9426624563736081, | |
| "eval_recall": 0.9545607539548974, | |
| "eval_runtime": 6.4287, | |
| "eval_samples_per_second": 505.702, | |
| "eval_steps_per_second": 0.622, | |
| "step": 650 | |
| }, | |
| { | |
| "epoch": 3.07, | |
| "eval_accuracy": 0.9911023714029827, | |
| "eval_f1": 0.9477730425336343, | |
| "eval_loss": 0.035899706184864044, | |
| "eval_precision": 0.9412448132780084, | |
| "eval_recall": 0.9543924604510265, | |
| "eval_runtime": 6.1591, | |
| "eval_samples_per_second": 527.837, | |
| "eval_steps_per_second": 0.649, | |
| "step": 675 | |
| }, | |
| { | |
| "epoch": 3.18, | |
| "eval_accuracy": 0.9919979751567306, | |
| "eval_f1": 0.9534164087981936, | |
| "eval_loss": 0.0355631485581398, | |
| "eval_precision": 0.9476309226932669, | |
| "eval_recall": 0.9592729720632783, | |
| "eval_runtime": 6.1923, | |
| "eval_samples_per_second": 525.005, | |
| "eval_steps_per_second": 0.646, | |
| "step": 700 | |
| }, | |
| { | |
| "epoch": 3.3, | |
| "eval_accuracy": 0.9918422179821658, | |
| "eval_f1": 0.953465015065283, | |
| "eval_loss": 0.03445196524262428, | |
| "eval_precision": 0.9483849483849484, | |
| "eval_recall": 0.9585997980477954, | |
| "eval_runtime": 6.3335, | |
| "eval_samples_per_second": 513.302, | |
| "eval_steps_per_second": 0.632, | |
| "step": 725 | |
| }, | |
| { | |
| "epoch": 3.41, | |
| "eval_accuracy": 0.9915696429266773, | |
| "eval_f1": 0.9491893698813304, | |
| "eval_loss": 0.03445504605770111, | |
| "eval_precision": 0.9427290836653387, | |
| "eval_recall": 0.9557388084819926, | |
| "eval_runtime": 6.1661, | |
| "eval_samples_per_second": 527.234, | |
| "eval_steps_per_second": 0.649, | |
| "step": 750 | |
| }, | |
| { | |
| "epoch": 3.52, | |
| "eval_accuracy": 0.9913944161052919, | |
| "eval_f1": 0.9478246374395733, | |
| "eval_loss": 0.03635535016655922, | |
| "eval_precision": 0.9389035667107001, | |
| "eval_recall": 0.9569168630090878, | |
| "eval_runtime": 6.4373, | |
| "eval_samples_per_second": 505.028, | |
| "eval_steps_per_second": 0.621, | |
| "step": 775 | |
| }, | |
| { | |
| "epoch": 3.64, | |
| "eval_accuracy": 0.9914917643393949, | |
| "eval_f1": 0.95067189717052, | |
| "eval_loss": 0.03599384054541588, | |
| "eval_precision": 0.943036926643484, | |
| "eval_recall": 0.9584315045439246, | |
| "eval_runtime": 6.1546, | |
| "eval_samples_per_second": 528.219, | |
| "eval_steps_per_second": 0.65, | |
| "step": 800 | |
| }, | |
| { | |
| "epoch": 3.75, | |
| "eval_accuracy": 0.9914528250457537, | |
| "eval_f1": 0.950514945993469, | |
| "eval_loss": 0.03866244852542877, | |
| "eval_precision": 0.9458423596067322, | |
| "eval_recall": 0.9552339279703803, | |
| "eval_runtime": 6.3798, | |
| "eval_samples_per_second": 509.575, | |
| "eval_steps_per_second": 0.627, | |
| "step": 825 | |
| }, | |
| { | |
| "epoch": 3.86, | |
| "eval_accuracy": 0.9917059304544216, | |
| "eval_f1": 0.9521419009370816, | |
| "eval_loss": 0.034695982933044434, | |
| "eval_precision": 0.9467554076539102, | |
| "eval_recall": 0.9575900370245709, | |
| "eval_runtime": 6.175, | |
| "eval_samples_per_second": 526.482, | |
| "eval_steps_per_second": 0.648, | |
| "step": 850 | |
| }, | |
| { | |
| "epoch": 3.98, | |
| "eval_accuracy": 0.9915307036330361, | |
| "eval_f1": 0.9509402423735897, | |
| "eval_loss": 0.03567422926425934, | |
| "eval_precision": 0.9445459073551387, | |
| "eval_recall": 0.9574217435207001, | |
| "eval_runtime": 6.2028, | |
| "eval_samples_per_second": 524.119, | |
| "eval_steps_per_second": 0.645, | |
| "step": 875 | |
| }, | |
| { | |
| "epoch": 4.09, | |
| "eval_accuracy": 0.9918032786885246, | |
| "eval_f1": 0.9520702634880803, | |
| "eval_loss": 0.03815401718020439, | |
| "eval_precision": 0.9464493597206054, | |
| "eval_recall": 0.9577583305284416, | |
| "eval_runtime": 6.4111, | |
| "eval_samples_per_second": 507.091, | |
| "eval_steps_per_second": 0.624, | |
| "step": 900 | |
| }, | |
| { | |
| "epoch": 4.2, | |
| "eval_accuracy": 0.9917643393948834, | |
| "eval_f1": 0.9518385124382277, | |
| "eval_loss": 0.03912338241934776, | |
| "eval_precision": 0.9474737368684342, | |
| "eval_recall": 0.9562436889936049, | |
| "eval_runtime": 6.1023, | |
| "eval_samples_per_second": 532.748, | |
| "eval_steps_per_second": 0.655, | |
| "step": 925 | |
| }, | |
| { | |
| "epoch": 4.32, | |
| "eval_accuracy": 0.9911802499902652, | |
| "eval_f1": 0.9506493506493505, | |
| "eval_loss": 0.0428401380777359, | |
| "eval_precision": 0.9466043717670616, | |
| "eval_recall": 0.9547290474587681, | |
| "eval_runtime": 6.3492, | |
| "eval_samples_per_second": 512.03, | |
| "eval_steps_per_second": 0.63, | |
| "step": 950 | |
| }, | |
| { | |
| "epoch": 4.43, | |
| "eval_accuracy": 0.9913360071648301, | |
| "eval_f1": 0.9506028131279304, | |
| "eval_loss": 0.04035865515470505, | |
| "eval_precision": 0.9458513828723759, | |
| "eval_recall": 0.9554022214742511, | |
| "eval_runtime": 6.1625, | |
| "eval_samples_per_second": 527.542, | |
| "eval_steps_per_second": 0.649, | |
| "step": 975 | |
| }, | |
| { | |
| "epoch": 4.55, | |
| "learning_rate": 3.2727272727272725e-05, | |
| "loss": 0.0118, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 4.55, | |
| "eval_accuracy": 0.9908687356411354, | |
| "eval_f1": 0.9461397365349341, | |
| "eval_loss": 0.04028761386871338, | |
| "eval_precision": 0.9375413086582948, | |
| "eval_recall": 0.9548973409626389, | |
| "eval_runtime": 6.261, | |
| "eval_samples_per_second": 519.243, | |
| "eval_steps_per_second": 0.639, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 4.66, | |
| "eval_accuracy": 0.9919200965694482, | |
| "eval_f1": 0.9533852205205458, | |
| "eval_loss": 0.036938250064849854, | |
| "eval_precision": 0.9482270684201765, | |
| "eval_recall": 0.9585997980477954, | |
| "eval_runtime": 6.1962, | |
| "eval_samples_per_second": 524.674, | |
| "eval_steps_per_second": 0.646, | |
| "step": 1025 | |
| }, | |
| { | |
| "epoch": 4.77, | |
| "eval_accuracy": 0.9918032786885246, | |
| "eval_f1": 0.9520227348712804, | |
| "eval_loss": 0.037420712411403656, | |
| "eval_precision": 0.9456991032879442, | |
| "eval_recall": 0.9584315045439246, | |
| "eval_runtime": 5.9766, | |
| "eval_samples_per_second": 543.958, | |
| "eval_steps_per_second": 0.669, | |
| "step": 1050 | |
| }, | |
| { | |
| "epoch": 4.89, | |
| "eval_accuracy": 0.9922900198590398, | |
| "eval_f1": 0.9538745387453874, | |
| "eval_loss": 0.035940222442150116, | |
| "eval_precision": 0.9506853895018389, | |
| "eval_recall": 0.9570851565129586, | |
| "eval_runtime": 6.2768, | |
| "eval_samples_per_second": 517.943, | |
| "eval_steps_per_second": 0.637, | |
| "step": 1075 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "eval_accuracy": 0.9919006269226276, | |
| "eval_f1": 0.9523093627328155, | |
| "eval_loss": 0.03730743005871773, | |
| "eval_precision": 0.9452827060189023, | |
| "eval_recall": 0.9594412655671491, | |
| "eval_runtime": 6.0853, | |
| "eval_samples_per_second": 534.236, | |
| "eval_steps_per_second": 0.657, | |
| "step": 1100 | |
| }, | |
| { | |
| "epoch": 5.11, | |
| "eval_accuracy": 0.9923873680931428, | |
| "eval_f1": 0.9546215673141327, | |
| "eval_loss": 0.037039875984191895, | |
| "eval_precision": 0.9498500499833389, | |
| "eval_recall": 0.9594412655671491, | |
| "eval_runtime": 6.3128, | |
| "eval_samples_per_second": 514.986, | |
| "eval_steps_per_second": 0.634, | |
| "step": 1125 | |
| }, | |
| { | |
| "epoch": 5.23, | |
| "eval_accuracy": 0.9922316109185779, | |
| "eval_f1": 0.9555313625324512, | |
| "eval_loss": 0.038839343935251236, | |
| "eval_precision": 0.9509918319719953, | |
| "eval_recall": 0.9601144395826321, | |
| "eval_runtime": 6.1584, | |
| "eval_samples_per_second": 527.897, | |
| "eval_steps_per_second": 0.65, | |
| "step": 1150 | |
| }, | |
| { | |
| "epoch": 5.34, | |
| "eval_accuracy": 0.9919785055099101, | |
| "eval_f1": 0.9522212908633696, | |
| "eval_loss": 0.03950090706348419, | |
| "eval_precision": 0.948563794255177, | |
| "eval_recall": 0.9559071019858634, | |
| "eval_runtime": 6.084, | |
| "eval_samples_per_second": 534.349, | |
| "eval_steps_per_second": 0.657, | |
| "step": 1175 | |
| }, | |
| { | |
| "epoch": 5.45, | |
| "eval_accuracy": 0.9923678984463222, | |
| "eval_f1": 0.9542866711319491, | |
| "eval_loss": 0.03910110890865326, | |
| "eval_precision": 0.949516827724092, | |
| "eval_recall": 0.9591046785594076, | |
| "eval_runtime": 6.3281, | |
| "eval_samples_per_second": 513.744, | |
| "eval_steps_per_second": 0.632, | |
| "step": 1200 | |
| }, | |
| { | |
| "epoch": 5.57, | |
| "eval_accuracy": 0.9923289591526809, | |
| "eval_f1": 0.9552313883299799, | |
| "eval_loss": 0.037824589759111404, | |
| "eval_precision": 0.9517206815903776, | |
| "eval_recall": 0.9587680915516661, | |
| "eval_runtime": 6.1901, | |
| "eval_samples_per_second": 525.192, | |
| "eval_steps_per_second": 0.646, | |
| "step": 1225 | |
| }, | |
| { | |
| "epoch": 5.68, | |
| "eval_accuracy": 0.9923678984463222, | |
| "eval_f1": 0.956470785200067, | |
| "eval_loss": 0.038752481341362, | |
| "eval_precision": 0.9515323117921386, | |
| "eval_recall": 0.9614607876135981, | |
| "eval_runtime": 6.178, | |
| "eval_samples_per_second": 526.219, | |
| "eval_steps_per_second": 0.647, | |
| "step": 1250 | |
| }, | |
| { | |
| "epoch": 5.8, | |
| "eval_accuracy": 0.9924457770336046, | |
| "eval_f1": 0.9560485558811219, | |
| "eval_loss": 0.03838498517870903, | |
| "eval_precision": 0.9511910711311011, | |
| "eval_recall": 0.9609559071019859, | |
| "eval_runtime": 6.3664, | |
| "eval_samples_per_second": 510.65, | |
| "eval_steps_per_second": 0.628, | |
| "step": 1275 | |
| }, | |
| { | |
| "epoch": 5.91, | |
| "eval_accuracy": 0.9924068377399634, | |
| "eval_f1": 0.9571045576407506, | |
| "eval_loss": 0.03946718946099281, | |
| "eval_precision": 0.9529529529529529, | |
| "eval_recall": 0.9612924941097274, | |
| "eval_runtime": 6.1196, | |
| "eval_samples_per_second": 531.242, | |
| "eval_steps_per_second": 0.654, | |
| "step": 1300 | |
| }, | |
| { | |
| "epoch": 6.02, | |
| "eval_accuracy": 0.9919200965694482, | |
| "eval_f1": 0.9533869885982562, | |
| "eval_loss": 0.04075756296515465, | |
| "eval_precision": 0.9498830604744404, | |
| "eval_recall": 0.9569168630090878, | |
| "eval_runtime": 6.1927, | |
| "eval_samples_per_second": 524.974, | |
| "eval_steps_per_second": 0.646, | |
| "step": 1325 | |
| }, | |
| { | |
| "epoch": 6.14, | |
| "eval_accuracy": 0.9921732019781161, | |
| "eval_f1": 0.9547998997409975, | |
| "eval_loss": 0.04120802879333496, | |
| "eval_precision": 0.948067031690725, | |
| "eval_recall": 0.9616290811174689, | |
| "eval_runtime": 6.3552, | |
| "eval_samples_per_second": 511.548, | |
| "eval_steps_per_second": 0.629, | |
| "step": 1350 | |
| }, | |
| { | |
| "epoch": 6.25, | |
| "eval_accuracy": 0.9923873680931428, | |
| "eval_f1": 0.9555667337357477, | |
| "eval_loss": 0.0413355678319931, | |
| "eval_precision": 0.952054794520548, | |
| "eval_recall": 0.9591046785594076, | |
| "eval_runtime": 6.2847, | |
| "eval_samples_per_second": 517.288, | |
| "eval_steps_per_second": 0.636, | |
| "step": 1375 | |
| }, | |
| { | |
| "epoch": 6.36, | |
| "eval_accuracy": 0.9917448697480628, | |
| "eval_f1": 0.9525004181301221, | |
| "eval_loss": 0.04124680161476135, | |
| "eval_precision": 0.9466422872340425, | |
| "eval_recall": 0.9584315045439246, | |
| "eval_runtime": 6.4524, | |
| "eval_samples_per_second": 503.841, | |
| "eval_steps_per_second": 0.62, | |
| "step": 1400 | |
| }, | |
| { | |
| "epoch": 6.48, | |
| "eval_accuracy": 0.9920953233908337, | |
| "eval_f1": 0.9555611348229978, | |
| "eval_loss": 0.040540654212236404, | |
| "eval_precision": 0.9503912102547029, | |
| "eval_recall": 0.9607876135981152, | |
| "eval_runtime": 6.1266, | |
| "eval_samples_per_second": 530.638, | |
| "eval_steps_per_second": 0.653, | |
| "step": 1425 | |
| }, | |
| { | |
| "epoch": 6.59, | |
| "eval_accuracy": 0.9925041859740664, | |
| "eval_f1": 0.9565508580996233, | |
| "eval_loss": 0.04004018381237984, | |
| "eval_precision": 0.9516908212560387, | |
| "eval_recall": 0.9614607876135981, | |
| "eval_runtime": 6.4161, | |
| "eval_samples_per_second": 506.697, | |
| "eval_steps_per_second": 0.623, | |
| "step": 1450 | |
| }, | |
| { | |
| "epoch": 6.7, | |
| "eval_accuracy": 0.9922900198590398, | |
| "eval_f1": 0.9551813688531458, | |
| "eval_loss": 0.039815619587898254, | |
| "eval_precision": 0.9509591326105088, | |
| "eval_recall": 0.9594412655671491, | |
| "eval_runtime": 6.2578, | |
| "eval_samples_per_second": 519.511, | |
| "eval_steps_per_second": 0.639, | |
| "step": 1475 | |
| }, | |
| { | |
| "epoch": 6.82, | |
| "learning_rate": 1.909090909090909e-05, | |
| "loss": 0.0049, | |
| "step": 1500 | |
| }, | |
| { | |
| "epoch": 6.82, | |
| "eval_accuracy": 0.9925431252677076, | |
| "eval_f1": 0.956871283812076, | |
| "eval_loss": 0.03951007500290871, | |
| "eval_precision": 0.9523253875645941, | |
| "eval_recall": 0.9614607876135981, | |
| "eval_runtime": 6.2854, | |
| "eval_samples_per_second": 517.232, | |
| "eval_steps_per_second": 0.636, | |
| "step": 1500 | |
| }, | |
| { | |
| "epoch": 6.93, | |
| "eval_accuracy": 0.9927183520890931, | |
| "eval_f1": 0.9571476397723468, | |
| "eval_loss": 0.03918459266424179, | |
| "eval_precision": 0.952047952047952, | |
| "eval_recall": 0.9623022551329519, | |
| "eval_runtime": 6.1825, | |
| "eval_samples_per_second": 525.837, | |
| "eval_steps_per_second": 0.647, | |
| "step": 1525 | |
| }, | |
| { | |
| "epoch": 7.05, | |
| "eval_accuracy": 0.9923484287995016, | |
| "eval_f1": 0.9551738583996647, | |
| "eval_loss": 0.03897989168763161, | |
| "eval_precision": 0.9511096278992157, | |
| "eval_recall": 0.9592729720632783, | |
| "eval_runtime": 6.0468, | |
| "eval_samples_per_second": 537.641, | |
| "eval_steps_per_second": 0.662, | |
| "step": 1550 | |
| }, | |
| { | |
| "epoch": 7.16, | |
| "eval_accuracy": 0.9925431252677076, | |
| "eval_f1": 0.9565363034921699, | |
| "eval_loss": 0.03931865468621254, | |
| "eval_precision": 0.9519919986664445, | |
| "eval_recall": 0.9611242006058566, | |
| "eval_runtime": 6.2528, | |
| "eval_samples_per_second": 519.93, | |
| "eval_steps_per_second": 0.64, | |
| "step": 1575 | |
| }, | |
| { | |
| "epoch": 7.27, | |
| "eval_accuracy": 0.9925236556208871, | |
| "eval_f1": 0.9562233196618398, | |
| "eval_loss": 0.03892602398991585, | |
| "eval_precision": 0.9512073272273106, | |
| "eval_recall": 0.9612924941097274, | |
| "eval_runtime": 6.0818, | |
| "eval_samples_per_second": 534.544, | |
| "eval_steps_per_second": 0.658, | |
| "step": 1600 | |
| }, | |
| { | |
| "epoch": 7.39, | |
| "eval_accuracy": 0.9923678984463222, | |
| "eval_f1": 0.9565435820145692, | |
| "eval_loss": 0.0404973067343235, | |
| "eval_precision": 0.9518413597733711, | |
| "eval_recall": 0.9612924941097274, | |
| "eval_runtime": 6.1086, | |
| "eval_samples_per_second": 532.197, | |
| "eval_steps_per_second": 0.655, | |
| "step": 1625 | |
| }, | |
| { | |
| "epoch": 7.5, | |
| "eval_accuracy": 0.9924847163272458, | |
| "eval_f1": 0.9558737335677803, | |
| "eval_loss": 0.04104885458946228, | |
| "eval_precision": 0.9511748041993001, | |
| "eval_recall": 0.9606193200942443, | |
| "eval_runtime": 6.3603, | |
| "eval_samples_per_second": 511.14, | |
| "eval_steps_per_second": 0.629, | |
| "step": 1650 | |
| }, | |
| { | |
| "epoch": 7.61, | |
| "eval_accuracy": 0.9925431252677076, | |
| "eval_f1": 0.9569442117607639, | |
| "eval_loss": 0.04079214483499527, | |
| "eval_precision": 0.95263509006004, | |
| "eval_recall": 0.9612924941097274, | |
| "eval_runtime": 6.0876, | |
| "eval_samples_per_second": 534.04, | |
| "eval_steps_per_second": 0.657, | |
| "step": 1675 | |
| }, | |
| { | |
| "epoch": 7.73, | |
| "eval_accuracy": 0.9921732019781161, | |
| "eval_f1": 0.9545302574389837, | |
| "eval_loss": 0.043598320335149765, | |
| "eval_precision": 0.9481899701095982, | |
| "eval_recall": 0.9609559071019859, | |
| "eval_runtime": 6.3314, | |
| "eval_samples_per_second": 513.469, | |
| "eval_steps_per_second": 0.632, | |
| "step": 1700 | |
| }, | |
| { | |
| "epoch": 7.84, | |
| "eval_accuracy": 0.9924068377399634, | |
| "eval_f1": 0.9559548683660676, | |
| "eval_loss": 0.0419035442173481, | |
| "eval_precision": 0.9495268138801262, | |
| "eval_recall": 0.9624705486368226, | |
| "eval_runtime": 6.237, | |
| "eval_samples_per_second": 521.246, | |
| "eval_steps_per_second": 0.641, | |
| "step": 1725 | |
| }, | |
| { | |
| "epoch": 7.95, | |
| "eval_accuracy": 0.9925625949145283, | |
| "eval_f1": 0.957126109529392, | |
| "eval_loss": 0.04293340817093849, | |
| "eval_precision": 0.9525, | |
| "eval_recall": 0.9617973746213396, | |
| "eval_runtime": 6.1487, | |
| "eval_samples_per_second": 528.734, | |
| "eval_steps_per_second": 0.651, | |
| "step": 1750 | |
| }, | |
| { | |
| "epoch": 8.07, | |
| "eval_accuracy": 0.9924068377399634, | |
| "eval_f1": 0.9561506276150629, | |
| "eval_loss": 0.041886329650878906, | |
| "eval_precision": 0.9508988015978695, | |
| "eval_recall": 0.9614607876135981, | |
| "eval_runtime": 6.3754, | |
| "eval_samples_per_second": 509.93, | |
| "eval_steps_per_second": 0.627, | |
| "step": 1775 | |
| }, | |
| { | |
| "epoch": 8.18, | |
| "eval_accuracy": 0.9922900198590398, | |
| "eval_f1": 0.9555313625324512, | |
| "eval_loss": 0.04220963269472122, | |
| "eval_precision": 0.9509918319719953, | |
| "eval_recall": 0.9601144395826321, | |
| "eval_runtime": 6.1129, | |
| "eval_samples_per_second": 531.828, | |
| "eval_steps_per_second": 0.654, | |
| "step": 1800 | |
| }, | |
| { | |
| "epoch": 8.3, | |
| "eval_accuracy": 0.9923873680931428, | |
| "eval_f1": 0.9561793045664014, | |
| "eval_loss": 0.041702426970005035, | |
| "eval_precision": 0.9521107959285834, | |
| "eval_recall": 0.9602827330865029, | |
| "eval_runtime": 6.3543, | |
| "eval_samples_per_second": 511.618, | |
| "eval_steps_per_second": 0.629, | |
| "step": 1825 | |
| }, | |
| { | |
| "epoch": 8.41, | |
| "eval_accuracy": 0.9924652466804252, | |
| "eval_f1": 0.9570171763720151, | |
| "eval_loss": 0.04150727763772011, | |
| "eval_precision": 0.952945102619723, | |
| "eval_recall": 0.9611242006058566, | |
| "eval_runtime": 6.1032, | |
| "eval_samples_per_second": 532.671, | |
| "eval_steps_per_second": 0.655, | |
| "step": 1850 | |
| }, | |
| { | |
| "epoch": 8.52, | |
| "eval_accuracy": 0.9924263073867841, | |
| "eval_f1": 0.9566965407488064, | |
| "eval_loss": 0.04162871465086937, | |
| "eval_precision": 0.952309488077372, | |
| "eval_recall": 0.9611242006058566, | |
| "eval_runtime": 6.1162, | |
| "eval_samples_per_second": 531.542, | |
| "eval_steps_per_second": 0.654, | |
| "step": 1875 | |
| }, | |
| { | |
| "epoch": 8.64, | |
| "eval_accuracy": 0.9922316109185779, | |
| "eval_f1": 0.9555611348229978, | |
| "eval_loss": 0.04189736768603325, | |
| "eval_precision": 0.9503912102547029, | |
| "eval_recall": 0.9607876135981152, | |
| "eval_runtime": 6.4808, | |
| "eval_samples_per_second": 501.634, | |
| "eval_steps_per_second": 0.617, | |
| "step": 1900 | |
| }, | |
| { | |
| "epoch": 8.75, | |
| "eval_accuracy": 0.9923873680931428, | |
| "eval_f1": 0.9564489112227805, | |
| "eval_loss": 0.04165585711598396, | |
| "eval_precision": 0.9519839946648883, | |
| "eval_recall": 0.9609559071019859, | |
| "eval_runtime": 6.2132, | |
| "eval_samples_per_second": 523.242, | |
| "eval_steps_per_second": 0.644, | |
| "step": 1925 | |
| }, | |
| { | |
| "epoch": 8.86, | |
| "eval_accuracy": 0.9926015342081694, | |
| "eval_f1": 0.9577818730105546, | |
| "eval_loss": 0.041886311024427414, | |
| "eval_precision": 0.9534689793195463, | |
| "eval_recall": 0.9621339616290812, | |
| "eval_runtime": 6.5243, | |
| "eval_samples_per_second": 498.291, | |
| "eval_steps_per_second": 0.613, | |
| "step": 1950 | |
| }, | |
| { | |
| "epoch": 8.98, | |
| "eval_accuracy": 0.9926599431486313, | |
| "eval_f1": 0.9575341318368372, | |
| "eval_loss": 0.04215257614850998, | |
| "eval_precision": 0.9531432382858096, | |
| "eval_recall": 0.9619656681252103, | |
| "eval_runtime": 6.2104, | |
| "eval_samples_per_second": 523.476, | |
| "eval_steps_per_second": 0.644, | |
| "step": 1975 | |
| }, | |
| { | |
| "epoch": 9.09, | |
| "learning_rate": 5.4545454545454545e-06, | |
| "loss": 0.0022, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 9.09, | |
| "eval_accuracy": 0.9925820645613489, | |
| "eval_f1": 0.9571847507331379, | |
| "eval_loss": 0.04227477312088013, | |
| "eval_precision": 0.953111963957951, | |
| "eval_recall": 0.9612924941097274, | |
| "eval_runtime": 6.1893, | |
| "eval_samples_per_second": 525.265, | |
| "eval_steps_per_second": 0.646, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 9.2, | |
| "eval_accuracy": 0.9925431252677076, | |
| "eval_f1": 0.9567110441262665, | |
| "eval_loss": 0.042577099055051804, | |
| "eval_precision": 0.9520079986668889, | |
| "eval_recall": 0.9614607876135981, | |
| "eval_runtime": 6.2434, | |
| "eval_samples_per_second": 520.71, | |
| "eval_steps_per_second": 0.641, | |
| "step": 2025 | |
| }, | |
| { | |
| "epoch": 9.32, | |
| "eval_accuracy": 0.9924652466804252, | |
| "eval_f1": 0.9560338330123105, | |
| "eval_loss": 0.04250513017177582, | |
| "eval_precision": 0.9514919153192198, | |
| "eval_recall": 0.9606193200942443, | |
| "eval_runtime": 5.9913, | |
| "eval_samples_per_second": 542.619, | |
| "eval_steps_per_second": 0.668, | |
| "step": 2050 | |
| }, | |
| { | |
| "epoch": 9.43, | |
| "eval_accuracy": 0.9925431252677076, | |
| "eval_f1": 0.956463496316142, | |
| "eval_loss": 0.0422191396355629, | |
| "eval_precision": 0.951682772409197, | |
| "eval_recall": 0.9612924941097274, | |
| "eval_runtime": 6.2812, | |
| "eval_samples_per_second": 517.58, | |
| "eval_steps_per_second": 0.637, | |
| "step": 2075 | |
| }, | |
| { | |
| "epoch": 9.55, | |
| "eval_accuracy": 0.9924847163272458, | |
| "eval_f1": 0.9559537765868363, | |
| "eval_loss": 0.0423436276614666, | |
| "eval_precision": 0.9513333333333334, | |
| "eval_recall": 0.9606193200942443, | |
| "eval_runtime": 6.0529, | |
| "eval_samples_per_second": 537.095, | |
| "eval_steps_per_second": 0.661, | |
| "step": 2100 | |
| }, | |
| { | |
| "epoch": 9.66, | |
| "eval_accuracy": 0.9924652466804252, | |
| "eval_f1": 0.9558663428523575, | |
| "eval_loss": 0.04235740005970001, | |
| "eval_precision": 0.951325220870145, | |
| "eval_recall": 0.9604510265903736, | |
| "eval_runtime": 6.0731, | |
| "eval_samples_per_second": 535.315, | |
| "eval_steps_per_second": 0.659, | |
| "step": 2125 | |
| }, | |
| { | |
| "epoch": 9.77, | |
| "eval_accuracy": 0.9924652466804252, | |
| "eval_f1": 0.9566164154103852, | |
| "eval_loss": 0.042295120656490326, | |
| "eval_precision": 0.9521507169056352, | |
| "eval_recall": 0.9611242006058566, | |
| "eval_runtime": 6.3348, | |
| "eval_samples_per_second": 513.197, | |
| "eval_steps_per_second": 0.631, | |
| "step": 2150 | |
| }, | |
| { | |
| "epoch": 9.89, | |
| "eval_accuracy": 0.9924847163272458, | |
| "eval_f1": 0.9567037936521229, | |
| "eval_loss": 0.04226445034146309, | |
| "eval_precision": 0.9521586931155193, | |
| "eval_recall": 0.9612924941097274, | |
| "eval_runtime": 6.1145, | |
| "eval_samples_per_second": 531.688, | |
| "eval_steps_per_second": 0.654, | |
| "step": 2175 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "eval_accuracy": 0.9925236556208871, | |
| "eval_f1": 0.9570387739720292, | |
| "eval_loss": 0.04224075376987457, | |
| "eval_precision": 0.952492082013669, | |
| "eval_recall": 0.9616290811174689, | |
| "eval_runtime": 6.3677, | |
| "eval_samples_per_second": 510.543, | |
| "eval_steps_per_second": 0.628, | |
| "step": 2200 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "step": 2200, | |
| "total_flos": 4144211411102244.0, | |
| "train_loss": 0.021953743980689482, | |
| "train_runtime": 1324.4932, | |
| "train_samples_per_second": 106.018, | |
| "train_steps_per_second": 1.661 | |
| } | |
| ], | |
| "max_steps": 2200, | |
| "num_train_epochs": 10, | |
| "total_flos": 4144211411102244.0, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |