| { | |
| "best_metric": 0.6934678744913757, | |
| "best_model_checkpoint": "sloberta_sentinews_sentence_2e-05_10e_lr2e-05/checkpoint-3560", | |
| "epoch": 2.9966329966329965, | |
| "global_step": 3560, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 0.03, | |
| "learning_rate": 1.9932659932659936e-05, | |
| "loss": 0.9684, | |
| "step": 40 | |
| }, | |
| { | |
| "epoch": 0.03, | |
| "eval_accuracy": 0.5901716992303138, | |
| "eval_f1_macro": 0.3290637211523573, | |
| "eval_f1_negative": 0.25811001410437234, | |
| "eval_f1_neutral": 0.7290811493526997, | |
| "eval_f1_positive": 0.0, | |
| "eval_loss": 0.9020117521286011, | |
| "eval_precision_negative": 0.6455026455026455, | |
| "eval_precision_neutral": 0.5861893881695862, | |
| "eval_precision_positive": 0.0, | |
| "eval_recall_negative": 0.16130453944468928, | |
| "eval_recall_neutral": 0.9640918580375782, | |
| "eval_recall_positive": 0.0, | |
| "eval_runtime": 13.6446, | |
| "eval_samples_per_second": 618.928, | |
| "eval_steps_per_second": 3.225, | |
| "step": 40 | |
| }, | |
| { | |
| "epoch": 0.07, | |
| "learning_rate": 1.9865319865319866e-05, | |
| "loss": 0.8398, | |
| "step": 80 | |
| }, | |
| { | |
| "epoch": 0.07, | |
| "eval_accuracy": 0.6470100651272943, | |
| "eval_f1_macro": 0.5536698584230076, | |
| "eval_f1_negative": 0.5115520521880946, | |
| "eval_f1_neutral": 0.7385869565217391, | |
| "eval_f1_positive": 0.4108705665591893, | |
| "eval_loss": 0.7759891152381897, | |
| "eval_precision_negative": 0.6673758865248227, | |
| "eval_precision_neutral": 0.65232, | |
| "eval_precision_positive": 0.5681528662420382, | |
| "eval_recall_negative": 0.41472014103129134, | |
| "eval_recall_neutral": 0.8511482254697286, | |
| "eval_recall_positive": 0.3217893217893218, | |
| "eval_runtime": 13.475, | |
| "eval_samples_per_second": 626.715, | |
| "eval_steps_per_second": 3.265, | |
| "step": 80 | |
| }, | |
| { | |
| "epoch": 0.1, | |
| "learning_rate": 1.97979797979798e-05, | |
| "loss": 0.7748, | |
| "step": 120 | |
| }, | |
| { | |
| "epoch": 0.1, | |
| "eval_accuracy": 0.6824156305506217, | |
| "eval_f1_macro": 0.6410968890440648, | |
| "eval_f1_negative": 0.6465890942276981, | |
| "eval_f1_neutral": 0.7394423944239442, | |
| "eval_f1_positive": 0.5372591784805524, | |
| "eval_loss": 0.7227517366409302, | |
| "eval_precision_negative": 0.6702932828760644, | |
| "eval_precision_neutral": 0.7263391059202577, | |
| "eval_precision_positive": 0.5413919413919414, | |
| "eval_recall_negative": 0.624504186866461, | |
| "eval_recall_neutral": 0.753027139874739, | |
| "eval_recall_positive": 0.5331890331890332, | |
| "eval_runtime": 13.5517, | |
| "eval_samples_per_second": 623.169, | |
| "eval_steps_per_second": 3.247, | |
| "step": 120 | |
| }, | |
| { | |
| "epoch": 0.13, | |
| "learning_rate": 1.973063973063973e-05, | |
| "loss": 0.7661, | |
| "step": 160 | |
| }, | |
| { | |
| "epoch": 0.13, | |
| "eval_accuracy": 0.6966252220248668, | |
| "eval_f1_macro": 0.6402639165706846, | |
| "eval_f1_negative": 0.6606451612903226, | |
| "eval_f1_neutral": 0.755861518507433, | |
| "eval_f1_positive": 0.5042850699142984, | |
| "eval_loss": 0.6990944147109985, | |
| "eval_precision_negative": 0.6451070978580429, | |
| "eval_precision_neutral": 0.7238677622778521, | |
| "eval_precision_positive": 0.6726835138387485, | |
| "eval_recall_negative": 0.6769501983252534, | |
| "eval_recall_neutral": 0.7908141962421712, | |
| "eval_recall_positive": 0.4033189033189033, | |
| "eval_runtime": 13.529, | |
| "eval_samples_per_second": 624.216, | |
| "eval_steps_per_second": 3.252, | |
| "step": 160 | |
| }, | |
| { | |
| "epoch": 0.17, | |
| "learning_rate": 1.9663299663299665e-05, | |
| "loss": 0.7329, | |
| "step": 200 | |
| }, | |
| { | |
| "epoch": 0.17, | |
| "eval_accuracy": 0.6814683244523386, | |
| "eval_f1_macro": 0.6584553155124641, | |
| "eval_f1_negative": 0.6805819101834283, | |
| "eval_f1_neutral": 0.7180338757887746, | |
| "eval_f1_positive": 0.5767501605651895, | |
| "eval_loss": 0.7035245299339294, | |
| "eval_precision_negative": 0.6523848019401779, | |
| "eval_precision_neutral": 0.7643176997407495, | |
| "eval_precision_positive": 0.5196759259259259, | |
| "eval_recall_negative": 0.7113265755839577, | |
| "eval_recall_neutral": 0.677035490605428, | |
| "eval_recall_positive": 0.6479076479076479, | |
| "eval_runtime": 13.5578, | |
| "eval_samples_per_second": 622.89, | |
| "eval_steps_per_second": 3.245, | |
| "step": 200 | |
| }, | |
| { | |
| "epoch": 0.2, | |
| "learning_rate": 1.9595959595959596e-05, | |
| "loss": 0.7084, | |
| "step": 240 | |
| }, | |
| { | |
| "epoch": 0.2, | |
| "eval_accuracy": 0.7044404973357016, | |
| "eval_f1_macro": 0.6484202003006585, | |
| "eval_f1_negative": 0.6737166776823088, | |
| "eval_f1_neutral": 0.7610199644198458, | |
| "eval_f1_positive": 0.5105239587998209, | |
| "eval_loss": 0.6696082353591919, | |
| "eval_precision_negative": 0.673568281938326, | |
| "eval_precision_neutral": 0.7225975975975976, | |
| "eval_precision_positive": 0.6729634002361276, | |
| "eval_recall_negative": 0.6738651388276774, | |
| "eval_recall_neutral": 0.8037578288100209, | |
| "eval_recall_positive": 0.41125541125541126, | |
| "eval_runtime": 13.468, | |
| "eval_samples_per_second": 627.04, | |
| "eval_steps_per_second": 3.267, | |
| "step": 240 | |
| }, | |
| { | |
| "epoch": 0.24, | |
| "learning_rate": 1.952861952861953e-05, | |
| "loss": 0.6878, | |
| "step": 280 | |
| }, | |
| { | |
| "epoch": 0.24, | |
| "eval_accuracy": 0.6889283599763173, | |
| "eval_f1_macro": 0.6646815029633141, | |
| "eval_f1_negative": 0.6859417557091976, | |
| "eval_f1_neutral": 0.7256559446701065, | |
| "eval_f1_positive": 0.5824468085106382, | |
| "eval_loss": 0.6821370720863342, | |
| "eval_precision_negative": 0.6537539936102237, | |
| "eval_precision_neutral": 0.7652234313498495, | |
| "eval_precision_positive": 0.5400739827373613, | |
| "eval_recall_negative": 0.7214631996474218, | |
| "eval_recall_neutral": 0.6899791231732777, | |
| "eval_recall_positive": 0.6320346320346321, | |
| "eval_runtime": 13.4239, | |
| "eval_samples_per_second": 629.1, | |
| "eval_steps_per_second": 3.278, | |
| "step": 280 | |
| }, | |
| { | |
| "epoch": 0.27, | |
| "learning_rate": 1.9461279461279464e-05, | |
| "loss": 0.7059, | |
| "step": 320 | |
| }, | |
| { | |
| "epoch": 0.27, | |
| "eval_accuracy": 0.7119005328596802, | |
| "eval_f1_macro": 0.6649492798540481, | |
| "eval_f1_negative": 0.6837046745303625, | |
| "eval_f1_neutral": 0.763837267704671, | |
| "eval_f1_positive": 0.5473058973271108, | |
| "eval_loss": 0.662620484828949, | |
| "eval_precision_negative": 0.6777825898657427, | |
| "eval_precision_neutral": 0.736108422071636, | |
| "eval_precision_positive": 0.6642636457260556, | |
| "eval_recall_negative": 0.6897311591009255, | |
| "eval_recall_neutral": 0.7937369519832985, | |
| "eval_recall_positive": 0.4653679653679654, | |
| "eval_runtime": 13.4494, | |
| "eval_samples_per_second": 627.911, | |
| "eval_steps_per_second": 3.272, | |
| "step": 320 | |
| }, | |
| { | |
| "epoch": 0.3, | |
| "learning_rate": 1.9393939393939395e-05, | |
| "loss": 0.6745, | |
| "step": 360 | |
| }, | |
| { | |
| "epoch": 0.3, | |
| "eval_accuracy": 0.709295441089402, | |
| "eval_f1_macro": 0.6599969904410593, | |
| "eval_f1_negative": 0.6773485513608428, | |
| "eval_f1_neutral": 0.7627118644067796, | |
| "eval_f1_positive": 0.5399305555555556, | |
| "eval_loss": 0.6554310917854309, | |
| "eval_precision_negative": 0.674682990817665, | |
| "eval_precision_neutral": 0.7299618320610687, | |
| "eval_precision_positive": 0.6775599128540305, | |
| "eval_recall_negative": 0.6800352578228295, | |
| "eval_recall_neutral": 0.7985386221294363, | |
| "eval_recall_positive": 0.44877344877344877, | |
| "eval_runtime": 13.4392, | |
| "eval_samples_per_second": 628.385, | |
| "eval_steps_per_second": 3.274, | |
| "step": 360 | |
| }, | |
| { | |
| "epoch": 0.34, | |
| "learning_rate": 1.932659932659933e-05, | |
| "loss": 0.6824, | |
| "step": 400 | |
| }, | |
| { | |
| "epoch": 0.34, | |
| "eval_accuracy": 0.7095322676139728, | |
| "eval_f1_macro": 0.6638552526690601, | |
| "eval_f1_negative": 0.6730469619407968, | |
| "eval_f1_neutral": 0.7641443071048136, | |
| "eval_f1_positive": 0.5543744889615698, | |
| "eval_loss": 0.6521803736686707, | |
| "eval_precision_negative": 0.6798561151079137, | |
| "eval_precision_neutral": 0.7366789381902732, | |
| "eval_precision_positive": 0.6396226415094339, | |
| "eval_recall_negative": 0.6663728514764213, | |
| "eval_recall_neutral": 0.7937369519832985, | |
| "eval_recall_positive": 0.48917748917748916, | |
| "eval_runtime": 13.4346, | |
| "eval_samples_per_second": 628.599, | |
| "eval_steps_per_second": 3.275, | |
| "step": 400 | |
| }, | |
| { | |
| "epoch": 0.37, | |
| "learning_rate": 1.925925925925926e-05, | |
| "loss": 0.669, | |
| "step": 440 | |
| }, | |
| { | |
| "epoch": 0.37, | |
| "eval_accuracy": 0.713084665482534, | |
| "eval_f1_macro": 0.6622007799006476, | |
| "eval_f1_negative": 0.6819873057561829, | |
| "eval_f1_neutral": 0.7671314741035858, | |
| "eval_f1_positive": 0.5374835598421743, | |
| "eval_loss": 0.6492008566856384, | |
| "eval_precision_negative": 0.6773913043478261, | |
| "eval_precision_neutral": 0.7335238095238096, | |
| "eval_precision_positive": 0.6849162011173184, | |
| "eval_recall_negative": 0.6866460996033495, | |
| "eval_recall_neutral": 0.8039665970772443, | |
| "eval_recall_positive": 0.4422799422799423, | |
| "eval_runtime": 13.4531, | |
| "eval_samples_per_second": 627.738, | |
| "eval_steps_per_second": 3.271, | |
| "step": 440 | |
| }, | |
| { | |
| "epoch": 0.4, | |
| "learning_rate": 1.9191919191919194e-05, | |
| "loss": 0.6835, | |
| "step": 480 | |
| }, | |
| { | |
| "epoch": 0.4, | |
| "eval_accuracy": 0.7045589105979869, | |
| "eval_f1_macro": 0.6620625908815416, | |
| "eval_f1_negative": 0.6357811729916215, | |
| "eval_f1_neutral": 0.7631345490389355, | |
| "eval_f1_positive": 0.5872720506140677, | |
| "eval_loss": 0.6506330966949463, | |
| "eval_precision_negative": 0.7210732252655114, | |
| "eval_precision_neutral": 0.722875816993464, | |
| "eval_precision_positive": 0.606456571867794, | |
| "eval_recall_negative": 0.5685323931247246, | |
| "eval_recall_neutral": 0.8081419624217119, | |
| "eval_recall_positive": 0.5692640692640693, | |
| "eval_runtime": 13.434, | |
| "eval_samples_per_second": 628.63, | |
| "eval_steps_per_second": 3.275, | |
| "step": 480 | |
| }, | |
| { | |
| "epoch": 0.44, | |
| "learning_rate": 1.9124579124579125e-05, | |
| "loss": 0.659, | |
| "step": 520 | |
| }, | |
| { | |
| "epoch": 0.44, | |
| "eval_accuracy": 0.7040852575488454, | |
| "eval_f1_macro": 0.6783997964045833, | |
| "eval_f1_negative": 0.699721226602947, | |
| "eval_f1_neutral": 0.7399162442142384, | |
| "eval_f1_positive": 0.595561918396564, | |
| "eval_loss": 0.6650780439376831, | |
| "eval_precision_negative": 0.6382128586996004, | |
| "eval_precision_neutral": 0.7836134453781513, | |
| "eval_precision_positive": 0.5909090909090909, | |
| "eval_recall_negative": 0.7743499338915822, | |
| "eval_recall_neutral": 0.7008350730688935, | |
| "eval_recall_positive": 0.6002886002886003, | |
| "eval_runtime": 13.4366, | |
| "eval_samples_per_second": 628.508, | |
| "eval_steps_per_second": 3.275, | |
| "step": 520 | |
| }, | |
| { | |
| "epoch": 0.47, | |
| "learning_rate": 1.905723905723906e-05, | |
| "loss": 0.6554, | |
| "step": 560 | |
| }, | |
| { | |
| "epoch": 0.47, | |
| "eval_accuracy": 0.7166370633510953, | |
| "eval_f1_macro": 0.6722586905255515, | |
| "eval_f1_negative": 0.6801165657924232, | |
| "eval_f1_neutral": 0.7694463910301331, | |
| "eval_f1_positive": 0.5672131147540983, | |
| "eval_loss": 0.6467012763023376, | |
| "eval_precision_negative": 0.6920620437956204, | |
| "eval_precision_neutral": 0.7391806116560877, | |
| "eval_precision_positive": 0.6565464895635673, | |
| "eval_recall_negative": 0.6685764654032613, | |
| "eval_recall_neutral": 0.8022964509394572, | |
| "eval_recall_positive": 0.49927849927849927, | |
| "eval_runtime": 13.4494, | |
| "eval_samples_per_second": 627.909, | |
| "eval_steps_per_second": 3.272, | |
| "step": 560 | |
| }, | |
| { | |
| "epoch": 0.51, | |
| "learning_rate": 1.8989898989898993e-05, | |
| "loss": 0.659, | |
| "step": 600 | |
| }, | |
| { | |
| "epoch": 0.51, | |
| "eval_accuracy": 0.712137359384251, | |
| "eval_f1_macro": 0.6705187144410446, | |
| "eval_f1_negative": 0.6719478098788444, | |
| "eval_f1_neutral": 0.7654419861848032, | |
| "eval_f1_positive": 0.5741663472594865, | |
| "eval_loss": 0.6443530917167664, | |
| "eval_precision_negative": 0.71280276816609, | |
| "eval_precision_neutral": 0.7353337180226966, | |
| "eval_precision_positive": 0.6124284546197875, | |
| "eval_recall_negative": 0.6355222565006611, | |
| "eval_recall_neutral": 0.7981210855949895, | |
| "eval_recall_positive": 0.5404040404040404, | |
| "eval_runtime": 13.4345, | |
| "eval_samples_per_second": 628.604, | |
| "eval_steps_per_second": 3.275, | |
| "step": 600 | |
| }, | |
| { | |
| "epoch": 0.54, | |
| "learning_rate": 1.8922558922558924e-05, | |
| "loss": 0.6692, | |
| "step": 640 | |
| }, | |
| { | |
| "epoch": 0.54, | |
| "eval_accuracy": 0.7047957371225577, | |
| "eval_f1_macro": 0.6746517865902923, | |
| "eval_f1_negative": 0.6761710794297353, | |
| "eval_f1_neutral": 0.7508104151416919, | |
| "eval_f1_positive": 0.5969738651994497, | |
| "eval_loss": 0.6483765244483948, | |
| "eval_precision_negative": 0.6948837209302325, | |
| "eval_precision_neutral": 0.7521474963335428, | |
| "eval_precision_positive": 0.5703022339027596, | |
| "eval_recall_negative": 0.6584398413397973, | |
| "eval_recall_neutral": 0.7494780793319415, | |
| "eval_recall_positive": 0.6262626262626263, | |
| "eval_runtime": 13.5781, | |
| "eval_samples_per_second": 621.958, | |
| "eval_steps_per_second": 3.241, | |
| "step": 640 | |
| }, | |
| { | |
| "epoch": 0.57, | |
| "learning_rate": 1.8855218855218858e-05, | |
| "loss": 0.6343, | |
| "step": 680 | |
| }, | |
| { | |
| "epoch": 0.57, | |
| "eval_accuracy": 0.7084665482534044, | |
| "eval_f1_macro": 0.6745823109427566, | |
| "eval_f1_negative": 0.6674407803065491, | |
| "eval_f1_neutral": 0.7580216636010628, | |
| "eval_f1_positive": 0.5982844889206576, | |
| "eval_loss": 0.6420348286628723, | |
| "eval_precision_negative": 0.7054491899852725, | |
| "eval_precision_neutral": 0.7423939151321057, | |
| "eval_precision_positive": 0.5927762039660056, | |
| "eval_recall_negative": 0.6333186425738211, | |
| "eval_recall_neutral": 0.774321503131524, | |
| "eval_recall_positive": 0.6038961038961039, | |
| "eval_runtime": 13.5238, | |
| "eval_samples_per_second": 624.455, | |
| "eval_steps_per_second": 3.254, | |
| "step": 680 | |
| }, | |
| { | |
| "epoch": 0.61, | |
| "learning_rate": 1.8787878787878792e-05, | |
| "loss": 0.6707, | |
| "step": 720 | |
| }, | |
| { | |
| "epoch": 0.61, | |
| "eval_accuracy": 0.7161634103019539, | |
| "eval_f1_macro": 0.6635859690261697, | |
| "eval_f1_negative": 0.6552984165651644, | |
| "eval_f1_neutral": 0.7757296466973886, | |
| "eval_f1_positive": 0.5597298438159561, | |
| "eval_loss": 0.630727231502533, | |
| "eval_precision_negative": 0.7325708061002179, | |
| "eval_precision_neutral": 0.7180945609669392, | |
| "eval_precision_positive": 0.6744659206510681, | |
| "eval_recall_negative": 0.5927721463199648, | |
| "eval_recall_neutral": 0.8434237995824635, | |
| "eval_recall_positive": 0.47835497835497837, | |
| "eval_runtime": 13.5358, | |
| "eval_samples_per_second": 623.902, | |
| "eval_steps_per_second": 3.251, | |
| "step": 720 | |
| }, | |
| { | |
| "epoch": 0.64, | |
| "learning_rate": 1.8720538720538723e-05, | |
| "loss": 0.6555, | |
| "step": 760 | |
| }, | |
| { | |
| "epoch": 0.64, | |
| "eval_accuracy": 0.7173475429248076, | |
| "eval_f1_macro": 0.6760934295779212, | |
| "eval_f1_negative": 0.6785469499657298, | |
| "eval_f1_neutral": 0.7685231476852316, | |
| "eval_f1_positive": 0.5812101910828025, | |
| "eval_loss": 0.6327303051948547, | |
| "eval_precision_negative": 0.7044592030360531, | |
| "eval_precision_neutral": 0.7374784110535406, | |
| "eval_precision_positive": 0.6483126110124334, | |
| "eval_recall_negative": 0.6544733362714852, | |
| "eval_recall_neutral": 0.8022964509394572, | |
| "eval_recall_positive": 0.5266955266955267, | |
| "eval_runtime": 13.5283, | |
| "eval_samples_per_second": 624.249, | |
| "eval_steps_per_second": 3.252, | |
| "step": 760 | |
| }, | |
| { | |
| "epoch": 0.67, | |
| "learning_rate": 1.8653198653198653e-05, | |
| "loss": 0.6539, | |
| "step": 800 | |
| }, | |
| { | |
| "epoch": 0.67, | |
| "eval_accuracy": 0.713676731793961, | |
| "eval_f1_macro": 0.6798716085872009, | |
| "eval_f1_negative": 0.6834306241580603, | |
| "eval_f1_neutral": 0.7602507450416196, | |
| "eval_f1_positive": 0.5959334565619224, | |
| "eval_loss": 0.63933926820755, | |
| "eval_precision_negative": 0.6965675057208238, | |
| "eval_precision_neutral": 0.7486338797814208, | |
| "eval_precision_positive": 0.6110689916603488, | |
| "eval_recall_negative": 0.6707800793301014, | |
| "eval_recall_neutral": 0.7722338204592902, | |
| "eval_recall_positive": 0.5815295815295816, | |
| "eval_runtime": 13.556, | |
| "eval_samples_per_second": 622.971, | |
| "eval_steps_per_second": 3.246, | |
| "step": 800 | |
| }, | |
| { | |
| "epoch": 0.71, | |
| "learning_rate": 1.8585858585858588e-05, | |
| "loss": 0.6586, | |
| "step": 840 | |
| }, | |
| { | |
| "epoch": 0.71, | |
| "eval_accuracy": 0.7122557726465364, | |
| "eval_f1_macro": 0.6643997026372683, | |
| "eval_f1_negative": 0.6466569058077111, | |
| "eval_f1_neutral": 0.7709443099273607, | |
| "eval_f1_positive": 0.575597892176733, | |
| "eval_loss": 0.6333789229393005, | |
| "eval_precision_negative": 0.7244395844723893, | |
| "eval_precision_neutral": 0.7190605239385727, | |
| "eval_precision_positive": 0.6567992599444958, | |
| "eval_recall_negative": 0.5839576906126047, | |
| "eval_recall_neutral": 0.8308977035490606, | |
| "eval_recall_positive": 0.5122655122655123, | |
| "eval_runtime": 13.615, | |
| "eval_samples_per_second": 620.272, | |
| "eval_steps_per_second": 3.232, | |
| "step": 840 | |
| }, | |
| { | |
| "epoch": 0.74, | |
| "learning_rate": 1.851851851851852e-05, | |
| "loss": 0.6579, | |
| "step": 880 | |
| }, | |
| { | |
| "epoch": 0.74, | |
| "eval_accuracy": 0.7187685020722321, | |
| "eval_f1_macro": 0.6807447825123648, | |
| "eval_f1_negative": 0.6873633581110626, | |
| "eval_f1_neutral": 0.7675631455159013, | |
| "eval_f1_positive": 0.5873078439101301, | |
| "eval_loss": 0.6417641639709473, | |
| "eval_precision_negative": 0.6819956616052061, | |
| "eval_precision_neutral": 0.7522549609140108, | |
| "eval_precision_positive": 0.6472632493483927, | |
| "eval_recall_negative": 0.6928162185985015, | |
| "eval_recall_neutral": 0.7835073068893528, | |
| "eval_recall_positive": 0.5375180375180375, | |
| "eval_runtime": 13.429, | |
| "eval_samples_per_second": 628.863, | |
| "eval_steps_per_second": 3.276, | |
| "step": 880 | |
| }, | |
| { | |
| "epoch": 0.77, | |
| "learning_rate": 1.8451178451178452e-05, | |
| "loss": 0.6408, | |
| "step": 920 | |
| }, | |
| { | |
| "epoch": 0.77, | |
| "eval_accuracy": 0.7156897572528124, | |
| "eval_f1_macro": 0.6733312463576527, | |
| "eval_f1_negative": 0.6765443355368133, | |
| "eval_f1_neutral": 0.7680304091227369, | |
| "eval_f1_positive": 0.5754189944134079, | |
| "eval_loss": 0.6319063901901245, | |
| "eval_precision_negative": 0.7006610009442871, | |
| "eval_precision_neutral": 0.7372767428461686, | |
| "eval_precision_positive": 0.64375, | |
| "eval_recall_negative": 0.6540326134861172, | |
| "eval_recall_neutral": 0.8014613778705637, | |
| "eval_recall_positive": 0.5202020202020202, | |
| "eval_runtime": 13.4319, | |
| "eval_samples_per_second": 628.725, | |
| "eval_steps_per_second": 3.276, | |
| "step": 920 | |
| }, | |
| { | |
| "epoch": 0.81, | |
| "learning_rate": 1.8383838383838387e-05, | |
| "loss": 0.6458, | |
| "step": 960 | |
| }, | |
| { | |
| "epoch": 0.81, | |
| "eval_accuracy": 0.7116637063351096, | |
| "eval_f1_macro": 0.6808189121483205, | |
| "eval_f1_negative": 0.6855624446412755, | |
| "eval_f1_neutral": 0.7558841907935847, | |
| "eval_f1_positive": 0.601010101010101, | |
| "eval_loss": 0.6365010142326355, | |
| "eval_precision_negative": 0.6889185580774366, | |
| "eval_precision_neutral": 0.7541562759767249, | |
| "eval_precision_positive": 0.601010101010101, | |
| "eval_recall_negative": 0.6822388717496695, | |
| "eval_recall_neutral": 0.7576200417536535, | |
| "eval_recall_positive": 0.601010101010101, | |
| "eval_runtime": 13.4342, | |
| "eval_samples_per_second": 628.619, | |
| "eval_steps_per_second": 3.275, | |
| "step": 960 | |
| }, | |
| { | |
| "epoch": 0.84, | |
| "learning_rate": 1.831649831649832e-05, | |
| "loss": 0.6663, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 0.84, | |
| "eval_accuracy": 0.7177027827116637, | |
| "eval_f1_macro": 0.6745871543495067, | |
| "eval_f1_negative": 0.6834215167548501, | |
| "eval_f1_neutral": 0.7686739720518749, | |
| "eval_f1_positive": 0.5716659742417948, | |
| "eval_loss": 0.6319110989570618, | |
| "eval_precision_negative": 0.6837229819144244, | |
| "eval_precision_neutral": 0.7413224743067675, | |
| "eval_precision_positive": 0.67384916748286, | |
| "eval_recall_negative": 0.6831203173204055, | |
| "eval_recall_neutral": 0.7981210855949895, | |
| "eval_recall_positive": 0.4963924963924964, | |
| "eval_runtime": 13.4422, | |
| "eval_samples_per_second": 628.246, | |
| "eval_steps_per_second": 3.273, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 0.88, | |
| "learning_rate": 1.824915824915825e-05, | |
| "loss": 0.6456, | |
| "step": 1040 | |
| }, | |
| { | |
| "epoch": 0.88, | |
| "eval_accuracy": 0.7104795737122558, | |
| "eval_f1_macro": 0.6846884030136478, | |
| "eval_f1_negative": 0.6933867735470942, | |
| "eval_f1_neutral": 0.7508249068653539, | |
| "eval_f1_positive": 0.6098535286284953, | |
| "eval_loss": 0.6414014101028442, | |
| "eval_precision_negative": 0.7007200720072008, | |
| "eval_precision_neutral": 0.7659066232356134, | |
| "eval_precision_positive": 0.5661310259579728, | |
| "eval_recall_negative": 0.6862053768179814, | |
| "eval_recall_neutral": 0.7363256784968685, | |
| "eval_recall_positive": 0.6608946608946609, | |
| "eval_runtime": 13.4341, | |
| "eval_samples_per_second": 628.625, | |
| "eval_steps_per_second": 3.275, | |
| "step": 1040 | |
| }, | |
| { | |
| "epoch": 0.91, | |
| "learning_rate": 1.8181818181818182e-05, | |
| "loss": 0.6416, | |
| "step": 1080 | |
| }, | |
| { | |
| "epoch": 0.91, | |
| "eval_accuracy": 0.7153345174659562, | |
| "eval_f1_macro": 0.6849725647884108, | |
| "eval_f1_negative": 0.6939308244507288, | |
| "eval_f1_neutral": 0.7585337674614012, | |
| "eval_f1_positive": 0.6024531024531025, | |
| "eval_loss": 0.6341109871864319, | |
| "eval_precision_negative": 0.6851374570446735, | |
| "eval_precision_neutral": 0.7632635806383429, | |
| "eval_precision_positive": 0.6024531024531025, | |
| "eval_recall_negative": 0.7029528426619657, | |
| "eval_recall_neutral": 0.7538622129436325, | |
| "eval_recall_positive": 0.6024531024531025, | |
| "eval_runtime": 13.5517, | |
| "eval_samples_per_second": 623.169, | |
| "eval_steps_per_second": 3.247, | |
| "step": 1080 | |
| }, | |
| { | |
| "epoch": 0.94, | |
| "learning_rate": 1.8114478114478116e-05, | |
| "loss": 0.6387, | |
| "step": 1120 | |
| }, | |
| { | |
| "epoch": 0.94, | |
| "eval_accuracy": 0.7132030787448195, | |
| "eval_f1_macro": 0.6812920768310707, | |
| "eval_f1_negative": 0.6735266604303087, | |
| "eval_f1_neutral": 0.7610456176319835, | |
| "eval_f1_positive": 0.60930395243092, | |
| "eval_loss": 0.6404346227645874, | |
| "eval_precision_negative": 0.7174887892376681, | |
| "eval_precision_neutral": 0.7476334340382679, | |
| "eval_precision_positive": 0.5913102511880516, | |
| "eval_recall_negative": 0.6346408109299251, | |
| "eval_recall_neutral": 0.7749478079331942, | |
| "eval_recall_positive": 0.6284271284271284, | |
| "eval_runtime": 13.5098, | |
| "eval_samples_per_second": 625.102, | |
| "eval_steps_per_second": 3.257, | |
| "step": 1120 | |
| }, | |
| { | |
| "epoch": 0.98, | |
| "learning_rate": 1.804713804713805e-05, | |
| "loss": 0.6483, | |
| "step": 1160 | |
| }, | |
| { | |
| "epoch": 0.98, | |
| "eval_accuracy": 0.7200710479573712, | |
| "eval_f1_macro": 0.6806619404824857, | |
| "eval_f1_negative": 0.6825213576541214, | |
| "eval_f1_neutral": 0.7708228674771426, | |
| "eval_f1_positive": 0.5886415963161934, | |
| "eval_loss": 0.6273576021194458, | |
| "eval_precision_negative": 0.7167798254122212, | |
| "eval_precision_neutral": 0.7429788882432694, | |
| "eval_precision_positive": 0.6286885245901639, | |
| "eval_recall_negative": 0.6513882767739092, | |
| "eval_recall_neutral": 0.8008350730688936, | |
| "eval_recall_positive": 0.5533910533910534, | |
| "eval_runtime": 13.5101, | |
| "eval_samples_per_second": 625.087, | |
| "eval_steps_per_second": 3.257, | |
| "step": 1160 | |
| }, | |
| { | |
| "epoch": 1.01, | |
| "learning_rate": 1.797979797979798e-05, | |
| "loss": 0.6418, | |
| "step": 1200 | |
| }, | |
| { | |
| "epoch": 1.01, | |
| "eval_accuracy": 0.7216104203670811, | |
| "eval_f1_macro": 0.6749026822057264, | |
| "eval_f1_negative": 0.6914728682170542, | |
| "eval_f1_neutral": 0.7730991818000399, | |
| "eval_f1_positive": 0.560135996600085, | |
| "eval_loss": 0.6303337812423706, | |
| "eval_precision_negative": 0.695013357079252, | |
| "eval_precision_neutral": 0.7404434250764526, | |
| "eval_precision_positive": 0.6814891416752844, | |
| "eval_recall_negative": 0.6879682679594535, | |
| "eval_recall_neutral": 0.808768267223382, | |
| "eval_recall_positive": 0.4754689754689755, | |
| "eval_runtime": 14.4031, | |
| "eval_samples_per_second": 586.332, | |
| "eval_steps_per_second": 3.055, | |
| "step": 1200 | |
| }, | |
| { | |
| "epoch": 1.04, | |
| "learning_rate": 1.7912457912457915e-05, | |
| "loss": 0.6201, | |
| "step": 1240 | |
| }, | |
| { | |
| "epoch": 1.04, | |
| "eval_accuracy": 0.7193605683836589, | |
| "eval_f1_macro": 0.6783071530429613, | |
| "eval_f1_negative": 0.6780135229657263, | |
| "eval_f1_neutral": 0.7719368378972615, | |
| "eval_f1_positive": 0.584971098265896, | |
| "eval_loss": 0.6306412220001221, | |
| "eval_precision_negative": 0.7198019801980198, | |
| "eval_precision_neutral": 0.7404141104294478, | |
| "eval_precision_positive": 0.6277915632754343, | |
| "eval_recall_negative": 0.6408109299250772, | |
| "eval_recall_neutral": 0.8062630480167015, | |
| "eval_recall_positive": 0.5476190476190477, | |
| "eval_runtime": 13.6129, | |
| "eval_samples_per_second": 620.369, | |
| "eval_steps_per_second": 3.232, | |
| "step": 1240 | |
| }, | |
| { | |
| "epoch": 1.08, | |
| "learning_rate": 1.7845117845117846e-05, | |
| "loss": 0.5971, | |
| "step": 1280 | |
| }, | |
| { | |
| "epoch": 1.08, | |
| "eval_accuracy": 0.7166370633510953, | |
| "eval_f1_macro": 0.6745910338462799, | |
| "eval_f1_negative": 0.6869394005688033, | |
| "eval_f1_neutral": 0.7662285136501515, | |
| "eval_f1_positive": 0.5706051873198847, | |
| "eval_loss": 0.6360566020011902, | |
| "eval_precision_negative": 0.682015638575152, | |
| "eval_precision_neutral": 0.7429411764705882, | |
| "eval_precision_positive": 0.6644295302013423, | |
| "eval_recall_negative": 0.6919347730277655, | |
| "eval_recall_neutral": 0.7910229645093946, | |
| "eval_recall_positive": 0.5, | |
| "eval_runtime": 13.5493, | |
| "eval_samples_per_second": 623.278, | |
| "eval_steps_per_second": 3.247, | |
| "step": 1280 | |
| }, | |
| { | |
| "epoch": 1.11, | |
| "learning_rate": 1.7777777777777777e-05, | |
| "loss": 0.6101, | |
| "step": 1320 | |
| }, | |
| { | |
| "epoch": 1.11, | |
| "eval_accuracy": 0.7226761397276495, | |
| "eval_f1_macro": 0.6791712549911954, | |
| "eval_f1_negative": 0.6990124516960068, | |
| "eval_f1_neutral": 0.7709451929895654, | |
| "eval_f1_positive": 0.5675561202880136, | |
| "eval_loss": 0.6358277201652527, | |
| "eval_precision_negative": 0.6814566764336543, | |
| "eval_precision_neutral": 0.748868333005314, | |
| "eval_precision_positive": 0.6871794871794872, | |
| "eval_recall_negative": 0.7174966945791097, | |
| "eval_recall_neutral": 0.7943632567849687, | |
| "eval_recall_positive": 0.4834054834054834, | |
| "eval_runtime": 13.4061, | |
| "eval_samples_per_second": 629.938, | |
| "eval_steps_per_second": 3.282, | |
| "step": 1320 | |
| }, | |
| { | |
| "epoch": 1.14, | |
| "learning_rate": 1.771043771043771e-05, | |
| "loss": 0.5977, | |
| "step": 1360 | |
| }, | |
| { | |
| "epoch": 1.14, | |
| "eval_accuracy": 0.7124925991711072, | |
| "eval_f1_macro": 0.6812595953156201, | |
| "eval_f1_negative": 0.6902101028162717, | |
| "eval_f1_neutral": 0.756903198916328, | |
| "eval_f1_positive": 0.5966654842142604, | |
| "eval_loss": 0.640369713306427, | |
| "eval_precision_negative": 0.7002267573696145, | |
| "eval_precision_neutral": 0.7555648013313917, | |
| "eval_precision_positive": 0.586880669923238, | |
| "eval_recall_negative": 0.6804759806081975, | |
| "eval_recall_neutral": 0.7582463465553236, | |
| "eval_recall_positive": 0.6067821067821068, | |
| "eval_runtime": 13.458, | |
| "eval_samples_per_second": 627.51, | |
| "eval_steps_per_second": 3.269, | |
| "step": 1360 | |
| }, | |
| { | |
| "epoch": 1.18, | |
| "learning_rate": 1.7643097643097645e-05, | |
| "loss": 0.6229, | |
| "step": 1400 | |
| }, | |
| { | |
| "epoch": 1.18, | |
| "eval_accuracy": 0.720307874481942, | |
| "eval_f1_macro": 0.6787577486913711, | |
| "eval_f1_negative": 0.6789838337182449, | |
| "eval_f1_neutral": 0.7721746063384493, | |
| "eval_f1_positive": 0.5851148060174189, | |
| "eval_loss": 0.625924825668335, | |
| "eval_precision_negative": 0.7132459970887919, | |
| "eval_precision_neutral": 0.7387490465293669, | |
| "eval_precision_positive": 0.6482456140350877, | |
| "eval_recall_negative": 0.6478624944909652, | |
| "eval_recall_neutral": 0.808768267223382, | |
| "eval_recall_positive": 0.5331890331890332, | |
| "eval_runtime": 13.413, | |
| "eval_samples_per_second": 629.615, | |
| "eval_steps_per_second": 3.28, | |
| "step": 1400 | |
| }, | |
| { | |
| "epoch": 1.21, | |
| "learning_rate": 1.7575757575757576e-05, | |
| "loss": 0.5971, | |
| "step": 1440 | |
| }, | |
| { | |
| "epoch": 1.21, | |
| "eval_accuracy": 0.7111900532859681, | |
| "eval_f1_macro": 0.685070727390424, | |
| "eval_f1_negative": 0.6965195246179966, | |
| "eval_f1_neutral": 0.7495985440530993, | |
| "eval_f1_positive": 0.6090941135001762, | |
| "eval_loss": 0.6486834287643433, | |
| "eval_precision_negative": 0.6717151043798608, | |
| "eval_precision_neutral": 0.7692814765985497, | |
| "eval_precision_positive": 0.5954514128187457, | |
| "eval_recall_negative": 0.7232260907888938, | |
| "eval_recall_neutral": 0.7308977035490606, | |
| "eval_recall_positive": 0.6233766233766234, | |
| "eval_runtime": 13.4217, | |
| "eval_samples_per_second": 629.204, | |
| "eval_steps_per_second": 3.278, | |
| "step": 1440 | |
| }, | |
| { | |
| "epoch": 1.25, | |
| "learning_rate": 1.750841750841751e-05, | |
| "loss": 0.6006, | |
| "step": 1480 | |
| }, | |
| { | |
| "epoch": 1.25, | |
| "eval_accuracy": 0.7155713439905269, | |
| "eval_f1_macro": 0.683204217410409, | |
| "eval_f1_negative": 0.6757380073800737, | |
| "eval_f1_neutral": 0.7631821439541312, | |
| "eval_f1_positive": 0.6106925008970219, | |
| "eval_loss": 0.6353930830955505, | |
| "eval_precision_negative": 0.7087566521528785, | |
| "eval_precision_neutral": 0.7488446855535463, | |
| "eval_precision_positive": 0.6074232690935046, | |
| "eval_recall_negative": 0.6456588805641251, | |
| "eval_recall_neutral": 0.7780793319415449, | |
| "eval_recall_positive": 0.613997113997114, | |
| "eval_runtime": 13.4559, | |
| "eval_samples_per_second": 627.605, | |
| "eval_steps_per_second": 3.27, | |
| "step": 1480 | |
| }, | |
| { | |
| "epoch": 1.28, | |
| "learning_rate": 1.7441077441077444e-05, | |
| "loss": 0.6104, | |
| "step": 1520 | |
| }, | |
| { | |
| "epoch": 1.28, | |
| "eval_accuracy": 0.7127294256956779, | |
| "eval_f1_macro": 0.6839464489013288, | |
| "eval_f1_negative": 0.6825213576541214, | |
| "eval_f1_neutral": 0.7576642335766423, | |
| "eval_f1_positive": 0.6116537554732233, | |
| "eval_loss": 0.6454949975013733, | |
| "eval_precision_negative": 0.7167798254122212, | |
| "eval_precision_neutral": 0.756875, | |
| "eval_precision_positive": 0.5735944409349337, | |
| "eval_recall_negative": 0.6513882767739092, | |
| "eval_recall_neutral": 0.758455114822547, | |
| "eval_recall_positive": 0.6551226551226551, | |
| "eval_runtime": 13.4867, | |
| "eval_samples_per_second": 626.174, | |
| "eval_steps_per_second": 3.262, | |
| "step": 1520 | |
| }, | |
| { | |
| "epoch": 1.31, | |
| "learning_rate": 1.7373737373737375e-05, | |
| "loss": 0.6101, | |
| "step": 1560 | |
| }, | |
| { | |
| "epoch": 1.31, | |
| "eval_accuracy": 0.7206631142687981, | |
| "eval_f1_macro": 0.6779869326137852, | |
| "eval_f1_negative": 0.6807543740059078, | |
| "eval_f1_neutral": 0.772482552342971, | |
| "eval_f1_positive": 0.5807238714924766, | |
| "eval_loss": 0.6268090605735779, | |
| "eval_precision_negative": 0.702626641651032, | |
| "eval_precision_neutral": 0.7393129770992366, | |
| "eval_precision_positive": 0.6654240447343895, | |
| "eval_recall_negative": 0.6602027324812693, | |
| "eval_recall_neutral": 0.808768267223382, | |
| "eval_recall_positive": 0.5151515151515151, | |
| "eval_runtime": 13.4458, | |
| "eval_samples_per_second": 628.077, | |
| "eval_steps_per_second": 3.272, | |
| "step": 1560 | |
| }, | |
| { | |
| "epoch": 1.35, | |
| "learning_rate": 1.7306397306397305e-05, | |
| "loss": 0.6022, | |
| "step": 1600 | |
| }, | |
| { | |
| "epoch": 1.35, | |
| "eval_accuracy": 0.7143872113676731, | |
| "eval_f1_macro": 0.6836129674253361, | |
| "eval_f1_negative": 0.6836007130124777, | |
| "eval_f1_neutral": 0.7594515995014541, | |
| "eval_f1_positive": 0.6077865897620764, | |
| "eval_loss": 0.6394125819206238, | |
| "eval_precision_negative": 0.6913023884632717, | |
| "eval_precision_neutral": 0.7556841670111616, | |
| "eval_precision_positive": 0.6073487031700289, | |
| "eval_recall_negative": 0.6760687527545174, | |
| "eval_recall_neutral": 0.7632567849686848, | |
| "eval_recall_positive": 0.6082251082251082, | |
| "eval_runtime": 13.4382, | |
| "eval_samples_per_second": 628.432, | |
| "eval_steps_per_second": 3.274, | |
| "step": 1600 | |
| }, | |
| { | |
| "epoch": 1.38, | |
| "learning_rate": 1.723905723905724e-05, | |
| "loss": 0.6236, | |
| "step": 1640 | |
| }, | |
| { | |
| "epoch": 1.38, | |
| "eval_accuracy": 0.7134399052693902, | |
| "eval_f1_macro": 0.6861857480530462, | |
| "eval_f1_negative": 0.683572710951526, | |
| "eval_f1_neutral": 0.7565409267626353, | |
| "eval_f1_positive": 0.6184436064449776, | |
| "eval_loss": 0.6394263505935669, | |
| "eval_precision_negative": 0.6963877457704618, | |
| "eval_precision_neutral": 0.7615823989845568, | |
| "eval_precision_positive": 0.589157413455258, | |
| "eval_recall_negative": 0.6712208021154694, | |
| "eval_recall_neutral": 0.7515657620041754, | |
| "eval_recall_positive": 0.6507936507936508, | |
| "eval_runtime": 13.4189, | |
| "eval_samples_per_second": 629.337, | |
| "eval_steps_per_second": 3.279, | |
| "step": 1640 | |
| }, | |
| { | |
| "epoch": 1.41, | |
| "learning_rate": 1.7171717171717173e-05, | |
| "loss": 0.6039, | |
| "step": 1680 | |
| }, | |
| { | |
| "epoch": 1.41, | |
| "eval_accuracy": 0.7182948490230906, | |
| "eval_f1_macro": 0.6829107741796993, | |
| "eval_f1_negative": 0.6881057268722467, | |
| "eval_f1_neutral": 0.7655158240854912, | |
| "eval_f1_positive": 0.5951107715813598, | |
| "eval_loss": 0.6307365298271179, | |
| "eval_precision_negative": 0.6878027300748569, | |
| "eval_precision_neutral": 0.7537434237150951, | |
| "eval_precision_positive": 0.6323051948051948, | |
| "eval_recall_negative": 0.6884089907448215, | |
| "eval_recall_neutral": 0.7776617954070981, | |
| "eval_recall_positive": 0.562049062049062, | |
| "eval_runtime": 13.423, | |
| "eval_samples_per_second": 629.145, | |
| "eval_steps_per_second": 3.278, | |
| "step": 1680 | |
| }, | |
| { | |
| "epoch": 1.45, | |
| "learning_rate": 1.7104377104377104e-05, | |
| "loss": 0.6059, | |
| "step": 1720 | |
| }, | |
| { | |
| "epoch": 1.45, | |
| "eval_accuracy": 0.7173475429248076, | |
| "eval_f1_macro": 0.6865160173058559, | |
| "eval_f1_negative": 0.6937445699391833, | |
| "eval_f1_neutral": 0.7605015673981192, | |
| "eval_f1_positive": 0.6053019145802652, | |
| "eval_loss": 0.6336551904678345, | |
| "eval_precision_negative": 0.6839400428265524, | |
| "eval_precision_neutral": 0.7612970711297071, | |
| "eval_precision_positive": 0.6180451127819548, | |
| "eval_recall_negative": 0.7038342882327017, | |
| "eval_recall_neutral": 0.7597077244258873, | |
| "eval_recall_positive": 0.5930735930735931, | |
| "eval_runtime": 13.4767, | |
| "eval_samples_per_second": 626.636, | |
| "eval_steps_per_second": 3.265, | |
| "step": 1720 | |
| }, | |
| { | |
| "epoch": 1.48, | |
| "learning_rate": 1.7037037037037038e-05, | |
| "loss": 0.6042, | |
| "step": 1760 | |
| }, | |
| { | |
| "epoch": 1.48, | |
| "eval_accuracy": 0.7197158081705151, | |
| "eval_f1_macro": 0.685440373432607, | |
| "eval_f1_negative": 0.694493006993007, | |
| "eval_f1_neutral": 0.7645846217274789, | |
| "eval_f1_positive": 0.5972434915773354, | |
| "eval_loss": 0.63006192445755, | |
| "eval_precision_negative": 0.6887732986562636, | |
| "eval_precision_neutral": 0.7550895765472313, | |
| "eval_precision_positive": 0.636215334420881, | |
| "eval_recall_negative": 0.7003085059497576, | |
| "eval_recall_neutral": 0.774321503131524, | |
| "eval_recall_positive": 0.5627705627705628, | |
| "eval_runtime": 13.4204, | |
| "eval_samples_per_second": 629.266, | |
| "eval_steps_per_second": 3.279, | |
| "step": 1760 | |
| }, | |
| { | |
| "epoch": 1.52, | |
| "learning_rate": 1.6969696969696972e-05, | |
| "loss": 0.5907, | |
| "step": 1800 | |
| }, | |
| { | |
| "epoch": 1.52, | |
| "eval_accuracy": 0.7238602723505032, | |
| "eval_f1_macro": 0.6788816276493144, | |
| "eval_f1_negative": 0.6713483146067416, | |
| "eval_f1_neutral": 0.7784207945071114, | |
| "eval_f1_positive": 0.58687577383409, | |
| "eval_loss": 0.6279187202453613, | |
| "eval_precision_negative": 0.7159261108337494, | |
| "eval_precision_neutral": 0.7341350601295097, | |
| "eval_precision_positive": 0.6856316297010607, | |
| "eval_recall_negative": 0.6319964742177171, | |
| "eval_recall_neutral": 0.82839248434238, | |
| "eval_recall_positive": 0.512987012987013, | |
| "eval_runtime": 13.4379, | |
| "eval_samples_per_second": 628.446, | |
| "eval_steps_per_second": 3.274, | |
| "step": 1800 | |
| }, | |
| { | |
| "epoch": 1.55, | |
| "learning_rate": 1.6902356902356903e-05, | |
| "loss": 0.6135, | |
| "step": 1840 | |
| }, | |
| { | |
| "epoch": 1.55, | |
| "eval_accuracy": 0.7229129662522202, | |
| "eval_f1_macro": 0.6795419420133372, | |
| "eval_f1_negative": 0.6882803943044906, | |
| "eval_f1_neutral": 0.7737461051361945, | |
| "eval_f1_positive": 0.5765993265993266, | |
| "eval_loss": 0.6268677711486816, | |
| "eval_precision_negative": 0.6842334494773519, | |
| "eval_precision_neutral": 0.7460748207016864, | |
| "eval_precision_positive": 0.6919191919191919, | |
| "eval_recall_negative": 0.6923754958131335, | |
| "eval_recall_neutral": 0.8035490605427975, | |
| "eval_recall_positive": 0.49422799422799424, | |
| "eval_runtime": 13.44, | |
| "eval_samples_per_second": 628.349, | |
| "eval_steps_per_second": 3.274, | |
| "step": 1840 | |
| }, | |
| { | |
| "epoch": 1.58, | |
| "learning_rate": 1.6835016835016837e-05, | |
| "loss": 0.5996, | |
| "step": 1880 | |
| }, | |
| { | |
| "epoch": 1.58, | |
| "eval_accuracy": 0.7220840734162226, | |
| "eval_f1_macro": 0.6869855176473937, | |
| "eval_f1_negative": 0.6864864864864865, | |
| "eval_f1_neutral": 0.7696068445711958, | |
| "eval_f1_positive": 0.6048632218844986, | |
| "eval_loss": 0.6290135979652405, | |
| "eval_precision_negative": 0.7019806540764625, | |
| "eval_precision_neutral": 0.7513922036595068, | |
| "eval_precision_positive": 0.6388443017656501, | |
| "eval_recall_negative": 0.6716615249008374, | |
| "eval_recall_neutral": 0.7887265135699374, | |
| "eval_recall_positive": 0.5743145743145743, | |
| "eval_runtime": 13.4252, | |
| "eval_samples_per_second": 629.039, | |
| "eval_steps_per_second": 3.277, | |
| "step": 1880 | |
| }, | |
| { | |
| "epoch": 1.62, | |
| "learning_rate": 1.6767676767676768e-05, | |
| "loss": 0.6136, | |
| "step": 1920 | |
| }, | |
| { | |
| "epoch": 1.62, | |
| "eval_accuracy": 0.7223208999407934, | |
| "eval_f1_macro": 0.6908988856510865, | |
| "eval_f1_negative": 0.7006585935840238, | |
| "eval_f1_neutral": 0.7644044755829762, | |
| "eval_f1_positive": 0.6076335877862595, | |
| "eval_loss": 0.6263943910598755, | |
| "eval_precision_negative": 0.6763740771123872, | |
| "eval_precision_neutral": 0.7657657657657657, | |
| "eval_precision_positive": 0.6450567260940032, | |
| "eval_recall_negative": 0.7267518730718379, | |
| "eval_recall_neutral": 0.7630480167014614, | |
| "eval_recall_positive": 0.5743145743145743, | |
| "eval_runtime": 13.5533, | |
| "eval_samples_per_second": 623.095, | |
| "eval_steps_per_second": 3.246, | |
| "step": 1920 | |
| }, | |
| { | |
| "epoch": 1.65, | |
| "learning_rate": 1.6700336700336702e-05, | |
| "loss": 0.6036, | |
| "step": 1960 | |
| }, | |
| { | |
| "epoch": 1.65, | |
| "eval_accuracy": 0.7141503848431024, | |
| "eval_f1_macro": 0.6879732554886911, | |
| "eval_f1_negative": 0.6988408851422551, | |
| "eval_f1_neutral": 0.7530068728522336, | |
| "eval_f1_positive": 0.6120720084715848, | |
| "eval_loss": 0.6364882588386536, | |
| "eval_precision_negative": 0.6696284329563813, | |
| "eval_precision_neutral": 0.7753206545776206, | |
| "eval_precision_positive": 0.5991706979958535, | |
| "eval_recall_negative": 0.7307183781401498, | |
| "eval_recall_neutral": 0.7319415448851775, | |
| "eval_recall_positive": 0.6255411255411255, | |
| "eval_runtime": 13.4324, | |
| "eval_samples_per_second": 628.703, | |
| "eval_steps_per_second": 3.276, | |
| "step": 1960 | |
| }, | |
| { | |
| "epoch": 1.68, | |
| "learning_rate": 1.6632996632996633e-05, | |
| "loss": 0.6123, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 1.68, | |
| "eval_accuracy": 0.7198342214328005, | |
| "eval_f1_macro": 0.6811378179180303, | |
| "eval_f1_negative": 0.694331550802139, | |
| "eval_f1_neutral": 0.7660226924256361, | |
| "eval_f1_positive": 0.5830592105263157, | |
| "eval_loss": 0.6256130933761597, | |
| "eval_precision_negative": 0.6745635910224439, | |
| "eval_precision_neutral": 0.7504506308832365, | |
| "eval_precision_positive": 0.6778202676864244, | |
| "eval_recall_negative": 0.7152930806522697, | |
| "eval_recall_neutral": 0.7822546972860125, | |
| "eval_recall_positive": 0.5115440115440115, | |
| "eval_runtime": 13.4059, | |
| "eval_samples_per_second": 629.947, | |
| "eval_steps_per_second": 3.282, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 1.72, | |
| "learning_rate": 1.6565656565656567e-05, | |
| "loss": 0.5898, | |
| "step": 2040 | |
| }, | |
| { | |
| "epoch": 1.72, | |
| "eval_accuracy": 0.7255180580224985, | |
| "eval_f1_macro": 0.6783018381472949, | |
| "eval_f1_negative": 0.6911698789780368, | |
| "eval_f1_neutral": 0.777568611909244, | |
| "eval_f1_positive": 0.5661670235546039, | |
| "eval_loss": 0.6203241944313049, | |
| "eval_precision_negative": 0.7031463748290013, | |
| "eval_precision_neutral": 0.7399585140486518, | |
| "eval_precision_positive": 0.6965226554267651, | |
| "eval_recall_negative": 0.6795945350374615, | |
| "eval_recall_neutral": 0.8192066805845512, | |
| "eval_recall_positive": 0.4769119769119769, | |
| "eval_runtime": 13.429, | |
| "eval_samples_per_second": 628.864, | |
| "eval_steps_per_second": 3.276, | |
| "step": 2040 | |
| }, | |
| { | |
| "epoch": 1.75, | |
| "learning_rate": 1.64983164983165e-05, | |
| "loss": 0.585, | |
| "step": 2080 | |
| }, | |
| { | |
| "epoch": 1.75, | |
| "eval_accuracy": 0.7277679100059207, | |
| "eval_f1_macro": 0.6856054160655031, | |
| "eval_f1_negative": 0.6840989399293286, | |
| "eval_f1_neutral": 0.7798319327731092, | |
| "eval_f1_positive": 0.5928853754940712, | |
| "eval_loss": 0.62270188331604, | |
| "eval_precision_negative": 0.7348178137651822, | |
| "eval_precision_neutral": 0.7406572769953051, | |
| "eval_precision_positive": 0.6555944055944056, | |
| "eval_recall_negative": 0.6399294843543412, | |
| "eval_recall_neutral": 0.8233820459290188, | |
| "eval_recall_positive": 0.5411255411255411, | |
| "eval_runtime": 13.4336, | |
| "eval_samples_per_second": 628.646, | |
| "eval_steps_per_second": 3.275, | |
| "step": 2080 | |
| }, | |
| { | |
| "epoch": 1.78, | |
| "learning_rate": 1.6430976430976432e-05, | |
| "loss": 0.6092, | |
| "step": 2120 | |
| }, | |
| { | |
| "epoch": 1.78, | |
| "eval_accuracy": 0.7194789816459444, | |
| "eval_f1_macro": 0.691219851642046, | |
| "eval_f1_negative": 0.6904706700672385, | |
| "eval_f1_neutral": 0.7632427932146946, | |
| "eval_f1_positive": 0.6199460916442048, | |
| "eval_loss": 0.6305855512619019, | |
| "eval_precision_negative": 0.7284735812133072, | |
| "eval_precision_neutral": 0.7609462544096286, | |
| "eval_precision_positive": 0.5815423514538559, | |
| "eval_recall_negative": 0.6562362274129573, | |
| "eval_recall_neutral": 0.765553235908142, | |
| "eval_recall_positive": 0.6637806637806638, | |
| "eval_runtime": 13.4354, | |
| "eval_samples_per_second": 628.563, | |
| "eval_steps_per_second": 3.275, | |
| "step": 2120 | |
| }, | |
| { | |
| "epoch": 1.82, | |
| "learning_rate": 1.6363636363636366e-05, | |
| "loss": 0.5902, | |
| "step": 2160 | |
| }, | |
| { | |
| "epoch": 1.82, | |
| "eval_accuracy": 0.7217288336293665, | |
| "eval_f1_macro": 0.6903674148692266, | |
| "eval_f1_negative": 0.699802067297119, | |
| "eval_f1_neutral": 0.7650182196772514, | |
| "eval_f1_positive": 0.606281957633309, | |
| "eval_loss": 0.6268182992935181, | |
| "eval_precision_negative": 0.6984196663740123, | |
| "eval_precision_neutral": 0.7630321910695742, | |
| "eval_precision_positive": 0.613905325443787, | |
| "eval_recall_negative": 0.7011899515204936, | |
| "eval_recall_neutral": 0.7670146137787056, | |
| "eval_recall_positive": 0.5988455988455988, | |
| "eval_runtime": 13.453, | |
| "eval_samples_per_second": 627.739, | |
| "eval_steps_per_second": 3.271, | |
| "step": 2160 | |
| }, | |
| { | |
| "epoch": 1.85, | |
| "learning_rate": 1.6296296296296297e-05, | |
| "loss": 0.6077, | |
| "step": 2200 | |
| }, | |
| { | |
| "epoch": 1.85, | |
| "eval_accuracy": 0.7239786856127887, | |
| "eval_f1_macro": 0.6863881436307776, | |
| "eval_f1_negative": 0.6860517946388005, | |
| "eval_f1_neutral": 0.7731126362535325, | |
| "eval_f1_positive": 0.5999999999999999, | |
| "eval_loss": 0.6207541227340698, | |
| "eval_precision_negative": 0.7079231129864041, | |
| "eval_precision_neutral": 0.7483391949980461, | |
| "eval_precision_positive": 0.6482412060301508, | |
| "eval_recall_negative": 0.6654914059056853, | |
| "eval_recall_neutral": 0.7995824634655533, | |
| "eval_recall_positive": 0.5584415584415584, | |
| "eval_runtime": 13.4434, | |
| "eval_samples_per_second": 628.189, | |
| "eval_steps_per_second": 3.273, | |
| "step": 2200 | |
| }, | |
| { | |
| "epoch": 1.89, | |
| "learning_rate": 1.622895622895623e-05, | |
| "loss": 0.5971, | |
| "step": 2240 | |
| }, | |
| { | |
| "epoch": 1.89, | |
| "eval_accuracy": 0.7297809354647721, | |
| "eval_f1_macro": 0.6928803015060957, | |
| "eval_f1_negative": 0.6937485894831867, | |
| "eval_f1_neutral": 0.7777216213484281, | |
| "eval_f1_positive": 0.6071706936866719, | |
| "eval_loss": 0.6181867122650146, | |
| "eval_precision_negative": 0.7109158186864015, | |
| "eval_precision_neutral": 0.7538702723887909, | |
| "eval_precision_positive": 0.6601694915254237, | |
| "eval_recall_negative": 0.6773909211106214, | |
| "eval_recall_neutral": 0.8031315240083508, | |
| "eval_recall_positive": 0.562049062049062, | |
| "eval_runtime": 13.5165, | |
| "eval_samples_per_second": 624.792, | |
| "eval_steps_per_second": 3.255, | |
| "step": 2240 | |
| }, | |
| { | |
| "epoch": 1.92, | |
| "learning_rate": 1.616161616161616e-05, | |
| "loss": 0.6053, | |
| "step": 2280 | |
| }, | |
| { | |
| "epoch": 1.92, | |
| "eval_accuracy": 0.7235050325636472, | |
| "eval_f1_macro": 0.6869805131510361, | |
| "eval_f1_negative": 0.6891179839633448, | |
| "eval_f1_neutral": 0.7715961966417155, | |
| "eval_f1_positive": 0.6002273588480483, | |
| "eval_loss": 0.6221389174461365, | |
| "eval_precision_negative": 0.7175572519083969, | |
| "eval_precision_neutral": 0.7484301412872841, | |
| "eval_precision_positive": 0.6320830007980845, | |
| "eval_recall_negative": 0.6628470691934774, | |
| "eval_recall_neutral": 0.7962421711899791, | |
| "eval_recall_positive": 0.5714285714285714, | |
| "eval_runtime": 13.4474, | |
| "eval_samples_per_second": 628.005, | |
| "eval_steps_per_second": 3.272, | |
| "step": 2280 | |
| }, | |
| { | |
| "epoch": 1.95, | |
| "learning_rate": 1.6094276094276096e-05, | |
| "loss": 0.5959, | |
| "step": 2320 | |
| }, | |
| { | |
| "epoch": 1.95, | |
| "eval_accuracy": 0.7199526346950859, | |
| "eval_f1_macro": 0.682651116707718, | |
| "eval_f1_negative": 0.6665057915057916, | |
| "eval_f1_neutral": 0.7722100219604712, | |
| "eval_f1_positive": 0.6092375366568915, | |
| "eval_loss": 0.6313912272453308, | |
| "eval_precision_negative": 0.7365333333333334, | |
| "eval_precision_neutral": 0.7398622800306044, | |
| "eval_precision_positive": 0.6192250372578242, | |
| "eval_recall_negative": 0.6086381665932129, | |
| "eval_recall_neutral": 0.8075156576200417, | |
| "eval_recall_positive": 0.5995670995670995, | |
| "eval_runtime": 13.532, | |
| "eval_samples_per_second": 624.078, | |
| "eval_steps_per_second": 3.252, | |
| "step": 2320 | |
| }, | |
| { | |
| "epoch": 1.99, | |
| "learning_rate": 1.602693602693603e-05, | |
| "loss": 0.6196, | |
| "step": 2360 | |
| }, | |
| { | |
| "epoch": 1.99, | |
| "eval_accuracy": 0.709295441089402, | |
| "eval_f1_macro": 0.6881296895840747, | |
| "eval_f1_negative": 0.700795870079587, | |
| "eval_f1_neutral": 0.7440385036097135, | |
| "eval_f1_positive": 0.6195546950629235, | |
| "eval_loss": 0.6360026001930237, | |
| "eval_precision_negative": 0.684453781512605, | |
| "eval_precision_neutral": 0.7814797794117647, | |
| "eval_precision_positive": 0.5604203152364273, | |
| "eval_recall_negative": 0.7179374173644777, | |
| "eval_recall_neutral": 0.7100208768267223, | |
| "eval_recall_positive": 0.6926406926406926, | |
| "eval_runtime": 13.7523, | |
| "eval_samples_per_second": 614.079, | |
| "eval_steps_per_second": 3.199, | |
| "step": 2360 | |
| }, | |
| { | |
| "epoch": 2.02, | |
| "learning_rate": 1.595959595959596e-05, | |
| "loss": 0.5686, | |
| "step": 2400 | |
| }, | |
| { | |
| "epoch": 2.02, | |
| "eval_accuracy": 0.7191237418590882, | |
| "eval_f1_macro": 0.6870370031512542, | |
| "eval_f1_negative": 0.6933101650738488, | |
| "eval_f1_neutral": 0.7630622208372286, | |
| "eval_f1_positive": 0.6047386235426853, | |
| "eval_loss": 0.6405708193778992, | |
| "eval_precision_negative": 0.6835117773019272, | |
| "eval_precision_neutral": 0.7593549720901385, | |
| "eval_precision_positive": 0.631578947368421, | |
| "eval_recall_negative": 0.7033935654473337, | |
| "eval_recall_neutral": 0.7668058455114822, | |
| "eval_recall_positive": 0.5800865800865801, | |
| "eval_runtime": 13.5092, | |
| "eval_samples_per_second": 625.128, | |
| "eval_steps_per_second": 3.257, | |
| "step": 2400 | |
| }, | |
| { | |
| "epoch": 2.05, | |
| "learning_rate": 1.5892255892255895e-05, | |
| "loss": 0.5586, | |
| "step": 2440 | |
| }, | |
| { | |
| "epoch": 2.05, | |
| "eval_accuracy": 0.7223208999407934, | |
| "eval_f1_macro": 0.6862310990226811, | |
| "eval_f1_negative": 0.6942959001782532, | |
| "eval_f1_neutral": 0.7689950980392158, | |
| "eval_f1_positive": 0.5954022988505746, | |
| "eval_loss": 0.6309220790863037, | |
| "eval_precision_negative": 0.7021180712032447, | |
| "eval_precision_neutral": 0.7526989204318273, | |
| "eval_precision_positive": 0.6348039215686274, | |
| "eval_recall_negative": 0.6866460996033495, | |
| "eval_recall_neutral": 0.7860125260960334, | |
| "eval_recall_positive": 0.5606060606060606, | |
| "eval_runtime": 13.5411, | |
| "eval_samples_per_second": 623.656, | |
| "eval_steps_per_second": 3.249, | |
| "step": 2440 | |
| }, | |
| { | |
| "epoch": 2.09, | |
| "learning_rate": 1.5824915824915825e-05, | |
| "loss": 0.5671, | |
| "step": 2480 | |
| }, | |
| { | |
| "epoch": 2.09, | |
| "eval_accuracy": 0.7205447010065127, | |
| "eval_f1_macro": 0.683056392123643, | |
| "eval_f1_negative": 0.6914449087310313, | |
| "eval_f1_neutral": 0.7678189048638727, | |
| "eval_f1_positive": 0.5899053627760252, | |
| "eval_loss": 0.6297855377197266, | |
| "eval_precision_negative": 0.6900790166812993, | |
| "eval_precision_neutral": 0.7504484751843731, | |
| "eval_precision_positive": 0.6504347826086957, | |
| "eval_recall_negative": 0.6928162185985015, | |
| "eval_recall_neutral": 0.7860125260960334, | |
| "eval_recall_positive": 0.5396825396825397, | |
| "eval_runtime": 13.5165, | |
| "eval_samples_per_second": 624.793, | |
| "eval_steps_per_second": 3.255, | |
| "step": 2480 | |
| }, | |
| { | |
| "epoch": 2.12, | |
| "learning_rate": 1.575757575757576e-05, | |
| "loss": 0.5458, | |
| "step": 2520 | |
| }, | |
| { | |
| "epoch": 2.12, | |
| "eval_accuracy": 0.7214920071047958, | |
| "eval_f1_macro": 0.6872366815721698, | |
| "eval_f1_negative": 0.6905083220872694, | |
| "eval_f1_neutral": 0.7679083094555873, | |
| "eval_f1_positive": 0.6032934131736527, | |
| "eval_loss": 0.63502436876297, | |
| "eval_precision_negative": 0.7050987597611392, | |
| "eval_precision_neutral": 0.7531112003211562, | |
| "eval_precision_positive": 0.6267496111975117, | |
| "eval_recall_negative": 0.6765094755398854, | |
| "eval_recall_neutral": 0.7832985386221294, | |
| "eval_recall_positive": 0.5815295815295816, | |
| "eval_runtime": 13.5006, | |
| "eval_samples_per_second": 625.526, | |
| "eval_steps_per_second": 3.259, | |
| "step": 2520 | |
| }, | |
| { | |
| "epoch": 2.15, | |
| "learning_rate": 1.569023569023569e-05, | |
| "loss": 0.5617, | |
| "step": 2560 | |
| }, | |
| { | |
| "epoch": 2.15, | |
| "eval_accuracy": 0.7103611604499704, | |
| "eval_f1_macro": 0.6868863746975769, | |
| "eval_f1_negative": 0.7016379846568526, | |
| "eval_f1_neutral": 0.7452902101709682, | |
| "eval_f1_positive": 0.6137309292649098, | |
| "eval_loss": 0.6412296891212463, | |
| "eval_precision_negative": 0.6624902114330462, | |
| "eval_precision_neutral": 0.7789665376735716, | |
| "eval_precision_positive": 0.5907877169559412, | |
| "eval_recall_negative": 0.745702952842662, | |
| "eval_recall_neutral": 0.7144050104384133, | |
| "eval_recall_positive": 0.6385281385281385, | |
| "eval_runtime": 13.561, | |
| "eval_samples_per_second": 622.74, | |
| "eval_steps_per_second": 3.245, | |
| "step": 2560 | |
| }, | |
| { | |
| "epoch": 2.19, | |
| "learning_rate": 1.5622895622895624e-05, | |
| "loss": 0.5582, | |
| "step": 2600 | |
| }, | |
| { | |
| "epoch": 2.19, | |
| "eval_accuracy": 0.7085849615156897, | |
| "eval_f1_macro": 0.687474213023077, | |
| "eval_f1_negative": 0.699581589958159, | |
| "eval_f1_neutral": 0.7421052631578948, | |
| "eval_f1_positive": 0.6207357859531774, | |
| "eval_loss": 0.6525644659996033, | |
| "eval_precision_negative": 0.6658701712465154, | |
| "eval_precision_neutral": 0.7815242494226328, | |
| "eval_precision_positive": 0.5785536159600998, | |
| "eval_recall_negative": 0.7368884971353019, | |
| "eval_recall_neutral": 0.7064718162839249, | |
| "eval_recall_positive": 0.6695526695526696, | |
| "eval_runtime": 13.5361, | |
| "eval_samples_per_second": 623.888, | |
| "eval_steps_per_second": 3.251, | |
| "step": 2600 | |
| }, | |
| { | |
| "epoch": 2.22, | |
| "learning_rate": 1.555555555555556e-05, | |
| "loss": 0.5543, | |
| "step": 2640 | |
| }, | |
| { | |
| "epoch": 2.22, | |
| "eval_accuracy": 0.7201894612196567, | |
| "eval_f1_macro": 0.6869432555451471, | |
| "eval_f1_negative": 0.7009306260575296, | |
| "eval_f1_neutral": 0.762918885061071, | |
| "eval_f1_positive": 0.5969802555168409, | |
| "eval_loss": 0.640322744846344, | |
| "eval_precision_negative": 0.6738511590077267, | |
| "eval_precision_neutral": 0.7629985383169764, | |
| "eval_precision_positive": 0.6441102756892231, | |
| "eval_recall_negative": 0.7302776553547818, | |
| "eval_recall_neutral": 0.762839248434238, | |
| "eval_recall_positive": 0.5562770562770563, | |
| "eval_runtime": 13.5133, | |
| "eval_samples_per_second": 624.941, | |
| "eval_steps_per_second": 3.256, | |
| "step": 2640 | |
| }, | |
| { | |
| "epoch": 2.26, | |
| "learning_rate": 1.548821548821549e-05, | |
| "loss": 0.558, | |
| "step": 2680 | |
| }, | |
| { | |
| "epoch": 2.26, | |
| "eval_accuracy": 0.7206631142687981, | |
| "eval_f1_macro": 0.6874230644596926, | |
| "eval_f1_negative": 0.697239536954586, | |
| "eval_f1_neutral": 0.7653250773993808, | |
| "eval_f1_positive": 0.5997045790251108, | |
| "eval_loss": 0.6337417364120483, | |
| "eval_precision_negative": 0.7044534412955465, | |
| "eval_precision_neutral": 0.756734693877551, | |
| "eval_precision_positive": 0.6142208774583964, | |
| "eval_recall_negative": 0.6901718818862935, | |
| "eval_recall_neutral": 0.7741127348643007, | |
| "eval_recall_positive": 0.5858585858585859, | |
| "eval_runtime": 13.5113, | |
| "eval_samples_per_second": 625.032, | |
| "eval_steps_per_second": 3.257, | |
| "step": 2680 | |
| }, | |
| { | |
| "epoch": 2.29, | |
| "learning_rate": 1.5420875420875423e-05, | |
| "loss": 0.5506, | |
| "step": 2720 | |
| }, | |
| { | |
| "epoch": 2.29, | |
| "eval_accuracy": 0.7171107164002368, | |
| "eval_f1_macro": 0.6895025450757618, | |
| "eval_f1_negative": 0.7093775262732418, | |
| "eval_f1_neutral": 0.753454231433506, | |
| "eval_f1_positive": 0.6056758775205378, | |
| "eval_loss": 0.6484044194221497, | |
| "eval_precision_negative": 0.6550951847704367, | |
| "eval_precision_neutral": 0.7800625838176128, | |
| "eval_precision_positive": 0.6277089783281734, | |
| "eval_recall_negative": 0.7734684883208461, | |
| "eval_recall_neutral": 0.7286012526096033, | |
| "eval_recall_positive": 0.5851370851370852, | |
| "eval_runtime": 13.5135, | |
| "eval_samples_per_second": 624.931, | |
| "eval_steps_per_second": 3.256, | |
| "step": 2720 | |
| }, | |
| { | |
| "epoch": 2.32, | |
| "learning_rate": 1.5353535353535354e-05, | |
| "loss": 0.5569, | |
| "step": 2760 | |
| }, | |
| { | |
| "epoch": 2.32, | |
| "eval_accuracy": 0.7167554766133807, | |
| "eval_f1_macro": 0.6895340612929335, | |
| "eval_f1_negative": 0.7063525452250736, | |
| "eval_f1_neutral": 0.7544910179640718, | |
| "eval_f1_positive": 0.6077586206896551, | |
| "eval_loss": 0.6315791606903076, | |
| "eval_precision_negative": 0.6756539235412475, | |
| "eval_precision_neutral": 0.7733450241122315, | |
| "eval_precision_positive": 0.6051502145922747, | |
| "eval_recall_negative": 0.7399735566328779, | |
| "eval_recall_neutral": 0.7365344467640919, | |
| "eval_recall_positive": 0.6103896103896104, | |
| "eval_runtime": 13.5058, | |
| "eval_samples_per_second": 625.287, | |
| "eval_steps_per_second": 3.258, | |
| "step": 2760 | |
| }, | |
| { | |
| "epoch": 2.36, | |
| "learning_rate": 1.5286195286195288e-05, | |
| "loss": 0.5469, | |
| "step": 2800 | |
| }, | |
| { | |
| "epoch": 2.36, | |
| "eval_accuracy": 0.7182948490230906, | |
| "eval_f1_macro": 0.69129222470535, | |
| "eval_f1_negative": 0.7031543764361813, | |
| "eval_f1_neutral": 0.7562953478446436, | |
| "eval_f1_positive": 0.6144269498352252, | |
| "eval_loss": 0.6461361646652222, | |
| "eval_precision_negative": 0.6683876092136616, | |
| "eval_precision_neutral": 0.7734613705805325, | |
| "eval_precision_positive": 0.6237918215613383, | |
| "eval_recall_negative": 0.7417364477743499, | |
| "eval_recall_neutral": 0.7398747390396659, | |
| "eval_recall_positive": 0.6053391053391053, | |
| "eval_runtime": 13.5002, | |
| "eval_samples_per_second": 625.546, | |
| "eval_steps_per_second": 3.259, | |
| "step": 2800 | |
| }, | |
| { | |
| "epoch": 2.39, | |
| "learning_rate": 1.521885521885522e-05, | |
| "loss": 0.5497, | |
| "step": 2840 | |
| }, | |
| { | |
| "epoch": 2.39, | |
| "eval_accuracy": 0.7205447010065127, | |
| "eval_f1_macro": 0.6901740903513232, | |
| "eval_f1_negative": 0.6989695242271432, | |
| "eval_f1_neutral": 0.7628887497390942, | |
| "eval_f1_positive": 0.608663997087732, | |
| "eval_loss": 0.6306228041648865, | |
| "eval_precision_negative": 0.6954624781849913, | |
| "eval_precision_neutral": 0.7627295492487479, | |
| "eval_precision_positive": 0.6142542248346804, | |
| "eval_recall_negative": 0.7025121198765977, | |
| "eval_recall_neutral": 0.7630480167014614, | |
| "eval_recall_positive": 0.6031746031746031, | |
| "eval_runtime": 13.5161, | |
| "eval_samples_per_second": 624.81, | |
| "eval_steps_per_second": 3.255, | |
| "step": 2840 | |
| }, | |
| { | |
| "epoch": 2.42, | |
| "learning_rate": 1.5151515151515153e-05, | |
| "loss": 0.5577, | |
| "step": 2880 | |
| }, | |
| { | |
| "epoch": 2.42, | |
| "eval_accuracy": 0.7149792776791001, | |
| "eval_f1_macro": 0.686526091020862, | |
| "eval_f1_negative": 0.6968478950708694, | |
| "eval_f1_neutral": 0.7555225148683093, | |
| "eval_f1_positive": 0.6072078631234074, | |
| "eval_loss": 0.6409549713134766, | |
| "eval_precision_negative": 0.6700569568755086, | |
| "eval_precision_neutral": 0.7689148292261133, | |
| "eval_precision_positive": 0.6127847171197649, | |
| "eval_recall_negative": 0.7258704275011018, | |
| "eval_recall_neutral": 0.7425887265135699, | |
| "eval_recall_positive": 0.6017316017316018, | |
| "eval_runtime": 13.6855, | |
| "eval_samples_per_second": 617.076, | |
| "eval_steps_per_second": 3.215, | |
| "step": 2880 | |
| }, | |
| { | |
| "epoch": 2.46, | |
| "learning_rate": 1.5084175084175085e-05, | |
| "loss": 0.557, | |
| "step": 2920 | |
| }, | |
| { | |
| "epoch": 2.46, | |
| "eval_accuracy": 0.7225577264653641, | |
| "eval_f1_macro": 0.6876490677339296, | |
| "eval_f1_negative": 0.7071207430340557, | |
| "eval_f1_neutral": 0.7645151166440004, | |
| "eval_f1_positive": 0.5913113435237329, | |
| "eval_loss": 0.6443095803260803, | |
| "eval_precision_negative": 0.6649844720496895, | |
| "eval_precision_neutral": 0.7661983644369889, | |
| "eval_precision_positive": 0.6681818181818182, | |
| "eval_recall_negative": 0.75495813133539, | |
| "eval_recall_neutral": 0.762839248434238, | |
| "eval_recall_positive": 0.5303030303030303, | |
| "eval_runtime": 13.5647, | |
| "eval_samples_per_second": 622.57, | |
| "eval_steps_per_second": 3.244, | |
| "step": 2920 | |
| }, | |
| { | |
| "epoch": 2.49, | |
| "learning_rate": 1.5016835016835018e-05, | |
| "loss": 0.5542, | |
| "step": 2960 | |
| }, | |
| { | |
| "epoch": 2.49, | |
| "eval_accuracy": 0.7161634103019539, | |
| "eval_f1_macro": 0.687092758801656, | |
| "eval_f1_negative": 0.7009579341940858, | |
| "eval_f1_neutral": 0.7560144773259526, | |
| "eval_f1_positive": 0.6043058648849294, | |
| "eval_loss": 0.6480274796485901, | |
| "eval_precision_negative": 0.6644295302013423, | |
| "eval_precision_neutral": 0.7712858384013901, | |
| "eval_precision_positive": 0.6223241590214067, | |
| "eval_recall_negative": 0.7417364477743499, | |
| "eval_recall_neutral": 0.7413361169102296, | |
| "eval_recall_positive": 0.5873015873015873, | |
| "eval_runtime": 13.5134, | |
| "eval_samples_per_second": 624.935, | |
| "eval_steps_per_second": 3.256, | |
| "step": 2960 | |
| }, | |
| { | |
| "epoch": 2.53, | |
| "learning_rate": 1.4949494949494952e-05, | |
| "loss": 0.567, | |
| "step": 3000 | |
| }, | |
| { | |
| "epoch": 2.53, | |
| "eval_accuracy": 0.7079928952042629, | |
| "eval_f1_macro": 0.6865435263558487, | |
| "eval_f1_negative": 0.7025898078529658, | |
| "eval_f1_neutral": 0.7416051965209732, | |
| "eval_f1_positive": 0.6154355746936071, | |
| "eval_loss": 0.6429863572120667, | |
| "eval_precision_negative": 0.6677252878126241, | |
| "eval_precision_neutral": 0.7845329606335896, | |
| "eval_precision_positive": 0.5688916105327618, | |
| "eval_recall_negative": 0.7412957249889819, | |
| "eval_recall_neutral": 0.7031315240083508, | |
| "eval_recall_positive": 0.6702741702741702, | |
| "eval_runtime": 13.5159, | |
| "eval_samples_per_second": 624.818, | |
| "eval_steps_per_second": 3.255, | |
| "step": 3000 | |
| }, | |
| { | |
| "epoch": 2.56, | |
| "learning_rate": 1.4882154882154884e-05, | |
| "loss": 0.5606, | |
| "step": 3040 | |
| }, | |
| { | |
| "epoch": 2.56, | |
| "eval_accuracy": 0.7155713439905269, | |
| "eval_f1_macro": 0.6890929890491521, | |
| "eval_f1_negative": 0.7017241379310344, | |
| "eval_f1_neutral": 0.7549994652978291, | |
| "eval_f1_positive": 0.6105553639185926, | |
| "eval_loss": 0.6457778811454773, | |
| "eval_precision_negative": 0.6866301138760017, | |
| "eval_precision_neutral": 0.7739530804648104, | |
| "eval_precision_positive": 0.5849306014540647, | |
| "eval_recall_negative": 0.7174966945791097, | |
| "eval_recall_neutral": 0.7369519832985386, | |
| "eval_recall_positive": 0.6385281385281385, | |
| "eval_runtime": 13.5186, | |
| "eval_samples_per_second": 624.694, | |
| "eval_steps_per_second": 3.255, | |
| "step": 3040 | |
| }, | |
| { | |
| "epoch": 2.59, | |
| "learning_rate": 1.4814814814814815e-05, | |
| "loss": 0.5492, | |
| "step": 3080 | |
| }, | |
| { | |
| "epoch": 2.59, | |
| "eval_accuracy": 0.713676731793961, | |
| "eval_f1_macro": 0.687090376547261, | |
| "eval_f1_negative": 0.6999178981937603, | |
| "eval_f1_neutral": 0.7514812021975654, | |
| "eval_f1_positive": 0.6098720292504571, | |
| "eval_loss": 0.646338164806366, | |
| "eval_precision_negative": 0.6550134460238187, | |
| "eval_precision_neutral": 0.7763187180057868, | |
| "eval_precision_positive": 0.6182357301704967, | |
| "eval_recall_negative": 0.751432349052446, | |
| "eval_recall_neutral": 0.7281837160751565, | |
| "eval_recall_positive": 0.6017316017316018, | |
| "eval_runtime": 13.5425, | |
| "eval_samples_per_second": 623.591, | |
| "eval_steps_per_second": 3.249, | |
| "step": 3080 | |
| }, | |
| { | |
| "epoch": 2.63, | |
| "learning_rate": 1.4747474747474747e-05, | |
| "loss": 0.5509, | |
| "step": 3120 | |
| }, | |
| { | |
| "epoch": 2.63, | |
| "eval_accuracy": 0.7187685020722321, | |
| "eval_f1_macro": 0.6907132499480086, | |
| "eval_f1_negative": 0.7029375258585022, | |
| "eval_f1_neutral": 0.7576566001493972, | |
| "eval_f1_positive": 0.6115456238361267, | |
| "eval_loss": 0.6359885334968567, | |
| "eval_precision_negative": 0.6623781676413255, | |
| "eval_precision_neutral": 0.7749399694389871, | |
| "eval_precision_positive": 0.6320246343341032, | |
| "eval_recall_negative": 0.748788012340238, | |
| "eval_recall_neutral": 0.7411273486430062, | |
| "eval_recall_positive": 0.5923520923520924, | |
| "eval_runtime": 13.4528, | |
| "eval_samples_per_second": 627.753, | |
| "eval_steps_per_second": 3.271, | |
| "step": 3120 | |
| }, | |
| { | |
| "epoch": 2.66, | |
| "learning_rate": 1.4680134680134681e-05, | |
| "loss": 0.5626, | |
| "step": 3160 | |
| }, | |
| { | |
| "epoch": 2.66, | |
| "eval_accuracy": 0.7175843694493783, | |
| "eval_f1_macro": 0.6878133884212742, | |
| "eval_f1_negative": 0.7006661115736886, | |
| "eval_f1_neutral": 0.7580354301474488, | |
| "eval_f1_positive": 0.6047386235426853, | |
| "eval_loss": 0.6416473984718323, | |
| "eval_precision_negative": 0.663905325443787, | |
| "eval_precision_neutral": 0.770541298253181, | |
| "eval_precision_positive": 0.631578947368421, | |
| "eval_recall_negative": 0.7417364477743499, | |
| "eval_recall_neutral": 0.7459290187891441, | |
| "eval_recall_positive": 0.5800865800865801, | |
| "eval_runtime": 13.5444, | |
| "eval_samples_per_second": 623.505, | |
| "eval_steps_per_second": 3.249, | |
| "step": 3160 | |
| }, | |
| { | |
| "epoch": 2.69, | |
| "learning_rate": 1.4612794612794614e-05, | |
| "loss": 0.5589, | |
| "step": 3200 | |
| }, | |
| { | |
| "epoch": 2.69, | |
| "eval_accuracy": 0.7187685020722321, | |
| "eval_f1_macro": 0.6920386854465886, | |
| "eval_f1_negative": 0.706980691703798, | |
| "eval_f1_neutral": 0.7570633561643835, | |
| "eval_f1_positive": 0.6120720084715848, | |
| "eval_loss": 0.6367910504341125, | |
| "eval_precision_negative": 0.6816693944353519, | |
| "eval_precision_neutral": 0.7766798418972332, | |
| "eval_precision_positive": 0.5991706979958535, | |
| "eval_recall_negative": 0.7342441604230939, | |
| "eval_recall_neutral": 0.7384133611691023, | |
| "eval_recall_positive": 0.6255411255411255, | |
| "eval_runtime": 13.5341, | |
| "eval_samples_per_second": 623.979, | |
| "eval_steps_per_second": 3.251, | |
| "step": 3200 | |
| }, | |
| { | |
| "epoch": 2.73, | |
| "learning_rate": 1.4545454545454546e-05, | |
| "loss": 0.5499, | |
| "step": 3240 | |
| }, | |
| { | |
| "epoch": 2.73, | |
| "eval_accuracy": 0.7135583185316755, | |
| "eval_f1_macro": 0.6872354106917024, | |
| "eval_f1_negative": 0.7027480595762535, | |
| "eval_f1_neutral": 0.7509126046811251, | |
| "eval_f1_positive": 0.6080455678177287, | |
| "eval_loss": 0.6405165791511536, | |
| "eval_precision_negative": 0.6705364291433147, | |
| "eval_precision_neutral": 0.7729885057471264, | |
| "eval_precision_positive": 0.6001405481377372, | |
| "eval_recall_negative": 0.7382106654914059, | |
| "eval_recall_neutral": 0.7300626304801671, | |
| "eval_recall_positive": 0.6161616161616161, | |
| "eval_runtime": 13.5535, | |
| "eval_samples_per_second": 623.087, | |
| "eval_steps_per_second": 3.246, | |
| "step": 3240 | |
| }, | |
| { | |
| "epoch": 2.76, | |
| "learning_rate": 1.447811447811448e-05, | |
| "loss": 0.5431, | |
| "step": 3280 | |
| }, | |
| { | |
| "epoch": 2.76, | |
| "eval_accuracy": 0.7207815275310835, | |
| "eval_f1_macro": 0.6892335124121108, | |
| "eval_f1_negative": 0.7012817727568977, | |
| "eval_f1_neutral": 0.7629961454318157, | |
| "eval_f1_positive": 0.6034226190476191, | |
| "eval_loss": 0.6356926560401917, | |
| "eval_precision_negative": 0.6915167095115681, | |
| "eval_precision_neutral": 0.7614888750259929, | |
| "eval_precision_positive": 0.6228878648233487, | |
| "eval_recall_negative": 0.7113265755839577, | |
| "eval_recall_neutral": 0.764509394572025, | |
| "eval_recall_positive": 0.5851370851370852, | |
| "eval_runtime": 13.6103, | |
| "eval_samples_per_second": 620.484, | |
| "eval_steps_per_second": 3.233, | |
| "step": 3280 | |
| }, | |
| { | |
| "epoch": 2.79, | |
| "learning_rate": 1.4410774410774413e-05, | |
| "loss": 0.5388, | |
| "step": 3320 | |
| }, | |
| { | |
| "epoch": 2.79, | |
| "eval_accuracy": 0.7103611604499704, | |
| "eval_f1_macro": 0.6887331835620346, | |
| "eval_f1_negative": 0.7057600332709503, | |
| "eval_f1_neutral": 0.7435107787065551, | |
| "eval_f1_positive": 0.6169287387085982, | |
| "eval_loss": 0.6553226113319397, | |
| "eval_precision_negative": 0.6681102362204724, | |
| "eval_precision_neutral": 0.7856810785681079, | |
| "eval_precision_positive": 0.5751715533374921, | |
| "eval_recall_negative": 0.747906566769502, | |
| "eval_recall_neutral": 0.7056367432150313, | |
| "eval_recall_positive": 0.6652236652236653, | |
| "eval_runtime": 13.4151, | |
| "eval_samples_per_second": 629.514, | |
| "eval_steps_per_second": 3.28, | |
| "step": 3320 | |
| }, | |
| { | |
| "epoch": 2.83, | |
| "learning_rate": 1.4343434343434344e-05, | |
| "loss": 0.5613, | |
| "step": 3360 | |
| }, | |
| { | |
| "epoch": 2.83, | |
| "eval_accuracy": 0.7232682060390764, | |
| "eval_f1_macro": 0.6875059651526924, | |
| "eval_f1_negative": 0.7051926298157454, | |
| "eval_f1_neutral": 0.7659927423535511, | |
| "eval_f1_positive": 0.5913325232887808, | |
| "eval_loss": 0.6239017844200134, | |
| "eval_precision_negative": 0.6717191862784204, | |
| "eval_precision_neutral": 0.76086508753862, | |
| "eval_precision_positive": 0.6740535549399815, | |
| "eval_recall_negative": 0.742177170559718, | |
| "eval_recall_neutral": 0.7711899791231733, | |
| "eval_recall_positive": 0.5266955266955267, | |
| "eval_runtime": 13.4098, | |
| "eval_samples_per_second": 629.763, | |
| "eval_steps_per_second": 3.281, | |
| "step": 3360 | |
| }, | |
| { | |
| "epoch": 2.86, | |
| "learning_rate": 1.4276094276094276e-05, | |
| "loss": 0.556, | |
| "step": 3400 | |
| }, | |
| { | |
| "epoch": 2.86, | |
| "eval_accuracy": 0.7217288336293665, | |
| "eval_f1_macro": 0.6902285547620584, | |
| "eval_f1_negative": 0.7011167068097219, | |
| "eval_f1_neutral": 0.7648837451777708, | |
| "eval_f1_positive": 0.6046852122986822, | |
| "eval_loss": 0.6339342594146729, | |
| "eval_precision_negative": 0.696692776327241, | |
| "eval_precision_neutral": 0.7640074984378254, | |
| "eval_precision_positive": 0.6136701337295691, | |
| "eval_recall_negative": 0.7055971793741737, | |
| "eval_recall_neutral": 0.7657620041753653, | |
| "eval_recall_positive": 0.5959595959595959, | |
| "eval_runtime": 13.436, | |
| "eval_samples_per_second": 628.537, | |
| "eval_steps_per_second": 3.275, | |
| "step": 3400 | |
| }, | |
| { | |
| "epoch": 2.9, | |
| "learning_rate": 1.420875420875421e-05, | |
| "loss": 0.5536, | |
| "step": 3440 | |
| }, | |
| { | |
| "epoch": 2.9, | |
| "eval_accuracy": 0.7108348134991119, | |
| "eval_f1_macro": 0.6898151957724491, | |
| "eval_f1_negative": 0.7129761662253005, | |
| "eval_f1_neutral": 0.7415480427046264, | |
| "eval_f1_positive": 0.6149213783874204, | |
| "eval_loss": 0.659329891204834, | |
| "eval_precision_negative": 0.6628787878787878, | |
| "eval_precision_neutral": 0.7934316991908615, | |
| "eval_precision_positive": 0.5733000623830318, | |
| "eval_recall_negative": 0.7712648743940062, | |
| "eval_recall_neutral": 0.6960334029227557, | |
| "eval_recall_positive": 0.663059163059163, | |
| "eval_runtime": 13.4431, | |
| "eval_samples_per_second": 628.201, | |
| "eval_steps_per_second": 3.273, | |
| "step": 3440 | |
| }, | |
| { | |
| "epoch": 2.93, | |
| "learning_rate": 1.4141414141414143e-05, | |
| "loss": 0.5663, | |
| "step": 3480 | |
| }, | |
| { | |
| "epoch": 2.93, | |
| "eval_accuracy": 0.7154529307282416, | |
| "eval_f1_macro": 0.6878232234805552, | |
| "eval_f1_negative": 0.6974677920924034, | |
| "eval_f1_neutral": 0.7573062261753494, | |
| "eval_f1_positive": 0.6086956521739131, | |
| "eval_loss": 0.6353215575218201, | |
| "eval_precision_negative": 0.703090013434841, | |
| "eval_precision_neutral": 0.7683712935109583, | |
| "eval_precision_positive": 0.5750962772785623, | |
| "eval_recall_negative": 0.6919347730277655, | |
| "eval_recall_neutral": 0.7465553235908142, | |
| "eval_recall_positive": 0.6464646464646465, | |
| "eval_runtime": 13.4095, | |
| "eval_samples_per_second": 629.78, | |
| "eval_steps_per_second": 3.281, | |
| "step": 3480 | |
| }, | |
| { | |
| "epoch": 2.96, | |
| "learning_rate": 1.4074074074074075e-05, | |
| "loss": 0.5499, | |
| "step": 3520 | |
| }, | |
| { | |
| "epoch": 2.96, | |
| "eval_accuracy": 0.7143872113676731, | |
| "eval_f1_macro": 0.6899472024314622, | |
| "eval_f1_negative": 0.7078491335372069, | |
| "eval_f1_neutral": 0.7488017429193901, | |
| "eval_f1_positive": 0.6131907308377897, | |
| "eval_loss": 0.6429401636123657, | |
| "eval_precision_negative": 0.6585735963581184, | |
| "eval_precision_neutral": 0.7829157175398633, | |
| "eval_precision_positive": 0.6060606060606061, | |
| "eval_recall_negative": 0.7650947553988541, | |
| "eval_recall_neutral": 0.7175365344467641, | |
| "eval_recall_positive": 0.6204906204906205, | |
| "eval_runtime": 13.4298, | |
| "eval_samples_per_second": 628.824, | |
| "eval_steps_per_second": 3.276, | |
| "step": 3520 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "learning_rate": 1.4006734006734009e-05, | |
| "loss": 0.5619, | |
| "step": 3560 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "eval_accuracy": 0.7207815275310835, | |
| "eval_f1_macro": 0.6934678744913757, | |
| "eval_f1_negative": 0.7042136003337507, | |
| "eval_f1_neutral": 0.759215853398679, | |
| "eval_f1_positive": 0.6169741697416974, | |
| "eval_loss": 0.6337869167327881, | |
| "eval_precision_negative": 0.6685148514851486, | |
| "eval_precision_neutral": 0.7752393385552655, | |
| "eval_precision_positive": 0.6314199395770392, | |
| "eval_recall_negative": 0.74394006170119, | |
| "eval_recall_neutral": 0.7438413361169103, | |
| "eval_recall_positive": 0.6031746031746031, | |
| "eval_runtime": 13.4185, | |
| "eval_samples_per_second": 629.354, | |
| "eval_steps_per_second": 3.279, | |
| "step": 3560 | |
| } | |
| ], | |
| "max_steps": 11880, | |
| "num_train_epochs": 10, | |
| "total_flos": 1.849503866686182e+16, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |